{
  "cells": [
    {
      "cell_type": "code",
      "execution_count": 72,
      "metadata": {
        "id": "HDZpHGsWreX5"
      },
      "outputs": [],
      "source": [
        "# ! pip install -U accelerate -q\n",
        "# ! pip install -U transformers -q\n",
        "# ! pip install datasets -q\n",
        "# ! pip install wandb -q"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 73,
      "metadata": {
        "id": "SMhrq00BtxZp"
      },
      "outputs": [],
      "source": [
        "import numpy as np\n",
        "import os\n",
        "import transformers\n",
        "import itertools\n",
        "import pandas as pd\n",
        "import math\n",
        "from transformers import GPTNeoXForCausalLM, AutoTokenizer\n",
        "from transformers import (\n",
        "    set_seed,\n",
        ")\n",
        "import wandb\n",
        "import pickle\n",
        "import string\n",
        "from datasets import Dataset, DatasetDict, load_dataset\n",
        "import torch\n",
        "import torch.nn.functional as F\n",
        "import logging"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 74,
      "metadata": {},
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 105
        },
        "id": "MaSlFeAxCu1A",
        "outputId": "18ec4c91-d9f5-4a66-a102-1fc1de827577"
      },
      "outputs": [],
      "source": [
        "NUM_SEQUENCES = 1\n",
        "SEQUENCE_LENGTH = 1024\n",
        "LEARNING_RATE = 0.000005\n",
        "SEED = 42\n",
        "EVALUATION_STRATEGY = 'epoch'\n",
        "SAVE_STRATEGY = 'epoch'\n",
        "NUM_TRAIN_EPOCHS = 30\n",
        "WEIGHT_DECAY = 0\n",
        "WARMUP_RATIO = 0.05\n",
        "LR_SCHEDULER = 'linear'\n",
        "PRETRAINED_CKPT_NS = 64\n",
        "PRETRAINED_CKPT_SL = 16\n",
        "PRETRAINED_CKPT = 65\n",
        "PRE_TRAINING_CHECKPOINT = f'<redacted>'\n",
        "\n",
        "params_dict = {\n",
        "    'NUM_SEQUENCES': NUM_SEQUENCES,\n",
        "    'SEQUENCE_LENGTH': SEQUENCE_LENGTH,\n",
        "    'LEARNING_RATE': LEARNING_RATE,\n",
        "    'SEED': SEED,\n",
        "    'NUM_TRAIN_EPOCHS': NUM_TRAIN_EPOCHS,\n",
        "    'PRE-TRAINING-CHECKPOINT': PRE_TRAINING_CHECKPOINT,\n",
        "    'LR_SCHEDULER': LR_SCHEDULER,\n",
        "    'WARMUP_RATIO': WARMUP_RATIO,\n",
        "    'PRE_TRAINED_CKPT_NS': PRETRAINED_CKPT_NS,\n",
        "    'PRE_TRAINED_CKPT_SL': PRETRAINED_CKPT_SL,\n",
        "}\n",
        "\n",
        "MODEL_SIZE = '1b'\n",
        "WANDB_PROJECT_NAME = \"SDDD-Experiments\"\n",
        "OUTPUT_DIR = '<redacted>'\n",
        "\n",
        "RUN_NAME = MODEL_SIZE + \"-ns-\" + str(NUM_SEQUENCES) + \"-sl-\" + \\\n",
        "          str(SEQUENCE_LENGTH) + \"-lr-\" + str(LEARNING_RATE) + \"-lr_scheduler-\" + str(LR_SCHEDULER) + \"-warmup-ratio-\" + str(WARMUP_RATIO) + \\\n",
        "            \"-seed-\" + str(SEED) + \"-epochs-\" + str(NUM_TRAIN_EPOCHS) + \"-pretraining_ckpt-ns-\" + str(PRETRAINED_CKPT_NS) + \"-pretraining_ckpt-sl-\" + str(PRETRAINED_CKPT_SL) + \"-pretraining_ckpt-\" + str(PRETRAINED_CKPT)\n",
        "OUTPUT_DIR = os.path.join(OUTPUT_DIR, RUN_NAME)\n",
        "\n",
        "# Make sure output directory exists\n",
        "if not os.path.exists(OUTPUT_DIR):\n",
        "    os.makedirs(OUTPUT_DIR)\n",
        "\n",
        "MODEL_NAME = f\"EleutherAI/pythia-{MODEL_SIZE}\"\n",
        "\n",
        "os.environ[\"WANDB_PROJECT\"] = WANDB_PROJECT_NAME\n",
        "os.environ[\"WANDB_WATCH\"] = \"all\"\n",
        "os.environ[\"TOKENIZERS_PARALLELISM\"] = \"false\"\n",
        "os.environ[\"WANDB__SERVICE_WAIT\"] = \"300\"\n",
        "# Set API key (for wandb)\n",
        "\n",
        "wandb.init(project=WANDB_PROJECT_NAME)\n",
        "wandb.run.name = RUN_NAME\n",
        "wandb.config.update(params_dict)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 76,
      "metadata": {
        "id": "QNPBAG4Dzm-T"
      },
      "outputs": [],
      "source": [
        "set_seed(SEED)"
      ]
    },
    {
      "cell_type": "markdown",
      "metadata": {},
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": 77,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 36
        },
        "id": "rjkLQxzjfMrB",
        "outputId": "59618031-5e47-45b2-c6f5-606a45c7433e"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "'1b-ns-1-sl-1024-lr-5e-06-lr_scheduler-linear-warmup-ratio-0.05-seed-42-epochs-30-pretraining_ckpt-ns-32-pretraining_ckpt-sl-32-pretraining_ckpt-65'"
            ]
          },
          "execution_count": 77,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "RUN_NAME"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 78,
      "metadata": {
        "id": "o-7xHpa3tTIt"
      },
      "outputs": [],
      "source": [
        "# model = GPTNeoXForCausalLM.from_pretrained(\n",
        "#   MODEL_NAME,\n",
        "#   revision=PRE_TRAINING_CHECKPOINT\n",
        "# )\n",
        "\n",
        "tokenizer = AutoTokenizer.from_pretrained(\n",
        "  MODEL_NAME\n",
        ")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 79,
      "metadata": {
        "id": "0XNL1m7L2YOW"
      },
      "outputs": [],
      "source": [
        "logger = logging.getLogger(__name__)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 80,
      "metadata": {
        "id": "6v9yac2-3kK-"
      },
      "outputs": [],
      "source": [
        "tokenizer.pad_token = tokenizer.eos_token"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 81,
      "metadata": {
        "id": "auNDQ9vctVJH"
      },
      "outputs": [],
      "source": [
        "def generate_random_strings(seed, num_sequences, sequence_length):\n",
        "    rng = np.random.default_rng(seed)\n",
        "    sequences = generate_strings(\n",
        "        num_sequences, sequence_length, rng\n",
        "    )\n",
        "    dataset = Dataset.from_dict(\n",
        "        {\n",
        "            \"text\": sequences,\n",
        "        }\n",
        "    )\n",
        "    datasets = DatasetDict(\n",
        "        {\n",
        "            \"train\": dataset,\n",
        "            \"test\": dataset,\n",
        "        }\n",
        "    )\n",
        "    datasets.set_format(\"torch\")\n",
        "    return datasets\n",
        "\n",
        "def generate_strings(num_sequences, sequence_length, rng):\n",
        "    letters = string.ascii_lowercase\n",
        "    sequences = rng.choice(list(letters), size=(1, sequence_length*num_sequences))\n",
        "\n",
        "    reshaped_sequences = []\n",
        "    for i in range(num_sequences):\n",
        "        reshaped_sequences.append(\n",
        "            sequences[0, i*sequence_length:(i+1)*sequence_length]\n",
        "        )\n",
        "    sequences = reshaped_sequences\n",
        "    print(sequences)\n",
        "    strs = [\"\".join(seq) for seq in sequences]\n",
        "    return strs\n",
        "\n",
        "def encode_character_wise(tokenizer, dataset):\n",
        "    def characterwise_encoding(example):\n",
        "        sequences = example[\"text\"]\n",
        "        max_length = max(len(s) for s in sequences)\n",
        "        sequence_token_ids = []\n",
        "        sequence_token_masks = []\n",
        "        for sequence in sequences:\n",
        "            sequence_chars = list(sequence)\n",
        "            encoded_chars = tokenize(\n",
        "                tokenizer,\n",
        "                sequence_chars,\n",
        "                max_length=1,\n",
        "            )\n",
        "            # add padding\n",
        "            num_padding = max_length - len(sequence)\n",
        "            padded_input_ids = torch.cat(\n",
        "                (\n",
        "                    torch.tensor(\n",
        "                        [tokenizer.pad_token_id] * num_padding, dtype=torch.long\n",
        "                    ),\n",
        "                    encoded_chars.input_ids.squeeze(1),\n",
        "                )\n",
        "            )\n",
        "            padded_attention_mask = torch.cat(\n",
        "                (\n",
        "                    torch.tensor([0] * num_padding, dtype=torch.long),\n",
        "                    encoded_chars.attention_mask.squeeze(1),\n",
        "                )\n",
        "            )\n",
        "            sequence_token_ids.append(padded_input_ids)\n",
        "            sequence_token_masks.append(padded_attention_mask)\n",
        "        return {\n",
        "            \"input_ids\": torch.stack(sequence_token_ids),\n",
        "            \"attention_mask\": torch.stack(sequence_token_masks),\n",
        "        }\n",
        "\n",
        "    return dataset.map(\n",
        "        characterwise_encoding,\n",
        "        batched=True,\n",
        "        batch_size=NUM_SEQUENCES,\n",
        "    )\n",
        "\n",
        "def tokenize(tokenizer, text, max_length):\n",
        "    if tokenizer.padding_side == \"right\":\n",
        "        logger.warning(\"Padding side is right, setting it to left\")\n",
        "        tokenizer.padding_side = \"left\"\n",
        "    if max_length is None:\n",
        "        padding = \"longest\"\n",
        "    else:\n",
        "        padding = \"max_length\"\n",
        "    return tokenizer(\n",
        "        text,\n",
        "        return_tensors=\"pt\",\n",
        "        return_token_type_ids=False,\n",
        "        truncation=True,\n",
        "        padding=padding,\n",
        "        max_length=max_length,\n",
        "    )\n"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 82,
      "metadata": {},
      "outputs": [],
      "source": [
        "map_tok = {}\n",
        "import string\n",
        "for i in string.ascii_lowercase:\n",
        "  map_tok[i] = tokenizer(i)['input_ids'][0]\n",
        "\n",
        "def doCharLevelTokenization(input_string):\n",
        "  custom_input = transformers.tokenization_utils_base.BatchEncoding()\n",
        "  custom_input['input_ids'] = []\n",
        "  custom_input['attention_mask'] = []\n",
        "  for i in input_string:\n",
        "    custom_input['input_ids'].append(map_tok[i])\n",
        "    custom_input['attention_mask'].append(1)\n",
        "  custom_input['input_ids'] = torch.tensor(custom_input['input_ids']).unsqueeze(0)\n",
        "  custom_input['attention_mask'] = torch.tensor(custom_input['attention_mask']).unsqueeze(0)\n",
        "  return custom_input"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 83,
      "metadata": {},
      "outputs": [],
      "source": [
        "import numpy as np\n",
        "import string"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 84,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/",
          "height": 99,
          "referenced_widgets": [
            "e0b6986f85d64adabbbf744ea47569fc",
            "ff130235ea0c4a22ba15c7baaba3a72e",
            "f1b76799c37440b0a6d0f033e4155db3",
            "3c611debfd5e47e4b6529fcaf4cd54c1",
            "1dbb314cd5974ddaae6af16afff7a319",
            "802c7c178c2d41e28f4d6a6bfbf57bb5",
            "7778f22a938c4ac5b16e56f09ed13263",
            "6937d8ef02ac45efb3e50a99ba1c6147",
            "b6ba28a0ffd345f896243e996b6ae06c",
            "6350ea1786e04c86a74d921c49fb5351",
            "b2ebfde2f2b34dbda4d2f07f5917ba52",
            "132b82bd4f9943629d54a565a644633c",
            "cbdc90ba5eb34c3cad181d177c573728",
            "f05696473b9c42a3b5264236db46e834",
            "cc701cf0c9a442c981447424db02a81c",
            "9bba65685aa642e39bef092b3640811c",
            "5e996612766347049f0849632721632d",
            "afdeddc092a246749f4685179df7213a",
            "edcc36cfe19a49ba9d13c6c3caff60f1",
            "b75cc076fd5140db8b1647212a60a409",
            "a5a6ec55deac48c7b9800b34242c9375",
            "e5604c9925444c79b7b7925f3b9f5a13"
          ]
        },
        "id": "TgyTM7Z-tvXK",
        "outputId": "256010b4-d762-490f-feba-75880732a70e"
      },
      "outputs": [
        {
          "name": "stdout",
          "output_type": "stream",
          "text": [
            "[array(['c', 'u', 'r', ..., 'b', 'w', 'v'], dtype='<U1')]\n"
          ]
        },
        {
          "data": {
            "application/vnd.jupyter.widget-view+json": {
              "model_id": "d6a9d9d40aeb4c0f90a57fab84115c2f",
              "version_major": 2,
              "version_minor": 0
            },
            "text/plain": [
              "Map:   0%|          | 0/1 [00:00<?, ? examples/s]"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        },
        {
          "name": "stderr",
          "output_type": "stream",
          "text": [
            "Padding side is right, setting it to left\n"
          ]
        },
        {
          "data": {
            "application/vnd.jupyter.widget-view+json": {
              "model_id": "0e7a7adcef7d4142a2a56c22b2ab9f92",
              "version_major": 2,
              "version_minor": 0
            },
            "text/plain": [
              "Map:   0%|          | 0/1 [00:00<?, ? examples/s]"
            ]
          },
          "metadata": {},
          "output_type": "display_data"
        }
      ],
      "source": [
        "dataset = generate_random_strings(seed=SEED,num_sequences=NUM_SEQUENCES,sequence_length=SEQUENCE_LENGTH)\n",
        "encoded_dataset = encode_character_wise(tokenizer, dataset)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {},
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": 85,
      "metadata": {
        "id": "7ctjWI7f01-g"
      },
      "outputs": [],
      "source": [
        "training_dataset = encoded_dataset.remove_columns([\"text\"])\n",
        "logger.info(f\"Generated {len(encoded_dataset['test'])} sequences\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 86,
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "x_PfnU8uTyvP",
        "outputId": "c75b95a6-f4e0-4ad3-c73a-1e212509651d"
      },
      "outputs": [
        {
          "data": {
            "text/plain": [
              "DatasetDict({\n",
              "    train: Dataset({\n",
              "        features: ['input_ids', 'attention_mask'],\n",
              "        num_rows: 1\n",
              "    })\n",
              "    test: Dataset({\n",
              "        features: ['input_ids', 'attention_mask'],\n",
              "        num_rows: 1\n",
              "    })\n",
              "})"
            ]
          },
          "execution_count": 86,
          "metadata": {},
          "output_type": "execute_result"
        }
      ],
      "source": [
        "training_dataset"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 87,
      "metadata": {},
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "background_save": true,
          "base_uri": "https://localhost:8080/",
          "height": 1000
        },
        "id": "cmhReXuxVgsk",
        "outputId": "2d5690d3-c5e3-407b-b0dc-7590c9d0d72b"
      },
      "outputs": [],
      "source": [
        "from transformers import DataCollatorForLanguageModeling\n",
        "\n",
        "tokenizer.pad_token = tokenizer.eos_token\n",
        "data_collator = DataCollatorForLanguageModeling(tokenizer=tokenizer, mlm=False)\n",
        "\n",
        "from transformers import AutoModelForCausalLM, TrainingArguments, Trainer\n",
        "\n",
        "model = AutoModelForCausalLM.from_pretrained(PRE_TRAINING_CHECKPOINT)\n",
        "\n",
        "training_args = TrainingArguments(\n",
        "    output_dir = OUTPUT_DIR,\n",
        "    evaluation_strategy = EVALUATION_STRATEGY,\n",
        "    learning_rate = LEARNING_RATE,\n",
        "    lr_scheduler_type = LR_SCHEDULER,\n",
        "    warmup_ratio = WARMUP_RATIO,\n",
        "    num_train_epochs = NUM_TRAIN_EPOCHS,\n",
        "    save_strategy = SAVE_STRATEGY,\n",
        "    run_name = RUN_NAME,\n",
        "    report_to=[\"wandb\"],\n",
        "    # push_to_hub=True,\n",
        ")\n",
        "\n",
        "trainer = Trainer(\n",
        "    model=model,\n",
        "    args=training_args,\n",
        "    train_dataset=training_dataset[\"train\"],\n",
        "    eval_dataset=training_dataset[\"test\"],\n",
        "    data_collator=data_collator,\n",
        "    # resume_from_checkpoint = True,\n",
        "    # callbacks=[NextTokenProbabilityCallback(dataset[\"test\"].to_pandas()['text'].to_list(), OUTPUT_DIR)],\n",
        ")\n",
        "\n",
        "trainer.train()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "6fd1twEOdNU9",
        "outputId": "c738d233-13ae-4b04-cd23-b5d7195ca73d"
      },
      "outputs": [],
      "source": [
        "import math\n",
        "\n",
        "eval_results = trainer.evaluate()\n",
        "print(f\"Perplexity: {math.exp(eval_results['eval_loss']):.2f}\")"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 90,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "YglJNJNhke1r",
        "outputId": "90451ad5-0bfb-44e5-f7fa-5efbbc086070"
      },
      "outputs": [],
      "source": [
        "inp_strs = dataset['train'].to_pandas()['text'].to_list()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 91,
      "metadata": {},
      "outputs": [],
      "source": [
        "str_save_path = '<redacted>'\n",
        "\n",
        "# clear the file\n",
        "open(str_save_path + f'inp_str_{RUN_NAME}.txt', 'w').close()\n",
        "\n",
        "# save inp_str in a text file\n",
        "with open(str_save_path + f'inp_str_{RUN_NAME}.txt', 'w') as f:\n",
        "    # write all strings to file\n",
        "    for item in inp_strs:\n",
        "        f.write(\"%s\\n\" % item)"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 92,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "rPFjdBDiY85y"
      },
      "outputs": [],
      "source": [
        "# trainer.save_model()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": 93,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "2UrFo1AdY9Px"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": 94,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "Ote2wgEVZEtI",
        "outputId": "6f1d2021-e152-4c3d-cff2-3bba86726d45"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": 95,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "ERftQref-cj0",
        "outputId": "97989645-7246-4f28-de82-c21c93ea13fe"
      },
      "outputs": [],
      "source": []
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "colab": {
          "background_save": true
        },
        "id": "h78gdeVK05dS",
        "outputId": "5ece98ef-2fb8-4776-fb67-f7719703f225"
      },
      "outputs": [],
      "source": [
        "wandb.finish()"
      ]
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {},
      "outputs": [],
      "source": []
    }
  ],
  "metadata": {
    "accelerator": "GPU",
    "colab": {
      "provenance": []
    },
    "kernelspec": {
      "display_name": "myenv",
      "language": "python",
      "name": "python3"
    },
    "language_info": {
      "codemirror_mode": {
        "name": "ipython",
        "version": 3
      },
      "file_extension": ".py",
      "mimetype": "text/x-python",
      "name": "python",
      "nbconvert_exporter": "python",
      "pygments_lexer": "ipython3",
      "version": "3.11.4"
    },
    "widgets": {
      "application/vnd.jupyter.widget-state+json": {
        "132b82bd4f9943629d54a565a644633c": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_cbdc90ba5eb34c3cad181d177c573728",
              "IPY_MODEL_f05696473b9c42a3b5264236db46e834",
              "IPY_MODEL_cc701cf0c9a442c981447424db02a81c"
            ],
            "layout": "IPY_MODEL_9bba65685aa642e39bef092b3640811c"
          }
        },
        "1dbb314cd5974ddaae6af16afff7a319": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "3c611debfd5e47e4b6529fcaf4cd54c1": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_6350ea1786e04c86a74d921c49fb5351",
            "placeholder": "​",
            "style": "IPY_MODEL_b2ebfde2f2b34dbda4d2f07f5917ba52",
            "value": " 1/1 [00:00&lt;00:00, 17.37 examples/s]"
          }
        },
        "5e996612766347049f0849632721632d": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "6350ea1786e04c86a74d921c49fb5351": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "6937d8ef02ac45efb3e50a99ba1c6147": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "7778f22a938c4ac5b16e56f09ed13263": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "802c7c178c2d41e28f4d6a6bfbf57bb5": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "9bba65685aa642e39bef092b3640811c": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "a5a6ec55deac48c7b9800b34242c9375": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "afdeddc092a246749f4685179df7213a": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "b2ebfde2f2b34dbda4d2f07f5917ba52": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "b6ba28a0ffd345f896243e996b6ae06c": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "b75cc076fd5140db8b1647212a60a409": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "ProgressStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "ProgressStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "bar_color": null,
            "description_width": ""
          }
        },
        "cbdc90ba5eb34c3cad181d177c573728": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_5e996612766347049f0849632721632d",
            "placeholder": "​",
            "style": "IPY_MODEL_afdeddc092a246749f4685179df7213a",
            "value": "Map: 100%"
          }
        },
        "cc701cf0c9a442c981447424db02a81c": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_a5a6ec55deac48c7b9800b34242c9375",
            "placeholder": "​",
            "style": "IPY_MODEL_e5604c9925444c79b7b7925f3b9f5a13",
            "value": " 1/1 [00:00&lt;00:00, 21.25 examples/s]"
          }
        },
        "e0b6986f85d64adabbbf744ea47569fc": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HBoxModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HBoxModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HBoxView",
            "box_style": "",
            "children": [
              "IPY_MODEL_ff130235ea0c4a22ba15c7baaba3a72e",
              "IPY_MODEL_f1b76799c37440b0a6d0f033e4155db3",
              "IPY_MODEL_3c611debfd5e47e4b6529fcaf4cd54c1"
            ],
            "layout": "IPY_MODEL_1dbb314cd5974ddaae6af16afff7a319"
          }
        },
        "e5604c9925444c79b7b7925f3b9f5a13": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "DescriptionStyleModel",
          "state": {
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "DescriptionStyleModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "StyleView",
            "description_width": ""
          }
        },
        "edcc36cfe19a49ba9d13c6c3caff60f1": {
          "model_module": "@jupyter-widgets/base",
          "model_module_version": "1.2.0",
          "model_name": "LayoutModel",
          "state": {
            "_model_module": "@jupyter-widgets/base",
            "_model_module_version": "1.2.0",
            "_model_name": "LayoutModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/base",
            "_view_module_version": "1.2.0",
            "_view_name": "LayoutView",
            "align_content": null,
            "align_items": null,
            "align_self": null,
            "border": null,
            "bottom": null,
            "display": null,
            "flex": null,
            "flex_flow": null,
            "grid_area": null,
            "grid_auto_columns": null,
            "grid_auto_flow": null,
            "grid_auto_rows": null,
            "grid_column": null,
            "grid_gap": null,
            "grid_row": null,
            "grid_template_areas": null,
            "grid_template_columns": null,
            "grid_template_rows": null,
            "height": null,
            "justify_content": null,
            "justify_items": null,
            "left": null,
            "margin": null,
            "max_height": null,
            "max_width": null,
            "min_height": null,
            "min_width": null,
            "object_fit": null,
            "object_position": null,
            "order": null,
            "overflow": null,
            "overflow_x": null,
            "overflow_y": null,
            "padding": null,
            "right": null,
            "top": null,
            "visibility": null,
            "width": null
          }
        },
        "f05696473b9c42a3b5264236db46e834": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_edcc36cfe19a49ba9d13c6c3caff60f1",
            "max": 1,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_b75cc076fd5140db8b1647212a60a409",
            "value": 1
          }
        },
        "f1b76799c37440b0a6d0f033e4155db3": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "FloatProgressModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "FloatProgressModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "ProgressView",
            "bar_style": "success",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_6937d8ef02ac45efb3e50a99ba1c6147",
            "max": 1,
            "min": 0,
            "orientation": "horizontal",
            "style": "IPY_MODEL_b6ba28a0ffd345f896243e996b6ae06c",
            "value": 1
          }
        },
        "ff130235ea0c4a22ba15c7baaba3a72e": {
          "model_module": "@jupyter-widgets/controls",
          "model_module_version": "1.5.0",
          "model_name": "HTMLModel",
          "state": {
            "_dom_classes": [],
            "_model_module": "@jupyter-widgets/controls",
            "_model_module_version": "1.5.0",
            "_model_name": "HTMLModel",
            "_view_count": null,
            "_view_module": "@jupyter-widgets/controls",
            "_view_module_version": "1.5.0",
            "_view_name": "HTMLView",
            "description": "",
            "description_tooltip": null,
            "layout": "IPY_MODEL_802c7c178c2d41e28f4d6a6bfbf57bb5",
            "placeholder": "​",
            "style": "IPY_MODEL_7778f22a938c4ac5b16e56f09ed13263",
            "value": "Map: 100%"
          }
        }
      }
    }
  },
  "nbformat": 4,
  "nbformat_minor": 0
}
