{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "1fad92d0",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import numpy.random as npr\n",
    "import random\n",
    "import tensorflow as tf\n",
    "from tensorflow import keras\n",
    "from tensorflow.keras import layers\n",
    "from tensorflow.keras import backend as K\n",
    "from tensorflow.keras.optimizers import Adam"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "df3b6089",
   "metadata": {},
   "outputs": [],
   "source": [
    "seed = 428\n",
    "\n",
    "np.random.seed(seed)\n",
    "tf.random.set_seed(seed)\n",
    "random.seed(seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "e6302f08",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_masked_input_and_labels(encoded_texts, n_cat):\n",
    "    # For each sentence, build one training example per position by removing\n",
    "    # that token (the prediction target) and keeping the rest as the context.\n",
    "    # n_cat (the vocabulary size) is currently unused.\n",
    "\n",
    "    encoded_texts_masked = []\n",
    "    y_labels = []\n",
    "\n",
    "    for encoded_text in encoded_texts:\n",
    "        for i in range(len(encoded_text)):\n",
    "            encoded_text_masked = np.copy(encoded_text)\n",
    "            y_label = encoded_text_masked[i]\n",
    "            encoded_texts_masked.append(np.delete(encoded_text_masked, i))\n",
    "            y_labels.append(np.array([y_label]))\n",
    "\n",
    "    return np.array(encoded_texts_masked), np.array(y_labels)"
   ]
  },
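  {
   "cell_type": "markdown",
   "id": "a3f1c2b7",
   "metadata": {},
   "source": [
    "A quick sanity check of `get_masked_input_and_labels` on a toy input (illustration only, not part of the experiments): every token of a sentence becomes the label of one training example, with the remaining tokens as its context."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b7d4e9a1",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Toy example: one encoded sentence [0, 1, 2] yields three (context, label)\n",
    "# pairs, each context missing exactly one token.\n",
    "demo_x, demo_y = get_masked_input_and_labels(np.array([[0, 1, 2]]), n_cat=3)\n",
    "print(demo_x)  # expected: [[1 2] [0 2] [0 1]]\n",
    "print(demo_y)  # expected: [[0] [1] [2]]"
   ]
  },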
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "7a9a18d6",
   "metadata": {},
   "outputs": [],
   "source": [
    "#### K = number of countries = number of capitals = number of universities = number of mascots\n",
    "#### M = number of filler words exclusive to each topic\n",
    "#### S = number of filler words shared by both topics\n",
    "#### L = sentence length\n",
    "#### q1, q2 = probabilities that a sentence contains 1 or 2 pairs (q0 = 1 - q1 - q2 gives 0 pairs)\n",
    "#### embed_dim = dimension of the word embeddings\n",
    "#### n_sentences = number of training sentences\n",
    "\n",
    "def train_model(K, M, S, L, q1, q2, embed_dim, n_sentences):\n",
    "\n",
    "    countries = ['country_' + str(i) for i in range(K)]\n",
    "    capitals = ['capital_' + str(i) for i in range(K)]\n",
    "    universities = ['university_' + str(i) for i in range(K)]\n",
    "    mascots = ['mascot_' + str(i) for i in range(K)]\n",
    "    random_capitals = ['random_capital_' + str(i) for i in range(M)]\n",
    "    random_mascots = ['random_mascot_' + str(i) for i in range(M)]\n",
    "    randoms = ['random_' + str(i) for i in range(S)]\n",
    "\n",
    "    vocabs = countries + capitals + universities + mascots + random_capitals + random_mascots + randoms\n",
    "    vocab_map = {}\n",
    "\n",
    "    for i in range(len(vocabs)):\n",
    "        vocab_map[vocabs[i]] = i\n",
    "\n",
    "    sentences = []\n",
    "    sentences_number = []\n",
    "\n",
    "    q0 = 1 - q1 - q2\n",
    "\n",
    "    for i in range(n_sentences):\n",
    "\n",
    "        sentence = []\n",
    "\n",
    "        # Draw the sentence topic and the number of (entity, attribute) pairs.\n",
    "        topic_draw = npr.uniform()\n",
    "        pair_draw = npr.uniform()\n",
    "\n",
    "        if pair_draw <= q0:\n",
    "            n_pairs = 0\n",
    "        elif pair_draw <= q0 + q1:\n",
    "            n_pairs = 1\n",
    "        else:\n",
    "            n_pairs = 2\n",
    "\n",
    "        if topic_draw <= 0.5: ### country - capital sentence\n",
    "\n",
    "            pairs = np.random.choice(np.arange(K), n_pairs, replace = False)\n",
    "            for pair in pairs:\n",
    "                sentence.append(countries[pair])\n",
    "                sentence.append(capitals[pair])\n",
    "\n",
    "            # Fill the remaining slots with filler words; each capital-topic filler\n",
    "            # appears 4x in the candidate pool, shared fillers 2x, mascot-topic fillers 1x.\n",
    "            randoms_dup = 4 * random_capitals + 2 * randoms + 1 * random_mascots\n",
    "            sentence += list(np.random.choice(randoms_dup, L - 2 * n_pairs, replace = False))\n",
    "\n",
    "        else: ### university - mascot sentence\n",
    "\n",
    "            pairs = np.random.choice(np.arange(K), n_pairs, replace = False)\n",
    "            for pair in pairs:\n",
    "                sentence.append(universities[pair])\n",
    "                sentence.append(mascots[pair])\n",
    "\n",
    "            # Same filler scheme with the weights reversed in favour of mascot-topic fillers.\n",
    "            randoms_dup = 1 * random_capitals + 2 * randoms + 4 * random_mascots\n",
    "            sentence += list(np.random.choice(randoms_dup, L - 2 * n_pairs, replace = False))\n",
    "\n",
    "        sentence_number = [vocab_map[i] for i in sentence]\n",
    "        sentences.append(sentence)\n",
    "        sentences_number.append(sentence_number)\n",
    "\n",
    "    x_train = np.array(sentences_number)\n",
    "    n_cat = len(vocab_map)\n",
    "    x_masked_train, y_masked_labels_train = get_masked_input_and_labels(x_train, n_cat)\n",
    "\n",
    "    callback = keras.callbacks.EarlyStopping(monitor = 'val_loss', patience = 5, restore_best_weights = True)\n",
    "\n",
    "    # CBOW-style classifier: embed the L-1 context tokens, average the embeddings,\n",
    "    # and predict the held-out token with a softmax over the whole vocabulary.\n",
    "    inputs = layers.Input((x_masked_train.shape[1],), dtype=tf.int64)\n",
    "    word_embeddings = layers.Embedding(n_cat, embed_dim, name=\"word_embedding\")(inputs)\n",
    "    encoder_output = layers.GlobalAveragePooling1D()(word_embeddings)\n",
    "    mlm_output = layers.Dense(n_cat, name=\"mlm_cls\", activation=\"softmax\", use_bias=False)(encoder_output)\n",
    "    mlm_model = keras.Model(inputs = inputs, outputs = mlm_output)\n",
    "    adam = Adam()\n",
    "    mlm_model.compile(loss='sparse_categorical_crossentropy', optimizer=adam)\n",
    "\n",
    "    history = mlm_model.fit(x_masked_train, y_masked_labels_train,\n",
    "                        validation_split = 0.5, callbacks = [callback],\n",
    "                        epochs=500, batch_size=128, verbose=0)\n",
    "\n",
    "    return sentences, vocab_map, mlm_model"
   ]
  },
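  {
   "cell_type": "markdown",
   "id": "c8e5f2d3",
   "metadata": {},
   "source": [
    "A minimal smoke test of `train_model` on a tiny, hypothetical configuration (not one of the settings studied below); it trains a small model end to end, so running it takes a short while."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d9f6a3b4",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tiny configuration chosen only to exercise the code path quickly.\n",
    "demo_sentences, demo_vocab_map, demo_model = train_model(\n",
    "    K=3, M=5, S=5, L=4, q1=1.0, q2=0.0, embed_dim=4, n_sentences=200)\n",
    "print(demo_sentences[0])\n",
    "demo_model.summary()"
   ]
  },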
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "85be6230",
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples):\n",
    "\n",
    "    sentences, vocab_map, current_model = train_model(K, M, S, L, q1, q2, embed_dim, n_sentences)\n",
    "\n",
    "    acc_capitals = []\n",
    "    prob_capitals = []\n",
    "\n",
    "    for _ in range(n_samples):\n",
    "        # Probe sentence: int(L/2) country-capital pairs with the final capital\n",
    "        # removed; the model should recover it from its paired country.\n",
    "        sentence = []\n",
    "        pair_ids = np.random.choice(np.arange(K), int(L/2), replace = False)\n",
    "        for pair_id in pair_ids:\n",
    "            sentence.append('country_' + str(pair_id))\n",
    "            sentence.append('capital_' + str(pair_id))\n",
    "        sentence = sentence[:-1]\n",
    "        sentence_number = [vocab_map[i] for i in sentence]\n",
    "        preds = current_model.predict(np.array(sentence_number).reshape(1, -1), verbose=0)\n",
    "        actual = vocab_map['capital_' + str(pair_ids[-1])]\n",
    "        acc_capitals.append(1 if np.argmax(preds[0]) == actual else 0)\n",
    "        prob_capitals.append(preds[0][actual])\n",
    "\n",
    "    acc_mascots = []\n",
    "    prob_mascots = []\n",
    "\n",
    "    for _ in range(n_samples):\n",
    "        # Same probe with university-mascot pairs, dropping the final mascot.\n",
    "        sentence = []\n",
    "        pair_ids = np.random.choice(np.arange(K), int(L/2), replace = False)\n",
    "        for pair_id in pair_ids:\n",
    "            sentence.append('university_' + str(pair_id))\n",
    "            sentence.append('mascot_' + str(pair_id))\n",
    "        sentence = sentence[:-1]\n",
    "        sentence_number = [vocab_map[i] for i in sentence]\n",
    "        preds = current_model.predict(np.array(sentence_number).reshape(1, -1), verbose=0)\n",
    "        actual = vocab_map['mascot_' + str(pair_ids[-1])]\n",
    "        acc_mascots.append(1 if np.argmax(preds[0]) == actual else 0)\n",
    "        prob_mascots.append(preds[0][actual])\n",
    "\n",
    "    return sentences, current_model, vocab_map, (np.mean(acc_capitals), np.mean(prob_capitals)), \\\n",
    "                (np.mean(acc_mascots), np.mean(prob_mascots))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "d19dd717",
   "metadata": {},
   "outputs": [],
   "source": [
    "K = 10 # number of countries\n",
    "L = 8 # sentence length\n",
    "M = 20 # number of filler words exclusive to each topic\n",
    "S = 20 # number of filler words shared by both topics\n",
    "embed_dim = 10 # CBOW embedding dimension\n",
    "n_sentences = 50000 # number of sentences in the training set\n",
    "n_samples = 1000 # number of probe sentences per evaluation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "id": "0e89e3d9",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(0.0, 4.308565e-26)\n",
      "(0.0, 1.3986933e-25)\n",
      "(0.0, 1.8090795e-24)\n",
      "(0.0, 4.942542e-28)\n",
      "(0.0, 1.0876332e-29)\n",
      "(0.0, 2.3819443e-29)\n",
      "(0.0, 2.453412e-26)\n",
      "(0.0, 4.064949e-27)\n",
      "(0.0, 1.1428793e-31)\n",
      "(0.0, 3.1511555e-31)\n",
      "(0.0, 3.1780113e-32)\n",
      "(0.0, 3.857537e-30)\n",
      "(0.0, 8.7947545e-26)\n",
      "(0.0, 4.918049e-25)\n",
      "(0.0, 3.9887345e-32)\n",
      "(0.0, 2.8513771e-31)\n",
      "(0.0, 3.3897772e-34)\n",
      "(0.0, 5.3152313e-33)\n",
      "(0.0, 4.2526162e-24)\n",
      "(0.0, 2.0675768e-28)\n",
      "(0.0, 6.217274122795354e-25)\n",
      "(0.0, 6.364684503165447e-26)\n"
     ]
    }
   ],
   "source": [
    "q0 = 0 # probability of having 0 pairs\n",
    "q1 = 1 # probability of having 1 pair\n",
    "q2 = 0 # probability of having 2 pairs\n",
    "\n",
    "accs_c = 0\n",
    "probs_c = 0\n",
    "accs_d = 0\n",
    "probs_d = 0\n",
    "\n",
    "for _ in range(10):\n",
    "    sentences, mlm_model, vocab_map, acc_c, acc_d \\\n",
    "        = get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples)\n",
    "    \n",
    "    print(acc_c)\n",
    "    print(acc_d)\n",
    "    \n",
    "    accs_c += acc_c[0]/10\n",
    "    probs_c += acc_c[1]/10\n",
    "    accs_d += acc_d[0]/10\n",
    "    probs_d += acc_d[1]/10\n",
    "    \n",
    "print((accs_c, probs_c))\n",
    "print((accs_d, probs_d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "5910567f",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(0.0, 3.04641e-05)\n",
      "(0.004, 0.0014195961)\n",
      "(0.1, 0.01512116)\n",
      "(0.186, 0.029488053)\n",
      "(0.0, 9.938566e-06)\n",
      "(0.0, 2.2380182e-05)\n",
      "(0.268, 0.099668704)\n",
      "(0.347, 0.123830736)\n",
      "(0.484, 0.10750331)\n",
      "(0.008, 0.0031037098)\n",
      "(0.0, 9.88072e-05)\n",
      "(0.002, 0.0018419767)\n",
      "(0.0, 0.00012829478)\n",
      "(0.0, 0.00012847265)\n",
      "(0.555, 0.2068598)\n",
      "(0.454, 0.19144528)\n",
      "(0.106, 0.02168327)\n",
      "(0.38, 0.063758)\n",
      "(0.049, 0.012646965)\n",
      "(0.0, 3.684311e-05)\n",
      "(0.15619999999999998, 0.04637507106390331)\n",
      "(0.1381, 0.041507504424407676)\n"
     ]
    }
   ],
   "source": [
    "q0 = 0 # probability of having 0 pairs\n",
    "q1 = 0 # probability of having 1 pair\n",
    "q2 = 1 # probability of having 2 pairs\n",
    "\n",
    "accs_c = 0\n",
    "probs_c = 0\n",
    "accs_d = 0\n",
    "probs_d = 0\n",
    "\n",
    "for _ in range(10):\n",
    "    sentences, mlm_model, vocab_map, acc_c, acc_d \\\n",
    "        = get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples)\n",
    "    \n",
    "    print(acc_c)\n",
    "    print(acc_d)\n",
    "    \n",
    "    accs_c += acc_c[0]/10\n",
    "    probs_c += acc_c[1]/10\n",
    "    accs_d += acc_d[0]/10\n",
    "    probs_d += acc_d[1]/10\n",
    "    \n",
    "print((accs_c, probs_c))\n",
    "print((accs_d, probs_d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "id": "f3480dd3",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(0.272, 0.18631977)\n",
      "(0.161, 0.09608693)\n",
      "(0.283, 0.17925784)\n",
      "(0.315, 0.21639058)\n",
      "(0.259, 0.16353607)\n",
      "(0.248, 0.16416918)\n",
      "(0.163, 0.0949261)\n",
      "(0.496, 0.35963252)\n",
      "(0.344, 0.26159865)\n",
      "(0.259, 0.17734715)\n",
      "(0.18, 0.13733216)\n",
      "(0.199, 0.14726505)\n",
      "(0.471, 0.33643916)\n",
      "(0.263, 0.1592943)\n",
      "(0.248, 0.1677058)\n",
      "(0.364, 0.21958761)\n",
      "(0.274, 0.19665843)\n",
      "(0.217, 0.14915676)\n",
      "(0.28, 0.17286813)\n",
      "(0.211, 0.12408617)\n",
      "(0.2774, 0.18966421112418175)\n",
      "(0.2733, 0.18130162581801412)\n"
     ]
    }
   ],
   "source": [
    "q0 = 1/2 # probability of having 0 pairs\n",
    "q1 = 1/2 # probability of having 1 pair\n",
    "q2 = 0 # probability of having 2 pairs\n",
    "\n",
    "accs_c = 0\n",
    "probs_c = 0\n",
    "accs_d = 0\n",
    "probs_d = 0\n",
    "\n",
    "for _ in range(10):\n",
    "    sentences, mlm_model, vocab_map, acc_c, acc_d \\\n",
    "        = get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples)\n",
    "    \n",
    "    print(acc_c)\n",
    "    print(acc_d)\n",
    "    \n",
    "    accs_c += acc_c[0]/10\n",
    "    probs_c += acc_c[1]/10\n",
    "    accs_d += acc_d[0]/10\n",
    "    probs_d += acc_d[1]/10\n",
    "    \n",
    "print((accs_c, probs_c))\n",
    "print((accs_d, probs_d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "id": "46ca5547",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(1.0, 0.9998805)\n",
      "(1.0, 0.9997428)\n",
      "(1.0, 0.99991995)\n",
      "(1.0, 0.99981165)\n",
      "(1.0, 0.9998041)\n",
      "(1.0, 0.9998212)\n",
      "(1.0, 0.9999597)\n",
      "(1.0, 0.9999724)\n",
      "(1.0, 0.99983376)\n",
      "(1.0, 0.9999105)\n",
      "(1.0, 0.99993104)\n",
      "(1.0, 0.9998866)\n",
      "(1.0, 0.9999068)\n",
      "(1.0, 0.99989814)\n",
      "(1.0, 0.9999528)\n",
      "(1.0, 0.99996865)\n",
      "(1.0, 0.99989855)\n",
      "(1.0, 0.9999031)\n",
      "(1.0, 0.99996424)\n",
      "(1.0, 0.9999544)\n",
      "(0.9999999999999999, 0.99990513920784)\n",
      "(0.9999999999999999, 0.9998869359493255)\n"
     ]
    }
   ],
   "source": [
    "q0 = 1/2 # probability of having 0 pairs\n",
    "q1 = 0 # probability of having 1 pair\n",
    "q2 = 1/2 # probability of having 2 pairs\n",
    "\n",
    "accs_c = 0\n",
    "probs_c = 0\n",
    "accs_d = 0\n",
    "probs_d = 0\n",
    "\n",
    "for _ in range(10):\n",
    "    sentences, mlm_model, vocab_map, acc_c, acc_d \\\n",
    "        = get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples)\n",
    "    \n",
    "    print(acc_c)\n",
    "    print(acc_d)\n",
    "    \n",
    "    accs_c += acc_c[0]/10\n",
    "    probs_c += acc_c[1]/10\n",
    "    accs_d += acc_d[0]/10\n",
    "    probs_d += acc_d[1]/10\n",
    "    \n",
    "print((accs_c, probs_c))\n",
    "print((accs_d, probs_d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "cd93057c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(1.0, 0.99772245)\n",
      "(1.0, 0.9950919)\n",
      "(1.0, 0.99523866)\n",
      "(1.0, 0.99691105)\n",
      "(1.0, 0.9974566)\n",
      "(1.0, 0.9967803)\n",
      "(1.0, 0.99286866)\n",
      "(1.0, 0.9958752)\n",
      "(1.0, 0.99812424)\n",
      "(1.0, 0.99575967)\n",
      "(1.0, 0.99908465)\n",
      "(1.0, 0.99904484)\n",
      "(1.0, 0.9934894)\n",
      "(1.0, 0.99956924)\n",
      "(1.0, 0.9980884)\n",
      "(1.0, 0.99824464)\n",
      "(1.0, 0.9978714)\n",
      "(1.0, 0.99777293)\n",
      "(1.0, 0.99634326)\n",
      "(1.0, 0.9982415)\n",
      "(0.9999999999999999, 0.9966287732124329)\n",
      "(0.9999999999999999, 0.9973291218280792)\n"
     ]
    }
   ],
   "source": [
    "q0 = 0 # probability of having 0 pairs\n",
    "q1 = 1/2 # probability of having 1 pair\n",
    "q2 = 1/2 # probability of having 2 pairs\n",
    "\n",
    "accs_c = 0\n",
    "probs_c = 0\n",
    "accs_d = 0\n",
    "probs_d = 0\n",
    "\n",
    "for _ in range(10):\n",
    "    sentences, mlm_model, vocab_map, acc_c, acc_d \\\n",
    "        = get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples)\n",
    "    \n",
    "    print(acc_c)\n",
    "    print(acc_d)\n",
    "    \n",
    "    accs_c += acc_c[0]/10\n",
    "    probs_c += acc_c[1]/10\n",
    "    accs_d += acc_d[0]/10\n",
    "    probs_d += acc_d[1]/10\n",
    "    \n",
    "print((accs_c, probs_c))\n",
    "print((accs_d, probs_d))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "id": "bb9a28cf",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "(1.0, 0.99972963)\n",
      "(1.0, 0.9996282)\n",
      "(1.0, 0.99952465)\n",
      "(1.0, 0.99956495)\n",
      "(1.0, 0.9996334)\n",
      "(1.0, 0.99982065)\n",
      "(1.0, 0.99957174)\n",
      "(1.0, 0.9994311)\n",
      "(1.0, 0.999811)\n",
      "(1.0, 0.9994858)\n",
      "(1.0, 0.99963486)\n",
      "(1.0, 0.9994331)\n",
      "(1.0, 0.99978125)\n",
      "(1.0, 0.9999253)\n",
      "(1.0, 0.99969566)\n",
      "(1.0, 0.9994158)\n",
      "(1.0, 0.9997359)\n",
      "(1.0, 0.99883)\n",
      "(1.0, 0.9998027)\n",
      "(1.0, 0.99984115)\n",
      "(0.9999999999999999, 0.9996920764446258)\n",
      "(0.9999999999999999, 0.999537605047226)\n"
     ]
    }
   ],
   "source": [
    "q0 = 1/3 # probability of having 0 pairs\n",
    "q1 = 1/3 # probability of having 1 pair\n",
    "q2 = 1/3 # probability of having 2 pairs\n",
    "\n",
    "accs_c = 0\n",
    "probs_c = 0\n",
    "accs_d = 0\n",
    "probs_d = 0\n",
    "\n",
    "for _ in range(10):\n",
    "    sentences, mlm_model, vocab_map, acc_c, acc_d \\\n",
    "        = get_acc_prob(K, M, S, L, q1, q2, embed_dim, n_sentences, n_samples)\n",
    "    \n",
    "    print(acc_c)\n",
    "    print(acc_d)\n",
    "    \n",
    "    accs_c += acc_c[0]/10\n",
    "    probs_c += acc_c[1]/10\n",
    "    accs_d += acc_d[0]/10\n",
    "    probs_d += acc_d[1]/10\n",
    "    \n",
    "print((accs_c, probs_c))\n",
    "print((accs_d, probs_d))"
   ]
  },
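  {
   "cell_type": "markdown",
   "id": "e1a7b8c9",
   "metadata": {},
   "source": [
    "An optional inspection sketch (it assumes the experiment cells above have been run, so `mlm_model` and `vocab_map` come from the last setting): pull out the learned word-embedding matrix and look at the cosine similarity between a few country/capital pairs."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f2b8c9d0",
   "metadata": {},
   "outputs": [],
   "source": [
    "# The embedding layer was named 'word_embedding' in train_model.\n",
    "emb = mlm_model.get_layer('word_embedding').get_weights()[0]\n",
    "\n",
    "def cosine(u, v):\n",
    "    return np.dot(u, v) / (np.linalg.norm(u) * np.linalg.norm(v))\n",
    "\n",
    "# First few pairs only, as an illustration.\n",
    "for i in range(3):\n",
    "    c = emb[vocab_map['country_' + str(i)]]\n",
    "    cap = emb[vocab_map['capital_' + str(i)]]\n",
    "    print('country_%d vs capital_%d: %.3f' % (i, i, cosine(c, cap)))"
   ]
  },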
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9095fbc3",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.7"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
