{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "18931504-770b-4bd0-b524-e366491cb55d",
   "metadata": {},
   "outputs": [],
   "source": [
    "import logging\n",
    "import time\n",
    "import math\n",
    "import json\n",
    "import pandas as pd\n",
    "import numpy as np\n",
    "import random\n",
    "import os\n",
    "from collections import defaultdict\n",
    "\n",
    "import torch.nn.functional as F\n",
    "from scipy.optimize import brentq\n",
    "import torch.jit as jit\n",
    "from torch.jit import script\n",
    "from typing import Optional, Tuple, List, Dict, Any\n",
    "from torch.nn.parameter import Parameter, UninitializedParameter"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9f5580f1-ddd7-4be6-8d2d-7dd2b6c0b22b",
   "metadata": {},
   "outputs": [],
   "source": [
    "#please comment out if you use cpu\n",
    "os.environ['CUDA_VISIBLE_DEVICES'] = 0\n",
    "\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.optim as optim\n",
    "\n",
    "logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')\n",
    "logger = logging.getLogger()\n",
    "device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
    "logger.info(f'Using device: {device}')\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d57adecf-8f67-40ed-aff7-45a41f855dfc",
   "metadata": {},
   "outputs": [],
   "source": [
    "def set_seed(seed: int = 42):\n",
    "    random.seed(seed)\n",
    "    os.environ['PYTHONHASHSEED'] = str(seed)\n",
    "    np.random.seed(seed)\n",
    "    torch.manual_seed(seed)\n",
    "    torch.cuda.manual_seed(seed) \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "67be57ce-1b95-426d-8714-a12245c4a1af",
   "metadata": {},
   "outputs": [],
   "source": [
    "\"\"\"\n",
    "This code is adopted the following links:\n",
    "https://github.com/MinhZou/selective-copying-mamba/blob/main/data_generator.py\n",
    "\"\"\"\n",
    "\n",
    "import torch\n",
    "import random\n",
    "import numpy as np\n",
    "import torch.nn.functional as F\n",
    "\n",
    "def torch_copying_data(L, M, A, variable=False, variable_length=False, batch_shape=(), one_hot=False, reverse=False):\n",
    "    \"\"\"\n",
    "    Generate a dataset for a sequence copying task.\n",
    "    This code is adopted from the copying.py script in the S4 repository. The original code can be found at:\n",
    "    https://github.com/state-spaces/s4/blob/e757cef57d89e448c413de7325ed5601aceaac13/src/dataloaders/datasets/copying.py\n",
    "\n",
    "    Parameters:\n",
    "    L (int): Number of padding tokens\n",
    "    M (int): Number of tokens to memorize\n",
    "    A (int): Alphabet size\n",
    "    variable (bool): If True, selective copying task\n",
    "    variable_length (bool): If True, randomize number of tokens to memorize\n",
    "    batch_shape (tuple): Shape of the batch\n",
    "    one_hot (bool): If True, convert the input sequence into a one-hot encoded tensor\n",
    "    reverse (bool): If True, reverse the order of the target sequence\n",
    "\n",
    "    Returns:\n",
    "    tuple: Generated input sequence and target sequence\n",
    "    \"\"\"\n",
    "    if variable_length:\n",
    "        M = int(random.random() * M) + 1\n",
    "    tokens = torch.randint(low=1, high=A-1, size=batch_shape+(M,))\n",
    "    if variable:\n",
    "        total_batch = int(np.prod(batch_shape))\n",
    "        inds = torch.stack([\n",
    "            torch.randperm(L+M)[:M]\n",
    "            for _ in range(total_batch)\n",
    "            ], 0)\n",
    "        inds = inds.reshape(batch_shape+(M,))\n",
    "        inds, _ = inds.sort()\n",
    "    else:\n",
    "        inds = torch.arange(M).repeat(batch_shape+(1,))\n",
    "    zeros_x = torch.zeros(batch_shape+(M+L,), dtype=torch.long)\n",
    "    zeros_x.scatter_(-1, inds, tokens)\n",
    "    markers = (A-1) * torch.ones(batch_shape+(M,), dtype=torch.long)\n",
    "\n",
    "    if reverse: zeros_x = zeros_x.flip(-1)\n",
    "    x_ = torch.cat([zeros_x, markers], dim=-1)\n",
    "    y_ = torch.cat([tokens], dim=-1)\n",
    "    #from IPython.core.debugger import Pdb; Pdb().set_trace()\n",
    "    #if reverse: y_ = y_.flip(-1)\n",
    "    #from IPython.core.debugger import Pdb; Pdb().set_trace()\n",
    "    if one_hot: x = F.one_hot(x_, A).float()\n",
    "    else: x = x_\n",
    "    y = y_\n",
    "    return x, y\n",
    "\n",
    "\"\"\"\n",
    "Examples:\n",
    "print(torch_copying_data(10, 5, 10, variable=False, variable_length=False, batch_shape=(), one_hot=False, reverse=False))\n",
    "print(torch_copying_data(10, 5, 10, variable=True, variable_length=False, batch_shape=(), one_hot=False, reverse=False))\n",
    "Outputs:\n",
    "(tensor([2, 2, 2, 4, 6, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 9, 9, 9, 9, 9]), tensor([2, 2, 2, 4, 6])) # copying memory task\n",
    "(tensor([0, 6, 0, 0, 0, 0, 0, 6, 7, 0, 7, 5, 0, 0, 0, 9, 9, 9, 9, 9]), tensor([6, 6, 7, 7, 5])) # selective copying task\n",
    "\"\"\"\n",
    "def generate_dataset(dataset_config, training_config):\n",
    "    \"\"\"\n",
    "    Generate a dataset based on the provided configuration.\n",
    "\n",
    "    Parameters:\n",
    "    dataset_config (dict): Configuration for the dataset\n",
    "    training_config (dict): Configuration for the training\n",
    "\n",
    "    Returns:\n",
    "    tuple: Generated inputs and targets\n",
    "    \"\"\"\n",
    "    x, y  = torch_copying_data(dataset_config[\"l_noise\"], dataset_config[\"l_memorize\"], dataset_config[\"n_tokens\"],\n",
    "                              batch_shape=(training_config[\"batch_size\"],),variable=dataset_config[\"variable\"],\n",
    "                              variable_length=dataset_config[\"variable_length\"], one_hot=dataset_config[\"one_hot\"],\n",
    "                              reverse=dataset_config[\"reverse\"])\n",
    "    return x, y\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7d8170f6-d62c-4756-ab19-b1106224240f",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "@script\n",
    "def mingru_cell_forward(x_t: torch.Tensor, h_prev: torch.Tensor, \n",
    "                        W_h: torch.Tensor, b_h: torch.Tensor,\n",
    "                        W_u: torch.Tensor, b_u: torch.Tensor) -> torch.Tensor:\n",
    "    \n",
    "    z_t = torch.sigmoid(F.linear(x_t, W_u) + b_u)\n",
    "    \n",
    "    x_tilde = F.linear(x_t, W_h) + b_h\n",
    "\n",
    "    h_t = (1 - z_t) * x_tilde + z_t * h_prev\n",
    "    \n",
    "    return h_t\n",
    "\n",
    "class MinGRUCell_v0_hi(nn.Module):\n",
    "    def __init__(self, input_size, hidden_size, bias_mean=1.0, bias_scale=1.0, init_type=\"ugi\"):\n",
    "        super(MinGRUCell_v0_hi, self).__init__()\n",
    "        self.hidden_size = hidden_size\n",
    "        self.bias_scale = bias_scale\n",
    "        self.bias_mean = bias_mean \n",
    "        self.init_type = init_type\n",
    "        self.W_ih = Parameter(\n",
    "            torch.empty((hidden_size, input_size))\n",
    "        )\n",
    "        self.W_iu = Parameter(\n",
    "            torch.empty((hidden_size, input_size))\n",
    "        )\n",
    "        self.b_ih = Parameter(torch.empty(hidden_size))\n",
    "        self.b_iu = Parameter(torch.empty(hidden_size))\n",
    "        self.reset_parameters()\n",
    "\n",
    "    def reset_parameters(self):\n",
    "        logger.info(self.init_type) \n",
    "        nn.init.kaiming_uniform_(self.W_ih, a=math.sqrt(5))\n",
    "        nn.init.kaiming_uniform_(self.W_iu, a=math.sqrt(5))\n",
    "        if self.init_type == 'st':\n",
    "            stdv = 1.0 / math.sqrt(self.hidden_size)\n",
    "            nn.init.uniform_(self.b_ih, -stdv, stdv)\n",
    "            nn.init.uniform_(self.b_iu, -stdv, stdv)\n",
    "            self.b_iu.data.add_(self.bias_mean)\n",
    "            logger.info(self.b_iu.mean()) \n",
    "        elif self.init_type == 'ugi':\n",
    "            stdv = 1.0 / math.sqrt(self.hidden_size)\n",
    "            nn.init.uniform_(self.b_ih, -stdv, stdv)\n",
    "            with torch.no_grad():\n",
    "                stdv2 = 1.0 / self.hidden_size\n",
    "                nn.init.uniform_(self.b_iu, stdv2, 1 - stdv2)\n",
    "                #self.b_iu.uniform_(stdv2, 1 - stdv2)\n",
    "                self.b_iu.data = -torch.log(1/self.b_iu.data - 1)\n",
    "            logger.info(self.b_iu.mean()) \n",
    "        elif self.init_type.find('gumbel_gate') >= 0:\n",
    "            stdv = 1.0 / math.sqrt(self.hidden_size)\n",
    "            nn.init.uniform_(self.b_ih, -stdv, stdv)\n",
    "            nn.init.uniform_(self.b_iu, -stdv, stdv)\n",
    "            self.b_iu.data.add_(self.bias_mean)\n",
    "            logger.info(self.b_iu.mean()) \n",
    "            with torch.no_grad():\n",
    "                stdv2 = 1.0 / self.hidden_size\n",
    "                nn.init.uniform_(self.b_ig, stdv2, 1 - stdv2)\n",
    "                sampled_bias = torch.log(self.b_ig.data) - torch.log(1-self.b_ig.data)\n",
    "                self.b_ig.data = sampled_bias\n",
    "            logger.info(self.b_ig.mean()) \n",
    "            self.tau = float(self.init_type.split('_')[-1])\n",
    "        elif self.init_type == 'chrono':\n",
    "            stdv = 1.0 / math.sqrt(self.hidden_size)\n",
    "            nn.init.uniform_(self.b_ih, -stdv, stdv)\n",
    "            with torch.no_grad():\n",
    "                nn.init.uniform_(self.b_iu, 1, self.bias_mean)\n",
    "                self.b_iu.data = torch.log(self.b_iu.data)\n",
    "            logger.info(self.b_iu.mean()) \n",
    "        elif self.init_type.find('gumbel') >= 0:\n",
    "            logger.info('gumbel') \n",
    "            stdv = 1.0 / math.sqrt(self.hidden_size)\n",
    "            nn.init.uniform_(self.b_ih, -stdv, stdv)\n",
    "            with torch.no_grad():\n",
    "                tau = float(self.init_type.split('_')[-1])\n",
    "                stdv2 = 1.0 / self.hidden_size\n",
    "                nn.init.uniform_(self.b_iu, stdv2, 1 - stdv2)\n",
    "                sampled_bias = torch.tensor(self.bias_mean) + torch.log(self.b_iu.data) - torch.log(1-self.b_iu.data)\n",
    "                self.b_iu.data = sampled_bias/tau\n",
    "            logger.info(self.b_iu.mean()) \n",
    "\n",
    "    def forward(self, x_t, h_prev):\n",
    "        h_t = mingru_cell_forward(x_t, h_prev, \n",
    "                                 self.W_ih, self.b_ih,\n",
    "                                 self.W_iu, self.b_iu)\n",
    "        \n",
    "        return h_t\n",
    "\n",
    "class MinGRU_v0_hi(nn.Module):\n",
    "    def __init__(self, input_size, hidden_size, output_size, num_layers=2, init_types=['ugi', 'ugi'], bias_mean=[1.0, 1.0]):\n",
    "        super(MinGRU_v0_hi, self).__init__()\n",
    "        self.hidden_size = hidden_size\n",
    "        self.num_layers = num_layers\n",
    "        self.cells = nn.ModuleList()\n",
    "        self.cells.append(MinGRUCell_v0_hi(input_size, hidden_size, bias_mean=bias_mean[0], init_type=init_types[0]))\n",
    "        for l_num in range(1, num_layers):\n",
    "            self.cells.append(MinGRUCell_v0_hi(hidden_size, hidden_size, bias_mean=bias_mean[l_num], init_type=init_types[l_num]))\n",
    "        self.output_layer = nn.Linear(hidden_size, output_size)\n",
    "    def forward(self, x_embedded, h_0=None):\n",
    "        \n",
    "        batch_size, seq_len, _ = x_embedded.shape\n",
    "        if h_0 is None: h_0 = torch.zeros(self.num_layers, batch_size, self.hidden_size, device=x_embedded.device)\n",
    "        \n",
    "        hidden_states = list(h_0)\n",
    "        output_seq = torch.empty(batch_size, seq_len, self.hidden_size, \n",
    "                                device=device, dtype=x_embedded.dtype)\n",
    "\n",
    "        for t in range(seq_len):\n",
    "            x_t = x_embedded[:, t, :]\n",
    "            for i, cell in enumerate(self.cells):\n",
    "                hidden_states[i] = cell(x_t, hidden_states[i])\n",
    "                x_t = hidden_states[i] \n",
    "        \n",
    "            output_seq[:, t, :] = hidden_states[-1]\n",
    "        return self.output_layer(output_seq) \n",
    "\n",
    "    def clear_all_histories(self):\n",
    "        for cell in self.cells:\n",
    "            cell.clear_history()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "02e50cae-6c36-4196-a0d0-603b38616f3a",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "2de27a78-8e24-41e9-adcd-9f42c484443a",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "def train(seed, model):\n",
    "\n",
    "    #set seed\n",
    "    set_seed(seed)\n",
    "\n",
    "    embedding = nn.Embedding(dataset_config[\"n_tokens\"], EMBEDDING_DIM).to(device)\n",
    "    \n",
    "    formatted_string = json.dumps(dataset_config, indent=4, ensure_ascii=False)\n",
    "\n",
    "    logger.info(\"--- Combined Configuration ---\\n\" + formatted_string)\n",
    "    criterion = nn.CrossEntropyLoss(ignore_index=-100)\n",
    "    optimizer = optim.AdamW(list(model.parameters()) + list(embedding.parameters()), lr=training_config[\"learning_rate\"])\n",
    "\n",
    "    total_train_loss, total_train_correct, total_train_tokens = 0, 0, 0\n",
    "    logger.info(f\"Starting training with {MODEL_TYPE} model...\")\n",
    "    best_val = 0\n",
    "    log_records = []\n",
    "\n",
    "    #check initial result\n",
    "    val_loss, val_acc, best_val = validate(model, criterion, embedding, best_val, 0, seed)\n",
    "\n",
    "    for step in range(1, training_config[\"num_steps\"] + 1):\n",
    "        total_training_start_time = time.time() \n",
    "\n",
    "        optimizer.zero_grad()\n",
    "\n",
    "        model.train(), embedding.train()\n",
    "\n",
    "        inputs, targets = generate_dataset(dataset_config, training_config)\n",
    "        inputs, targets = inputs.to(device), targets.to(device)\n",
    "        full_targets = torch.full((training_config[\"batch_size\"], SEQ_LEN), -100, dtype=torch.long, device=device)\n",
    "        full_targets[:, -dataset_config[\"l_memorize\"]:] = targets\n",
    "\n",
    "        full_targets = full_targets[:, -dataset_config[\"l_memorize\"]:]\n",
    "\n",
    "        outputs = model(embedding(inputs))[:, -dataset_config[\"l_memorize\"]:]\n",
    "        loss = criterion(outputs.reshape(-1, dataset_config[\"n_tokens\"]), full_targets.reshape(-1))\n",
    "\n",
    "        loss.backward()\n",
    "        optimizer.step()\n",
    "\n",
    "        total_train_loss += loss.item()\n",
    "        with torch.no_grad():\n",
    "            preds = outputs[:, -dataset_config[\"l_memorize\"]:, :].argmax(dim=-1)\n",
    "            total_train_correct += (preds == targets).sum().item()\n",
    "            total_train_tokens += targets.numel()\n",
    "\n",
    "        if step % LOG_INTERVAL == 0:\n",
    "            avg_train_loss = total_train_loss / LOG_INTERVAL\n",
    "            avg_train_acc = 100 * total_train_correct / total_train_tokens\n",
    "            logger.info(f'Step [{step}/{training_config[\"num_steps\"]}], Avg Train Loss: {avg_train_loss:.4f}, Train Accuracy: {avg_train_acc:.2f}%')\n",
    "            total_train_loss, total_train_correct, total_train_tokens = 0, 0, 0\n",
    "        \n",
    "        if step % VALIDATION_INTERVAL == 0:\n",
    "            val_loss, val_acc, best_val = validate(model, criterion, embedding, best_val, step, seed)\n",
    "\n",
    "            log_records.append({\n",
    "                'Step': step, 'Type': 'Validation', \n",
    "                'Loss': val_loss, 'Accuracy': val_acc, 'Best accuracy': best_val\n",
    "            })\n",
    "\n",
    "    logger.info('Training completed.')\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a9be111e-a06d-486e-8884-567ac01b5635",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "def validate(model, criterion, embedding, best_val, step, seed):\n",
    "    logger.info(\"--- Starting Validation ---\")\n",
    "    model.eval(), embedding.eval()\n",
    "    total_val_loss, total_val_correct, total_val_tokens = 0, 0, 0\n",
    "    with torch.no_grad():\n",
    "\n",
    "        for _ in range(VALIDATION_STEPS):\n",
    "            inputs, targets = generate_dataset(dataset_config, training_config)\n",
    "            inputs, targets = inputs.to(device), targets.to(device)\n",
    "            full_targets = torch.full((training_config[\"batch_size\"], SEQ_LEN), -100, dtype=torch.long, device=device)\n",
    "            full_targets[:, -dataset_config[\"l_memorize\"]:] = targets\n",
    "            full_targets = full_targets[:, -dataset_config[\"l_memorize\"]:]\n",
    "            outputs = model(embedding(inputs))[:, -dataset_config[\"l_memorize\"]:]\n",
    "            loss = criterion(outputs.reshape(-1, dataset_config[\"n_tokens\"]), full_targets.reshape(-1))\n",
    "            total_val_loss += loss.item()\n",
    "            preds = outputs[:, -dataset_config[\"l_memorize\"]:, :].argmax(dim=-1)\n",
    "            total_val_correct += (preds == targets).sum().item()\n",
    "            total_val_tokens += targets.numel()\n",
    "            \n",
    "    avg_loss = total_val_loss / VALIDATION_STEPS\n",
    "    accuracy = 100 * total_val_correct / total_val_tokens\n",
    "    logger.info(f\"Validation Results: Avg Loss: {avg_loss:.4f}, Accuracy: {accuracy:.2f}%\")\n",
    "    logger.info(f\"Best Validation Results: Accuracy: {best_val:.2f}%\")\n",
    "    logger.info(\"--- Validation Finished ---\")\n",
    "\n",
    "    if accuracy > best_val:\n",
    "        best_val = accuracy\n",
    "\n",
    "    return avg_loss, accuracy, best_val"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9c3f6774-554e-4a0c-b4ec-c374fbe6a708",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8fdc1023-a666-4943-81c0-8cf02df7bd0b",
   "metadata": {},
   "outputs": [],
   "source": [
    "dataset_config = {\n",
    "    \"l_noise\": 10,\n",
    "    \"l_memorize\": 10,\n",
    "    \"n_tokens\": 10,\n",
    "    \"lag\": False,\n",
    "    #\"variable\": True,\n",
    "    \"variable\": False,\n",
    "    \"variable_length\": False,\n",
    "    \"one_hot\": False,\n",
    "    \"reverse\": False,\n",
    "    \"static\": False,\n",
    "}\n",
    "\n",
    "batch_size = 64\n",
    "training_config = {\n",
    "    \"batch_size\": batch_size,\n",
    "    \"learning_rate\": 0.0001,\n",
    "    \"num_steps\": 10000,\n",
    "}\n",
    "\n",
    "SEQ_LEN = dataset_config[\"l_noise\"] + 2 * dataset_config[\"l_memorize\"]\n",
    "EMBEDDING_DIM = 128\n",
    "LOG_INTERVAL = 500\n",
    "VALIDATION_INTERVAL = 1000\n",
    "VALIDATION_STEPS = 50\n",
    "\n",
    "MODEL_TYPE = 'MinGRU_v0_hi'\n",
    "n_layers = 3\n",
    "\n",
    "init_types = []\n",
    "init_type = 'gumbel_st'\n",
    "init_types.append('gumbel_sigmoid_0.5')\n",
    "for l in range(n_layers - 1):\n",
    "    init_types.append('st')\n",
    "\n",
    "bias_means = []\n",
    "for l in range(n_layers):\n",
    "    bias_means.append(0.0)\n",
    "\n",
    "gru_params = {\n",
    "    'hidden_dim': 128,\n",
    "    'init_type':init_type,\n",
    "    'n_layers': n_layers,\n",
    "    'bias_mean': bias_means\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "457ba5e4-096e-45a3-85b3-4a75b8fe864e",
   "metadata": {},
   "outputs": [],
   "source": [
    "if MODEL_TYPE == 'MinGRU_v0_hi':\n",
    "    logger.info(\"Initializing MinGRU_v0 model...\")\n",
    "    model = MinGRU_v0_hi(EMBEDDING_DIM, gru_params['hidden_dim'], dataset_config[\"n_tokens\"], num_layers=gru_params['n_layers'], init_types=init_types, bias_mean=gru_params['bias_mean']).to(device)\n",
    "    formatted_string = json.dumps(gru_params, indent=4, ensure_ascii=False)\n",
    "    logger.info(\"--- Combined Configuration ---\\n\" + formatted_string)\n",
    "else:\n",
    "    raise ValueError(\"Invalid MODEL_TYPE. \")\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e78c9458-c757-4c57-b384-1eb6684f54f8",
   "metadata": {},
   "outputs": [],
   "source": [
    "seeds_to_run = [42]\n",
    "all_results = []\n",
    "for seed in seeds_to_run:\n",
    "    train(seed, model)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8e4b9119-b679-4715-b8b3-d518a01556f5",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d166282e-926e-4752-b2c2-a4fda0b9d4c6",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
