{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "valued-value",
   "metadata": {},
   "source": [
    "# Evaluating the Linear Hard Case"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "senior-constitutional",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import torch\n",
    "from torch.optim import LBFGS, SGD\n",
    "import matplotlib.pyplot as plt\n",
    "from scipy.io import loadmat, savemat\n",
    "from tqdm.notebook import trange, tqdm\n",
    "\n",
    "torch.set_default_tensor_type(torch.cuda.FloatTensor)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "integral-synthetic",
   "metadata": {},
   "outputs": [],
   "source": [
    "def generate_inputs(d, k, n, T, eps):\n",
    "    top_block_samples = np.sqrt(eps) * torch.randn(T, n, d-k)\n",
    "    bottom_block_samples = torch.randn(T, n, k)\n",
    "    return torch.cat([top_block_samples, bottom_block_samples], dim=-1)\n",
    "\n",
    "def generate_weights(d, k, T, eps):\n",
    "    dominant, residual = torch.randn(T, k), torch.randn(T, k)\n",
    "    dominant /= torch.norm(dominant, dim=-1, keepdim=True)\n",
    "    residual /= torch.norm(residual, dim=-1, keepdim=True)\n",
    "    return torch.cat([np.sqrt(1/(2*eps)) * dominant, torch.zeros((T, d-2*k)), residual], axis=-1)\n",
    "\n",
    "def generate_labels(inputs, predictors, noise_stddev):\n",
    "    means = torch.matmul(inputs, predictors[:, :, None])[:, :, 0]\n",
    "    return means + noise_stddev * torch.randn(*means.shape)\n",
    "\n",
    "\n",
    "def train_loop(opt_vars, optimizer, loss_fn, projection, datasets, train_params, plot_losses=False):\n",
    "    \"\"\"\n",
    "    opt_vars: list of PyTorch variables\n",
    "    optimizer: pytorch.optim\n",
    "    loss_fn: takes (opt_vars, X, y)\n",
    "    projection: takes opt_vars, applies changes to .data only\n",
    "    datasets: list containing two tensors of shapes [(T, n, d), (T, n)]\n",
    "              first tensor is inputs, second is labels, T is number of parallel datasets\n",
    "    train_params: {batch_size, num_batches, train_desc}\n",
    "    \"\"\"\n",
    "    dataset_size = datasets[0].shape[1]\n",
    "    batch_size = train_params[\"batch_size\"]\n",
    "    num_batches_per_pass = int(np.ceil(dataset_size / batch_size))\n",
    "    \n",
    "    with torch.no_grad():\n",
    "        projection(opt_vars)\n",
    "        \n",
    "    best_opt_vars, best_loss = [opt_var.data.clone() for opt_var in opt_vars], np.inf\n",
    "    losses = []\n",
    "    for num_batch in trange(train_params[\"num_batches\"], leave=False, desc=train_params[\"train_desc\"]):\n",
    "        batch_idx = num_batch % num_batches_per_pass\n",
    "        \n",
    "        # Check if this is a new_pass - if so, shuffle the data\n",
    "        if batch_idx == 0:   \n",
    "            perm = torch.randperm(dataset_size)\n",
    "            datasets = [datasets[0][:, perm], datasets[1][:, perm]]\n",
    "            \n",
    "        start_idx, end_idx = batch_idx * batch_size, (batch_idx + 1) * batch_size\n",
    "        batch_X, batch_y = datasets[0][:, start_idx:end_idx], datasets[1][:, start_idx:end_idx]\n",
    "\n",
    "        optimizer.zero_grad()\n",
    "        loss_fn(opt_vars, batch_X, batch_y).backward()\n",
    "        optimizer.step(lambda: loss_fn(opt_vars, batch_X, batch_y))\n",
    "\n",
    "        with torch.no_grad():\n",
    "            projection(opt_vars)\n",
    "            cur_loss = loss_fn(opt_vars, datasets[0], datasets[1]).item()\n",
    "            if cur_loss <= best_loss:\n",
    "                best_opt_vars = [opt_var.data.clone() for opt_var in opt_vars]\n",
    "                best_loss = cur_loss\n",
    "            losses.append(cur_loss)\n",
    "            \n",
    "    if plot_losses:\n",
    "        plt.plot(losses)\n",
    "        plt.xlim((0, train_params[\"num_batches\"]))\n",
    "        plt.show()\n",
    "        \n",
    "    return best_opt_vars"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "fuzzy-examination",
   "metadata": {},
   "source": [
    "## Source Training"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "funky-attention",
   "metadata": {},
   "outputs": [],
   "source": [
    "def prep_frozenrep_training(d, k, T, n, eps, noise_stddev):\n",
    "    B_train, W_train = torch.randn(d, k, requires_grad=True), torch.randn(k, T, requires_grad=True)\n",
    "    opt_vars = [B_train, W_train]\n",
    "    optimizer = LBFGS(opt_vars, lr=0.1, history_size=5)\n",
    "\n",
    "    def loss_fn(opt_vars, inputs, labels):\n",
    "        B_train, W_train = opt_vars\n",
    "        weights_train = torch.matmul(B_train, W_train).T\n",
    "        predictions = torch.matmul(inputs, weights_train[:, :, None])[:, :, 0]\n",
    "        mse = torch.mean(torch.square(labels - predictions))\n",
    "        regularization = 1/(4*T) * torch.sum(torch.square(torch.matmul(B_train.T, B_train) - torch.matmul(W_train, W_train.T)))\n",
    "        return mse + regularization\n",
    "\n",
    "    def create_projection(C0):\n",
    "        def projection(opt_vars):\n",
    "            B_train, W_train = opt_vars\n",
    "            W_train.data /= torch.max(torch.norm(W_train, dim=0, keepdim=True) / np.sqrt(C0 * np.sqrt(k / T)), torch.tensor([1.]))\n",
    "            W_train.data /= torch.max(torch.svd(W_train, compute_uv=False)[1][0] / np.sqrt(C0 * np.sqrt(T / k)), torch.tensor([1.]))\n",
    "            B_train.data /= torch.max(torch.svd(B_train, compute_uv=False)[1][0] / np.sqrt(C0 * np.sqrt(T / k)), torch.tensor([1.]))\n",
    "        return projection\n",
    "    \n",
    "    return opt_vars, optimizer, loss_fn, create_projection(3) \n",
    "\n",
    "def prep_adaptrep_training(d, k, T, n, eps, noise_stddev):\n",
    "    B_train = torch.randn(d, k, requires_grad=True) \n",
    "    W_train = torch.randn(k, T, requires_grad=True)\n",
    "    Delta_train = torch.randn(d, T, requires_grad=True)\n",
    "    opt_vars = [B_train, W_train, Delta_train]\n",
    "    optimizer = LBFGS(opt_vars, lr=0.1, history_size=5)\n",
    "\n",
    "    def loss_fn(opt_vars, inputs, labels):\n",
    "        B_train, W_train, Delta_train = opt_vars\n",
    "        weights_train = (torch.matmul(B_train, W_train) + Delta_train).T\n",
    "        predictions = torch.matmul(inputs, weights_train[:, :, None])[:, :, 0]\n",
    "        mse = torch.mean(torch.square(labels - predictions))\n",
    "        regularization = 1/(4*T) * torch.sum(torch.square(torch.matmul(B_train.T, B_train) - torch.matmul(W_train, W_train.T)))\n",
    "        delta_reg = noise_stddev * (np.sqrt(k * d / (n * T)) + np.sqrt(k / n)) * torch.mean(torch.norm(Delta_train, dim=0))\n",
    "        return mse + regularization + delta_reg\n",
    "\n",
    "    def create_projection(C0):\n",
    "        def projection(opt_vars):\n",
    "            B_train, W_train, Delta_train = opt_vars\n",
    "            W_train.data /= torch.max(torch.norm(W_train, dim=0, keepdim=True) / np.sqrt(C0 * np.sqrt(k / T)), torch.tensor([1.]))\n",
    "            W_train.data /= torch.max(torch.svd(W_train, compute_uv=False)[1][0] / np.sqrt(C0 * np.sqrt(T / k)), torch.tensor([1.]))\n",
    "            B_train.data /= torch.max(torch.svd(B_train, compute_uv=False)[1][0] / np.sqrt(C0 * np.sqrt(T / k)), torch.tensor([1.]))\n",
    "            Delta_train.data /= torch.max(torch.norm(Delta_train, dim=0, keepdim=True) / 2, torch.tensor([1]).float().cuda())\n",
    "        return projection\n",
    "    \n",
    "    return opt_vars, optimizer, loss_fn, create_projection(3) "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "korean-contract",
   "metadata": {},
   "outputs": [],
   "source": [
    "k = 2\n",
    "T = 1000\n",
    "noise_stddev = 1\n",
    "\n",
    "for exp_set in trange(1):\n",
    "    for d in tqdm([4 * (i + 1) for i in range(25)], leave=False):\n",
    "        n = 10 * d\n",
    "        eps = k / d\n",
    "\n",
    "        X = generate_inputs(d, k, n, T, eps)\n",
    "        true_weights = generate_weights(d, k, T, eps)\n",
    "        y = generate_labels(X, true_weights, noise_stddev)\n",
    "\n",
    "        # Train representation via FrozenRep\n",
    "        for att in range(10):\n",
    "            while True:\n",
    "                try:\n",
    "                    opt_vars, optimizer, loss_fn, projector = prep_frozenrep_training(d, k, T, n, eps, noise_stddev)\n",
    "                    opt_vars = train_loop(\n",
    "                        opt_vars, optimizer, loss_fn, projector, (X, y),\n",
    "                        {\"num_batches\": 500, \"batch_size\": 64, \"train_desc\": \"Training by ERM-LTL\"}\n",
    "                    )\n",
    "                    break\n",
    "                except RuntimeError:\n",
    "                    pass\n",
    "            savemat(\"representation-learning/set%i/frozenrep-k%i-d%i-attempt%i.mat\" % (exp_set, k, d, att), {\n",
    "                \"representation\": opt_vars[0].cpu().numpy(),\n",
    "                \"k\": k,\n",
    "                \"T\": T,\n",
    "                \"d\": d,\n",
    "                \"n\": n,\n",
    "                \"eps\": eps,\n",
    "                \"noise_stddev\": noise_stddev\n",
    "            })\n",
    "\n",
    "        # Train representation via AdaptRep\n",
    "        for att in range(10):\n",
    "            while True:\n",
    "                try:\n",
    "                    opt_vars, optimizer, loss_fn, projector = prep_adaptrep_training(d, k, T, n, eps, noise_stddev)\n",
    "                    opt_vars = train_loop(\n",
    "                        opt_vars, optimizer, loss_fn, projector, (X, y),\n",
    "                        {\"num_batches\": 500, \"batch_size\": 64, \"train_desc\": \"Training by adaptation\"}\n",
    "                    )\n",
    "                    break\n",
    "                except RuntimeError:\n",
    "                    pass\n",
    "            savemat(\"representation-learning/set%i/adaptrep-k%i-d%i-attempt%i.mat\" % (exp_set, k, d, att), {\n",
    "                \"representation\": opt_vars[0].cpu().numpy(),\n",
    "                \"k\": k,\n",
    "                \"T\": T,\n",
    "                \"d\": d,\n",
    "                \"n\": n,\n",
    "                \"eps\": eps,\n",
    "                \"noise_stddev\": noise_stddev\n",
    "            })"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "tired-reviewer",
   "metadata": {},
   "source": [
    "## Target Training"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "under-trail",
   "metadata": {},
   "outputs": [],
   "source": [
    "def find_adversary(B_learned):\n",
    "    d, k = B_learned.shape\n",
    "    orth_opt = torch.cat([torch.eye(k), torch.zeros(d-k, k)], axis=0)\n",
    "    delta_opt = torch.cat([torch.zeros(d-k, k), torch.eye(k)], axis=0)\n",
    "    \n",
    "    orth_learned = torch.svd(B_learned, some=True)[0]\n",
    "    projector_learned = torch.matmul(orth_learned, orth_learned.T)\n",
    "    proj_perp_learned = torch.eye(projector_learned.shape[0]) - projector_learned\n",
    "    \n",
    "    opt_res = torch.matmul(proj_perp_learned, orth_opt)\n",
    "    delta_res = torch.matmul(proj_perp_learned, delta_opt)\n",
    "    \n",
    "    return torch.matmul(orth_opt, torch.svd(opt_res, some=True)[2][:, :1]), \\\n",
    "           torch.matmul(delta_opt, torch.svd(delta_res, some=True)[2][:, :1])\n",
    "\n",
    "def prep_training_w_rep(B_learned, d, k, T, n, eps, noise_stddev):\n",
    "    W_train = torch.randn(k, T, requires_grad=True)\n",
    "    Delta_train = torch.randn(d, T, requires_grad=True)\n",
    "    opt_vars = [W_train, Delta_train]\n",
    "    optimizer = SGD(opt_vars, lr=0.01)\n",
    "\n",
    "    def loss_fn(opt_vars, inputs, labels):\n",
    "        W_train, Delta_train = opt_vars\n",
    "        weights_train = (torch.matmul(B_learned, W_train) + Delta_train).T\n",
    "        predictions = torch.matmul(inputs, weights_train[:, :, None])[:, :, 0]\n",
    "        mse = torch.sum(torch.mean(torch.square(labels - predictions), dim=-1))\n",
    "        regularization = (2 * k / np.sqrt(n)) * torch.sum(torch.norm(Delta_train, dim=0))\n",
    "        return mse + regularization\n",
    "\n",
    "    def projection(opt_vars):\n",
    "        pass\n",
    "    \n",
    "    return opt_vars, optimizer, loss_fn, projection\n",
    "\n",
    "def prep_baseline(d, k, T, n, eps, noise_stddev):\n",
    "    Delta_train = torch.randn(d, T, requires_grad=True)\n",
    "    opt_vars = [Delta_train]\n",
    "    optimizer = SGD(opt_vars, lr=0.1)\n",
    "    \n",
    "    def loss_fn(opt_vars, inputs, labels):\n",
    "        Delta_train = opt_vars[0]\n",
    "        weights_train = Delta_train.T\n",
    "        predictions = torch.matmul(inputs, weights_train[:, :, None])[:, :, 0]\n",
    "        return torch.sum(torch.mean(torch.square(labels - predictions), dim=-1))\n",
    "    \n",
    "    def projection(opt_vars):\n",
    "        pass\n",
    "    \n",
    "    return opt_vars, optimizer, loss_fn, projection"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "occasional-farmer",
   "metadata": {},
   "outputs": [],
   "source": [
    "rep_k = 2\n",
    "\n",
    "ERM_losses, adapt_losses, opt_losses, baseline_losses = [], [], [], []\n",
    "\n",
    "for rep_d in tqdm([4 * (i + 1) for i in range(25)]):\n",
    "    ERM_data = [loadmat(\"representation-learning/set0/frozenrep-k%i-d%i-attempt%i.mat\" % (rep_k, rep_d, att))\n",
    "                for att in range(10)]\n",
    "    adapt_data = [loadmat(\"representation-learning/set0/adaptrep-k%i-d%i-attempt%i.mat\" % (rep_k, rep_d, att))\n",
    "                  for att in range(10)]\n",
    "\n",
    "    k = int(ERM_data[0][\"k\"].item())\n",
    "    d = int(ERM_data[0][\"d\"].item())\n",
    "    n = d\n",
    "    T = 1000\n",
    "    eps = ERM_data[0][\"eps\"].item()\n",
    "    noise_stddev = 1\n",
    "\n",
    "    # Load representations\n",
    "    Bs_ERM = [torch.svd(torch.from_numpy(data[\"representation\"]).cuda(), some=True)[0] for data in ERM_data]\n",
    "    Bs_adapt = [torch.svd(torch.from_numpy(data[\"representation\"]).cuda(), some=True)[0] for data in adapt_data]\n",
    "    B_opt = torch.cat([torch.eye(k), torch.zeros(d-k, k)], axis=0)\n",
    "\n",
    "    # Compute worst-case predictor for FrozenRep\n",
    "    adv_dirs = [find_adversary(B_ERM) for B_ERM in Bs_ERM]\n",
    "    ERM_advs = [np.sqrt(1 / (2 * eps)) * opt_dir + delta_dir for (opt_dir, delta_dir) in adv_dirs]\n",
    "\n",
    "    # Compute worst-case predictor for AdaptRep\n",
    "    adv_dirs = [find_adversary(B_adapt) for B_adapt in Bs_adapt]\n",
    "    adapt_advs = [np.sqrt(1 / (2 * eps)) * opt_dir + delta_dir for (opt_dir, delta_dir) in adv_dirs]\n",
    "    \n",
    "    # Compute worst-case predictor for optimum\n",
    "    opt_dir, delta_dir = find_adversary(B_opt)\n",
    "    opt_adversary = np.sqrt(1 / (2 * eps)) * opt_dir + delta_dir\n",
    "\n",
    "    # Generate data\n",
    "    X = generate_inputs(d, k, n, T, eps)\n",
    "    ys_ERM = [generate_labels(X, torch.tile(ERM_adv.T, [T, 1]), noise_stddev) for ERM_adv in ERM_advs]\n",
    "    ys_adapt = [generate_labels(X, torch.tile(adapt_adv.T, [T, 1]), noise_stddev) for adapt_adv in adapt_advs]\n",
    "    y_opt = generate_labels(X, torch.tile(opt_adversary.T, [T, 1]), noise_stddev)\n",
    "    \n",
    "    # Train using optimal representation\n",
    "    opt_vars, optimizer, loss_fn, projection = prep_training_w_rep(B_opt, d, k, T, n, eps, noise_stddev)\n",
    "    W_train, Delta_train = train_loop(\n",
    "        opt_vars, optimizer, loss_fn, projection, (X, y_opt),\n",
    "        {\"num_batches\": 3000, \"batch_size\": 16, \"train_desc\": \"Training using optimal representation\"},\n",
    "    )\n",
    "    estimator_delta = (torch.matmul(B_opt, W_train) + Delta_train).T.detach() - opt_adversary.T\n",
    "    opt_excess_risks = eps * torch.square(torch.norm(estimator_delta[:, :-k], dim=-1)) + torch.square(torch.norm(estimator_delta[:, -k:], dim=-1))\n",
    "    opt_losses.append(torch.mean(opt_excess_risks).item())\n",
    "\n",
    "    # Train using FrozenRep-derived representation\n",
    "    min_loss = np.inf\n",
    "    for (B_ERM, y_ERM, ERM_adversary) in tqdm(zip(Bs_ERM, ys_ERM, ERM_advs), leave=False, total=len(Bs_ERM)):\n",
    "        opt_vars, optimizer, loss_fn, projection = prep_training_w_rep(B_ERM, d, k, T, n, eps, noise_stddev)\n",
    "        W_train, Delta_train = train_loop(\n",
    "            opt_vars, optimizer, loss_fn, projection, (X, y_ERM),\n",
    "            {\"num_batches\": 3000, \"batch_size\": 16, \"train_desc\": \"Training using FrozenRep-derived representation\"},\n",
    "        )\n",
    "        estimator_delta = (torch.matmul(B_ERM, W_train) + Delta_train).T.detach() - ERM_adversary.T\n",
    "        ERM_excess_risks = eps * torch.square(torch.norm(estimator_delta[:, :-k], dim=-1)) + torch.square(torch.norm(estimator_delta[:, -k:], dim=-1))\n",
    "        min_loss = np.minimum(torch.mean(ERM_excess_risks).item(), min_loss)\n",
    "    ERM_losses.append(min_loss)\n",
    "\n",
    "    # Train using AdaptRep-derived representation\n",
    "    min_loss = np.inf\n",
    "    for (B_adapt, y_adapt, adapt_adversary) in tqdm(zip(Bs_adapt, ys_adapt, adapt_advs), leave=False, total=len(Bs_ERM)):\n",
    "        opt_vars, optimizer, loss_fn, projection = prep_training_w_rep(B_adapt, d, k, T, n, eps, noise_stddev)\n",
    "        W_train, Delta_train = train_loop(\n",
    "            opt_vars, optimizer, loss_fn, projection, (X, y_adapt),\n",
    "            {\"num_batches\": 3000, \"batch_size\": 16, \"train_desc\": \"Training using AdaptRep-derived representation\"},\n",
    "        )\n",
    "        estimator_delta = (torch.matmul(B_adapt, W_train) + Delta_train).T.detach() - adapt_adversary.T\n",
    "        adapt_excess_risks = eps * torch.square(torch.norm(estimator_delta[:, :-k], dim=-1)) + torch.square(torch.norm(estimator_delta[:, -k:], dim=-1))\n",
    "        min_loss = np.minimum(torch.mean(adapt_excess_risks).item(), min_loss)\n",
    "    adapt_losses.append(min_loss)\n",
    "    \n",
    "    # Train baseline linear regression\n",
    "    opt_vars, optimizer, loss_fn, projection = prep_baseline(d, k, T, n, eps, noise_stddev)\n",
    "    Delta_train = train_loop(\n",
    "        opt_vars, optimizer, loss_fn, projection, (X, y_ERM),\n",
    "        {\"num_batches\": 5000, \"batch_size\": 16, \"train_desc\": \"Training using baseline linear regression\"},\n",
    "    )[0]\n",
    "    estimator_delta = Delta_train.T.detach() - ERM_adversary.T\n",
    "    baseline_excess_risks = eps * torch.square(torch.norm(estimator_delta[:, :-k], dim=-1)) + torch.square(torch.norm(estimator_delta[:, -k:], dim=-1))\n",
    "    baseline_losses.append(torch.mean(baseline_excess_risks).item())\n",
    "    \n",
    "savemat(\"representation-learning-evals.mat\", {\n",
    "    \"FrozenRep\": np.array(ERM_losses),\n",
    "    \"AdaptRep\": np.array(adapt_losses),\n",
    "    \"optimal\": np.array(opt_losses),\n",
    "    \"baseline\": np.array(baseline_losses)\n",
    "})"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "private-excellence",
   "metadata": {},
   "source": [
    "## Plotting"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "moderate-tractor",
   "metadata": {},
   "outputs": [],
   "source": [
    "results = loadmat(\"representation-learning-evals.mat\")\n",
    "opt_losses = results[\"optimal\"][0]\n",
    "frozenrep_losses = results[\"FrozenRep\"][0]\n",
    "adaptrep_losses = results[\"AdaptRep\"][0]\n",
    "baseline_losses = results[\"baseline\"][0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "nuclear-reward",
   "metadata": {},
   "outputs": [],
   "source": [
    "plt.figure(figsize=(10, 5))\n",
    "plt.plot([4 * (i + 1) for i in range(25)], opt_losses, label=\"$B*$\", linewidth=3, color=\"black\", linestyle=\"--\")\n",
    "plt.plot([4 * (i + 1) for i in range(25)], ERM_losses, label=\"FreezeRep\", linewidth=3, color=\"orange\")\n",
    "plt.plot([4 * (i + 1) for i in range(25)], adapt_losses, label=\"AdaptRep\", linewidth=3, color=\"green\")\n",
    "plt.plot([4 * (i + 1) for i in range(25)], baseline_losses, label=\"Linear Regression\", linewidth=3, color=\"red\")\n",
    "\n",
    "plt.xlim((4, 4 * 25))\n",
    "plt.semilogy()\n",
    "plt.xticks([4 * (2 * i + 1) for i in range(12)] + [100], fontsize=12)\n",
    "plt.yticks(fontsize=12)\n",
    "plt.xlabel(\"$n_{\\mathrm{T}}$\", fontsize=15)\n",
    "plt.ylabel(\"Target Task Excess Risk\", fontsize=15)\n",
    "plt.legend(fontsize=15)\n",
    "\n",
    "plt.savefig(\"plots-semilogy.pdf\", bbox_inches='tight')"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.6.9"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
