{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "This notebook prepares the data for the subsequent notebook `1-Step-Entropy-Analyze.ipynb`, which generates figures illustrating the uncertainty analysis of instruction-tuned variants of Llama-3 models, as described in Appendix A.4 of the paper."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import os\n",
    "os.environ[\"TOKENIZERS_PARALLELISM\"] = \"false\"\n",
    "\n",
    "import torch\n",
    "num_devices = torch.cuda.device_count()\n",
    "print(\"Number of visible GPUs:\", num_devices)\n",
    "\n",
    "for i in range(num_devices):\n",
    "    print(f\"GPU {i}: {torch.cuda.get_device_name(i)}\")\n",
    "\n",
    "current_device = torch.cuda.current_device()\n",
    "print(\"Current device index:\", current_device)\n",
    "print(\"Current device name:\", torch.cuda.get_device_name(current_device))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import random\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from tqdm import tqdm\n",
    "\n",
    "from allen_cahn_equation import (\n",
    "    compute_exact_solution_random_ic_vary_Nx,\n",
    "    visualize_spline_ic,\n",
    "    plot_both_grids,\n",
    ")\n",
    "\n",
    "from data_processing import (\n",
    "    SimpleSerializerSettings,\n",
    "    scale_2d_array,\n",
    "    serialize_2d_integers,\n",
    "    extract_training_and_test\n",
    ")\n",
    "\n",
    "from llama_utils import load_model_and_tokenizer, generate_text_multiple\n",
    "\n",
    "MODEL_NAME = \"meta-llama/Llama-3.1-8B-Instruct\"\n",
    "# MODEL_NAME = \"meta-llama/Llama-3.2-3B-Instruct\"\n",
    "# MODEL_NAME = \"meta-llama/Llama-3.2-1B-Instruct\"\n",
    "seed = 42\n",
    "random.seed(seed)\n",
    "np.random.seed(seed)\n",
    "torch.manual_seed(seed)\n",
    "if torch.cuda.is_available():\n",
    "    torch.cuda.manual_seed_all(seed)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "model, tokenizer = load_model_and_tokenizer(MODEL_NAME)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Define parameters for the Allen-Cahn equation\n",
    "L = 2       # Length of the spatial domain\n",
    "k = 0.001   # Thermal diffusivity\n",
    "T = 0.5     # Total simulation time\n",
    "Nx = 14     # Number of spatial steps (excluding boundary points)\n",
    "Nt = 20     # Number of time steps \n",
    "dx = L/(Nx+1)\n",
    "dt = T/Nt\n",
    "\n",
    "# Example: Demonstrating the process of generating and visualizing a random initial condition\n",
    "init_cond_random = np.random.uniform(-0.5, 0.5, size=Nx)\n",
    "fig = visualize_spline_ic(L, Nx, init_cond_random)\n",
    "plt.tight_layout()\n",
    "plt.show()\n",
    "\n",
    "# Example: Demonstrating how to resample spatial points from an underlying random initial condition\n",
    "Nx_original = Nx\n",
    "Nx_new = 14\n",
    "fig, cs, init_cond_random_new = plot_both_grids(L, Nx_original, Nx_new, init_cond_random)\n",
    "plt.tight_layout()\n",
    "plt.show()\n",
    "\n",
    "# Serialization setup\n",
    "settings = SimpleSerializerSettings(space_sep=\",\", time_sep=\";\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def calculate_entropies(generation_outputs, Nx):\n",
    "    \"\"\"\n",
    "    Calculate entropy values from generation outputs.\n",
    "    Output:\n",
    "        entropies: Array of shape (Nx, n_future_steps) containing entropy values\n",
    "        avg_entropy: Average entropy across spatial points\n",
    "    \"\"\"\n",
    "    n_future_steps = len(generation_outputs)\n",
    "    entropies = np.zeros((Nx, n_future_steps))\n",
    "    \n",
    "    # Calculate entropy for all spatial points\n",
    "    for time_idx in range(n_future_steps):\n",
    "        gen_output = generation_outputs[time_idx]\n",
    "        for grid_idx in range(Nx):\n",
    "            token_position = grid_idx * 2  # accounting for spatial separators\n",
    "            if token_position < len(gen_output.scores):\n",
    "                logits = gen_output.scores[token_position][0]\n",
    "                p = torch.softmax(logits, -1).clamp_min(1e-30)\n",
    "                entropy = -(p * torch.log(p)).sum().item()\n",
    "                entropies[grid_idx, time_idx] = entropy\n",
    "    # Calculate average entropy across all spatial points\n",
    "    avg_entropy = entropies.mean(axis=0)\n",
    "    return entropies, avg_entropy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_Nt_values = range(2, 41, 2)\n",
    "n_seeds = 50\n",
    "all_mean_entropies = []\n",
    "all_std_entropies = []\n",
    "all_se_entropies = []\n",
    "\n",
    "for Nt in tqdm(all_Nt_values):\n",
    "    dt = T / Nt\n",
    "    avg_entropies_for_this_Nt = []\n",
    "    for seed in range(n_seeds):\n",
    "        random.seed(seed)\n",
    "        np.random.seed(seed)\n",
    "        torch.manual_seed(seed)\n",
    "        if torch.cuda.is_available():\n",
    "            torch.cuda.manual_seed_all(seed)\n",
    "        # Generate a new random initial condition for this seed\n",
    "        init_cond_random_seed = np.random.uniform(-0.5, 0.5, size=Nx)\n",
    "        # Create new cubic spline for this initial condition\n",
    "        fig, cs_seed, _ = plot_both_grids(L, Nx, Nx, init_cond_random_seed)\n",
    "        plt.close(fig)\n",
    "        # Compute exact solution with this initial condition\n",
    "        u_exact = compute_exact_solution_random_ic_vary_Nx(L, k, T, Nx, Nt, spline_obj=cs_seed)\n",
    "        u_exact_scaled, vmin_exact, vmax_exact = scale_2d_array(u_exact)\n",
    "        u_exact_serialized = serialize_2d_integers(u_exact_scaled, settings)\n",
    "        input_time_steps = Nt\n",
    "        train_serial, test_serial = extract_training_and_test(\n",
    "            u_exact_serialized, input_time_steps, settings\n",
    "        )\n",
    "        # LLM prediction\n",
    "        generated_token, gen_output = generate_text_multiple(\n",
    "            prompt=train_serial,\n",
    "            model=model,\n",
    "            tokenizer=tokenizer,\n",
    "            Nx=Nx,\n",
    "        )\n",
    "        # Calculate entropy\n",
    "        entropies, avg_entropy = calculate_entropies([gen_output], Nx)\n",
    "        avg_entropies_for_this_Nt.append(avg_entropy[0])\n",
    "    avg_entropies_array = np.array(avg_entropies_for_this_Nt)\n",
    "    mean_entropy = np.mean(avg_entropies_array)\n",
    "    std_entropy = np.std(avg_entropies_array, ddof=1)\n",
    "    se_entropy = std_entropy / np.sqrt(n_seeds)\n",
    "    all_mean_entropies.append(mean_entropy)\n",
    "    all_std_entropies.append(std_entropy)\n",
    "    all_se_entropies.append(se_entropy)\n",
    "mean_entropies = np.array(all_mean_entropies)\n",
    "std_entropies = np.array(all_std_entropies)\n",
    "se_entropies = np.array(all_se_entropies)\n",
    "\n",
    "np.savez_compressed(\n",
    "    \"8B_1_step_token_time_variation.npz\",\n",
    "    mean_entropies_8B=mean_entropies,\n",
    "    std_entropies_8B=std_entropies,\n",
    "    se_entropies_8B=se_entropies,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "all_Nx_values = range(2, 41, 2)\n",
    "fixed_Nt = 50\n",
    "all_mean_entropies = []\n",
    "all_std_entropies = []\n",
    "all_se_entropies = []\n",
    "# Reference resolution for generating initial conditions\n",
    "Nx_reference = 14\n",
    "\n",
    "for Nx in tqdm(all_Nx_values):\n",
    "    dt = T / fixed_Nt\n",
    "    avg_entropies_for_this_Nx = []\n",
    "    for seed in range(n_seeds):\n",
    "        # Set random seed for generating different initial conditions\n",
    "        random.seed(seed)\n",
    "        np.random.seed(seed)\n",
    "        torch.manual_seed(seed)\n",
    "        if torch.cuda.is_available():\n",
    "            torch.cuda.manual_seed_all(seed)\n",
    "        # Generate a new random initial condition at reference resolution\n",
    "        init_cond_random_seed = np.random.uniform(-0.5, 0.5, size=Nx_reference)\n",
    "        # Resample the initial condition from reference resolution to current Nx\n",
    "        fig, cs_seed, init_cond_resampled = plot_both_grids(L, Nx_reference, Nx, init_cond_random_seed)\n",
    "        plt.close(fig)\n",
    "        # Compute exact solution for this Nx with the resampled initial condition\n",
    "        u_exact = compute_exact_solution_random_ic_vary_Nx(L, k, T, Nx, fixed_Nt, spline_obj=cs_seed)\n",
    "        u_exact_scaled, vmin_exact, vmax_exact = scale_2d_array(u_exact)\n",
    "        u_exact_serialized = serialize_2d_integers(u_exact_scaled, settings)\n",
    "        input_time_steps = fixed_Nt\n",
    "        train_serial, test_serial = extract_training_and_test(\n",
    "            u_exact_serialized, input_time_steps, settings\n",
    "        )\n",
    "        # LLM prediction\n",
    "        generated_token, gen_output = generate_text_multiple(\n",
    "            prompt=train_serial,\n",
    "            model=model,\n",
    "            tokenizer=tokenizer,\n",
    "            Nx=Nx,\n",
    "        )\n",
    "        # Calculate entropy\n",
    "        entropies, avg_entropy = calculate_entropies([gen_output], Nx)\n",
    "        avg_entropies_for_this_Nx.append(avg_entropy[0])\n",
    "    avg_entropies_array = np.array(avg_entropies_for_this_Nx)\n",
    "    mean_entropy = np.mean(avg_entropies_array)\n",
    "    std_entropy = np.std(avg_entropies_array, ddof=1)\n",
    "    se_entropy = std_entropy / np.sqrt(n_seeds)\n",
    "    all_mean_entropies.append(mean_entropy)\n",
    "    all_std_entropies.append(std_entropy)\n",
    "    all_se_entropies.append(se_entropy)\n",
    "mean_entropies_Nx = np.array(all_mean_entropies)\n",
    "std_entropies_Nx = np.array(all_std_entropies)\n",
    "se_entropies_Nx = np.array(all_se_entropies)\n",
    "\n",
    "np.savez_compressed(\n",
    "    \"8B_1_step_token_space_variation.npz\",\n",
    "    mean_entropies_8B_Nx=mean_entropies_Nx,\n",
    "    std_entropies_8B_Nx=std_entropies_Nx,\n",
    "    se_entropies_8B_Nx=se_entropies_Nx,\n",
    ")"
   ]
  }
 ],
 "metadata": {
  "accelerator": "GPU",
  "colab": {
   "gpuType": "A100",
   "machine_shape": "hm",
   "provenance": []
  },
  "kernelspec": {
   "display_name": "smollm",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.11"
  },
  "widgets": {
   "application/vnd.jupyter.widget-state+json": {
    "4bca38f991eb477fb6f6448ed40b7953": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_f282a01a1fa94fd3841fa84b0bf85801",
      "placeholder": "​",
      "style": "IPY_MODEL_bfdb859e858e42869e6da9b1482a5702",
      "value": "Loading checkpoint shards: 100%"
     }
    },
    "79d7edd2ec684e25b3674d375812e5fc": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "82fd26e315b6460ab439920956ecfc4b": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "8d598e552e3e4f3f9ffd47c953554ad0": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HTMLModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HTMLModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HTMLView",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_79d7edd2ec684e25b3674d375812e5fc",
      "placeholder": "​",
      "style": "IPY_MODEL_b9ca4f266f0247a3aca54430f78c7bf4",
      "value": " 2/2 [00:04&lt;00:00,  2.25s/it]"
     }
    },
    "b9ca4f266f0247a3aca54430f78c7bf4": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "be3db56ffe3047a6ab8493d65d18f5c6": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "bfdb859e858e42869e6da9b1482a5702": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "DescriptionStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "DescriptionStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "description_width": ""
     }
    },
    "e0dd1da9791a4911932193befbfd4dd0": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "ProgressStyleModel",
     "state": {
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "ProgressStyleModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "StyleView",
      "bar_color": null,
      "description_width": ""
     }
    },
    "e8bbace417ee4d74ae8e9fdcaf023b44": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "FloatProgressModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "FloatProgressModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "ProgressView",
      "bar_style": "success",
      "description": "",
      "description_tooltip": null,
      "layout": "IPY_MODEL_be3db56ffe3047a6ab8493d65d18f5c6",
      "max": 2,
      "min": 0,
      "orientation": "horizontal",
      "style": "IPY_MODEL_e0dd1da9791a4911932193befbfd4dd0",
      "value": 2
     }
    },
    "f282a01a1fa94fd3841fa84b0bf85801": {
     "model_module": "@jupyter-widgets/base",
     "model_module_version": "1.2.0",
     "model_name": "LayoutModel",
     "state": {
      "_model_module": "@jupyter-widgets/base",
      "_model_module_version": "1.2.0",
      "_model_name": "LayoutModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/base",
      "_view_module_version": "1.2.0",
      "_view_name": "LayoutView",
      "align_content": null,
      "align_items": null,
      "align_self": null,
      "border": null,
      "bottom": null,
      "display": null,
      "flex": null,
      "flex_flow": null,
      "grid_area": null,
      "grid_auto_columns": null,
      "grid_auto_flow": null,
      "grid_auto_rows": null,
      "grid_column": null,
      "grid_gap": null,
      "grid_row": null,
      "grid_template_areas": null,
      "grid_template_columns": null,
      "grid_template_rows": null,
      "height": null,
      "justify_content": null,
      "justify_items": null,
      "left": null,
      "margin": null,
      "max_height": null,
      "max_width": null,
      "min_height": null,
      "min_width": null,
      "object_fit": null,
      "object_position": null,
      "order": null,
      "overflow": null,
      "overflow_x": null,
      "overflow_y": null,
      "padding": null,
      "right": null,
      "top": null,
      "visibility": null,
      "width": null
     }
    },
    "fd21f3afeb514a51a73822346535fdec": {
     "model_module": "@jupyter-widgets/controls",
     "model_module_version": "1.5.0",
     "model_name": "HBoxModel",
     "state": {
      "_dom_classes": [],
      "_model_module": "@jupyter-widgets/controls",
      "_model_module_version": "1.5.0",
      "_model_name": "HBoxModel",
      "_view_count": null,
      "_view_module": "@jupyter-widgets/controls",
      "_view_module_version": "1.5.0",
      "_view_name": "HBoxView",
      "box_style": "",
      "children": [
       "IPY_MODEL_4bca38f991eb477fb6f6448ed40b7953",
       "IPY_MODEL_e8bbace417ee4d74ae8e9fdcaf023b44",
       "IPY_MODEL_8d598e552e3e4f3f9ffd47c953554ad0"
      ],
      "layout": "IPY_MODEL_82fd26e315b6460ab439920956ecfc4b"
     }
    }
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
