{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "bc16b7ce",
   "metadata": {},
   "outputs": [
    {
     "ename": "TypeError",
     "evalue": "__init__() missing 1 required positional argument: 'dim'",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mTypeError\u001b[0m                                 Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[4], line 15\u001b[0m\n\u001b[1;32m     13\u001b[0m N_dim \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m5\u001b[39m\n\u001b[1;32m     14\u001b[0m N_test \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m10000\u001b[39m\n\u001b[0;32m---> 15\u001b[0m problem \u001b[38;5;241m=\u001b[39m \u001b[43mZDT2\u001b[49m\u001b[43m(\u001b[49m\u001b[43mnegate\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\u001b[43m)\u001b[49m\u001b[38;5;241m.\u001b[39mto(\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mtkwargs)\n\u001b[1;32m     16\u001b[0m np\u001b[38;5;241m.\u001b[39mrandom\u001b[38;5;241m.\u001b[39mseed(\u001b[38;5;241m5\u001b[39m)\n\u001b[1;32m     17\u001b[0m X_test_all\u001b[38;5;241m=\u001b[39mlhs(N_dim,N_test)\n",
      "\u001b[0;31mTypeError\u001b[0m: __init__() missing 1 required positional argument: 'dim'"
     ]
    }
   ],
   "source": [
    "# Star import kept first so the explicit imports below win any name clash.\n",
    "from pyDOE import *\n",
    "\n",
    "import numpy as np\n",
    "import torch\n",
    "from botorch.test_functions.multi_objective import ZDT2\n",
    "from botorch.utils.multi_objective.box_decompositions.dominated import DominatedPartitioning\n",
    "from botorch.utils.multi_objective.pareto import is_non_dominated\n",
    "from botorch.utils.transforms import unnormalize, normalize\n",
    "\n",
    "tkwargs = {\n",
    "    \"dtype\": torch.double,\n",
    "    \"device\": torch.device(\"cpu\"),\n",
    "}\n",
    "\n",
    "N_dim = 5  # number of design variables; also used as the ZDT2 problem dimension\n",
    "N_test = 10000  # number of Latin-hypercube samples used to approximate the true front\n",
    "\n",
    "# The problem dimension must equal the number of sampled columns, otherwise the\n",
    "# samples cannot be unnormalized against problem.bounds.\n",
    "# BoTorch's ZDT family is bi-objective only, so num_objectives has to be 2.\n",
    "problem = ZDT2(dim=N_dim, num_objectives=2, negate=True).to(**tkwargs)\n",
    "\n",
    "# Seed NumPy's global RNG before sampling so the design is reproducible\n",
    "# (assumes pyDOE's lhs draws from np.random -- TODO confirm for the installed version).\n",
    "np.random.seed(5)\n",
    "# Convert the NumPy design once, directly to the target dtype/device.\n",
    "X_unit = torch.as_tensor(lhs(N_dim, N_test), **tkwargs)\n",
    "X_test_all = unnormalize(X_unit, problem.bounds)\n",
    "Y_test_all = problem(X_test_all)\n",
    "\n",
    "# Keep only the non-dominated samples as the reference (\"true\") Pareto front\n",
    "pareto_mask_test_all = is_non_dominated(Y_test_all)\n",
    "Y_true_pf = Y_test_all[pareto_mask_test_all]\n",
    "X_true_pf = X_test_all[pareto_mask_test_all]\n",
    "\n",
    "# Hypervolume dominated by the reference front w.r.t. the problem's reference point\n",
    "bd_test_all = DominatedPartitioning(ref_point=problem.ref_point, Y=Y_true_pf)\n",
    "volume_test_all = bd_test_all.compute_hypervolume().item()\n",
    "print(volume_test_all)\n",
    "\n",
    "X_save_path = 'X_true_pf'\n",
    "Y_save_path = 'Y_true_pf'\n",
    "# Save the tensors\n",
    "torch.save(X_true_pf, X_save_path)\n",
    "torch.save(Y_true_pf, Y_save_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dc1926d0",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "\n",
    "# Read the trial result files for indices 0-19, one (Y, X) pair per trial.\n",
    "# Within each pair the Y file is read before the X file.\n",
    "loaded_pairs = [\n",
    "    (\n",
    "        pd.read_csv(f\"data_y{trial}.csv\", header=None),\n",
    "        pd.read_csv(f\"data_x{trial}.csv\", header=None),\n",
    "    )\n",
    "    for trial in range(20)\n",
    "]\n",
    "\n",
    "# Split the pairs back into the two parallel lists used by later cells\n",
    "data_y = [y_frame for y_frame, _ in loaded_pairs]\n",
    "data_x = [x_frame for _, x_frame in loaded_pairs]\n",
    "\n",
    "# Show the first trial of each list as a quick sanity check\n",
    "for heading, frames in ((\"First Y dataset:\", data_y), (\"First X dataset:\", data_x)):\n",
    "    print(heading)\n",
    "    print(frames[0].values)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "54e443c0",
   "metadata": {},
   "outputs": [],
   "source": [
    "def compute_igd_torch(approx_front, true_front):\n",
    "    \"\"\"\n",
    "    Compute the Inverted Generational Distance (IGD) using PyTorch.\n",
    "\n",
    "    For every point of the true front, the Euclidean distance to its nearest\n",
    "    point in the approximate front is taken; the IGD is the mean of those\n",
    "    nearest-neighbour distances.\n",
    "\n",
    "    Parameters:\n",
    "    - approx_front: torch.Tensor (or array-like) of shape (N, M), representing N points in the M-dimensional approximate Pareto front.\n",
    "    - true_front: torch.Tensor (or array-like) of shape (T, M), representing T points in the M-dimensional true Pareto front.\n",
    "\n",
    "    Returns:\n",
    "    - igd: float, the Inverted Generational Distance (IGD) value.\n",
    "\n",
    "    Raises:\n",
    "    - ValueError: if either front is not 2-D, if either front is empty, or if\n",
    "      the two fronts do not have the same number of objectives M.\n",
    "    \"\"\"\n",
    "    approx_front = torch.as_tensor(approx_front)\n",
    "    true_front = torch.as_tensor(true_front)\n",
    "\n",
    "    if approx_front.ndim != 2 or true_front.ndim != 2:\n",
    "        raise ValueError(\n",
    "            \"approx_front and true_front must both be 2-D (points x objectives); \"\n",
    "            f\"got shapes {tuple(approx_front.shape)} and {tuple(true_front.shape)}\"\n",
    "        )\n",
    "    if approx_front.shape[0] == 0 or true_front.shape[0] == 0:\n",
    "        # IGD is undefined without at least one point on each side.\n",
    "        raise ValueError(\"approx_front and true_front must each contain at least one point\")\n",
    "    if approx_front.shape[1] != true_front.shape[1]:\n",
    "        raise ValueError(\n",
    "            \"approx_front and true_front must have the same number of objectives; \"\n",
    "            f\"got {approx_front.shape[1]} and {true_front.shape[1]}\"\n",
    "        )\n",
    "\n",
    "    # Bring both fronts to one floating dtype and one device so cdist accepts them.\n",
    "    common_dtype = torch.promote_types(approx_front.dtype, true_front.dtype)\n",
    "    if not common_dtype.is_floating_point:\n",
    "        common_dtype = torch.get_default_dtype()\n",
    "    true_front = true_front.to(dtype=common_dtype)\n",
    "    approx_front = approx_front.to(dtype=common_dtype, device=true_front.device)\n",
    "\n",
    "    # pairwise[t, n] = Euclidean distance between true point t and approximate point n.\n",
    "    # The exact (non-matmul) mode avoids the rounding error of the expanded-square formula.\n",
    "    pairwise = torch.cdist(\n",
    "        true_front, approx_front, p=2.0, compute_mode=\"donot_use_mm_for_euclid_dist\"\n",
    "    )\n",
    "\n",
    "    # Nearest approximate point for each true point, then the mean over the true front\n",
    "    nearest = pairwise.min(dim=1).values\n",
    "    return nearest.mean().item()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "3fe47bef",
   "metadata": {},
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'data_x' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[2], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m data_x \u001b[38;5;241m=\u001b[39m torch\u001b[38;5;241m.\u001b[39mtensor(np\u001b[38;5;241m.\u001b[39marray(\u001b[43mdata_x\u001b[49m))\n\u001b[1;32m      2\u001b[0m data_y \u001b[38;5;241m=\u001b[39m torch\u001b[38;5;241m.\u001b[39mtensor(np\u001b[38;5;241m.\u001b[39marray(data_y))\n\u001b[1;32m      3\u001b[0m all_true_igd \u001b[38;5;241m=\u001b[39m []\n",
      "\u001b[0;31mNameError\u001b[0m: name 'data_x' is not defined"
     ]
    }
   ],
   "source": [
    "# Stack the per-trial tables into (n_trials, n_points, n_columns) tensors.\n",
    "# New names are used so re-running this cell never feeds its own output back in.\n",
    "trials_x = torch.as_tensor(np.stack([np.asarray(trial) for trial in data_x]))\n",
    "# Match the dtype/device of the true front so distances can be computed directly.\n",
    "trials_y = torch.as_tensor(np.stack([np.asarray(trial) for trial in data_y])).to(Y_true_pf)\n",
    "\n",
    "igd_per_trial = []\n",
    "for trial_y in trials_y:  # the trial count comes from the data, not a literal\n",
    "    # dist[t, k] = Euclidean distance from true-front point t to the k-th evaluated point\n",
    "    dist = torch.cdist(Y_true_pf, trial_y, compute_mode=\"donot_use_mm_for_euclid_dist\")\n",
    "    # The running minimum over k is, for every prefix trial_y[:k + 1], the distance from\n",
    "    # each true-front point to its nearest evaluated point; averaging over t gives the\n",
    "    # IGD of that prefix. This equals calling compute_igd_torch on each prefix, without\n",
    "    # recomputing all distances for every prefix.\n",
    "    igd_per_trial.append(dist.cummin(dim=1).values.mean(dim=0))\n",
    "\n",
    "# Shape (n_trials, n_points); kept in the dtype of Y_true_pf instead of being\n",
    "# rebuilt from Python floats, which would downcast to float32.\n",
    "all_true_igd = torch.stack(igd_per_trial)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "ff4eb5b5",
   "metadata": {},
   "outputs": [
    {
     "ename": "NameError",
     "evalue": "name 'all_true_igd' is not defined",
     "output_type": "error",
     "traceback": [
      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
      "Cell \u001b[0;32mIn[3], line 4\u001b[0m\n\u001b[1;32m      1\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mmatplotlib\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m pyplot \u001b[38;5;28;01mas\u001b[39;00m plt\n\u001b[1;32m      3\u001b[0m \u001b[38;5;66;03m# Compute the mean and variance of hypervolumes across trials\u001b[39;00m\n\u001b[0;32m----> 4\u001b[0m mean_true_pf_igd_qehvi \u001b[38;5;241m=\u001b[39m torch\u001b[38;5;241m.\u001b[39mmean(\u001b[43mall_true_igd\u001b[49m, dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m0\u001b[39m)\n\u001b[1;32m      5\u001b[0m std_true_pf_igd_qehvi \u001b[38;5;241m=\u001b[39m torch\u001b[38;5;241m.\u001b[39mstd(all_true_igd, dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m0\u001b[39m)\n\u001b[1;32m      6\u001b[0m mean_save_path \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m'\u001b[39m\u001b[38;5;124mEHVI_igdmin_mean\u001b[39m\u001b[38;5;124m'\u001b[39m\n",
      "\u001b[0;31mNameError\u001b[0m: name 'all_true_igd' is not defined"
     ]
    }
   ],
   "source": [
    "from matplotlib import pyplot as plt\n",
    "\n",
    "# Mean and standard deviation of the IGD across trials, per number of evaluated points\n",
    "mean_true_pf_igd_qehvi = torch.mean(all_true_igd, dim=0)\n",
    "std_true_pf_igd_qehvi = torch.std(all_true_igd, dim=0)\n",
    "mean_save_path = 'EHVI_igdmin_mean'\n",
    "std_save_path = 'EHVI_igdmin_std'\n",
    "# Save the tensors\n",
    "torch.save(mean_true_pf_igd_qehvi, mean_save_path)\n",
    "torch.save(std_true_pf_igd_qehvi, std_save_path)\n",
    "\n",
    "# Compute upper and lower bounds for the plot (mean ± std)\n",
    "upper_bound = mean_true_pf_igd_qehvi + std_true_pf_igd_qehvi\n",
    "lower_bound = mean_true_pf_igd_qehvi - std_true_pf_igd_qehvi\n",
    "\n",
    "# Column k of all_true_igd is the IGD after the first k + 1 evaluated points,\n",
    "# so the x axis counts points starting at 1.\n",
    "x_vals = list(range(1, all_true_igd.shape[1] + 1))\n",
    "\n",
    "fig, ax = plt.subplots(figsize=(10, 6))\n",
    "\n",
    "# Plot mean IGD\n",
    "ax.plot(x_vals, mean_true_pf_igd_qehvi.cpu().numpy(), label=\"Mean IGD\", color='b', marker='o')\n",
    "\n",
    "# Fill between upper and lower bounds\n",
    "ax.fill_between(x_vals, lower_bound.cpu().numpy(), upper_bound.cpu().numpy(),\n",
    "                color='blue', alpha=0.2, label=\"Mean ± 1 Std Dev\")\n",
    "\n",
    "# Labels and title (the plotted metric is IGD, not hypervolume)\n",
    "ax.set_xlabel('Number of evaluated points')\n",
    "ax.set_ylabel('IGD')\n",
    "ax.set_title('Mean IGD with ±1 Std Dev Band Across Trials')\n",
    "ax.legend()\n",
    "ax.grid(True)\n",
    "\n",
    "# Save before showing: once plt.show() has run, a later savefig writes a blank figure.\n",
    "fig.savefig(\"EHVI GMM.png\", dpi=300)\n",
    "plt.show()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "c26d5c11",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
