{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Bayesian optimization for Random Heteropolypeptides\n",
    "The Botorch and Ax were developed by Meta Platform Inc. and is available at https://botorch.org and https://ax.dev.  \n",
    "The version of the key Python packages are:\n",
    "- Python: 3.8.8  \n",
    "- Torch: 1.9.0 + cu111  \n",
    "- gpytorch: 1.6.0  \n",
    "- Botorch: 0.5.1  \n",
    "- Ax: 0.2.2   \n",
    "  \n",
    "Beyasian optimization (BO) was performed on a Lenovo Legion R9000k laptop with AMD Ryzen 9 5900HX CPU and NVDIA GeForce RTX 3080 Laptop GPU (16GB). \n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 1. Import required modules"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "from botorch.models.gpytorch import GPyTorchModel\n",
    "from gpytorch.distributions import MultivariateNormal\n",
    "from botorch.acquisition.acquisition import AcquisitionFunction\n",
    "from gpytorch.means import ConstantMean\n",
    "from gpytorch.models import ExactGP\n",
    "from gpytorch.kernels import RBFKernel, ScaleKernel, MaternKernel\n",
    "from gpytorch.likelihoods import GaussianLikelihood\n",
    "from gpytorch.mlls import ExactMarginalLogLikelihood\n",
    "import torch\n",
    "import random\n",
    "from torch.optim.lr_scheduler import ExponentialLR\n",
    "from sklearn.model_selection import train_test_split\n",
    "from ax.modelbridge.factory import get_botorch\n",
    "from botorch.optim.optimize import optimize_acqf\n",
    "from ax import SimpleExperiment, Arm\n",
    "from ax.models.torch.botorch_defaults import _get_acquisition_func\n",
    "from typing import Tuple\n",
    "from ax import (\n",
    "    ParameterType,\n",
    "    RangeParameter,\n",
    "    SearchSpace,\n",
    "    SumConstraint,\n",
    ")\n",
    "from ax.core.generator_run import GeneratorRun\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import csv"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 2. Set the functions for BO"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Set the random seeds for the repeatability"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "def setup_seed(seed):\n",
    "    #Setup the random seed for repeatibility\n",
    "    torch.manual_seed(seed)\n",
    "    torch.cuda.manual_seed_all(seed)\n",
    "    np.random.seed(seed)\n",
    "    torch.cuda.manual_seed(seed)\n",
    "    random.seed(seed)\n",
    "    torch.backends.cudnn.deterministic = True"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Implement a custom gpytorch ExactGP model that allows to choose within RBF, Matern-0.5, Matern-1.5 and Matern-2.5"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "class SimpleCustomGP(ExactGP, GPyTorchModel):\n",
    "\n",
    "    _num_outputs = 1  # to inform GPyTorchModel API\n",
    "    def __init__(self, train_X, train_Y, Kernel):\n",
    "        \"\"\"\n",
    "        Args:\n",
    "        train_X (torch.Tensor) : training examples.\n",
    "        train_Y (torch.Tensor) : testing examples.\n",
    "        Kernel (string) : GP kernel.\n",
    "        \"\"\"\n",
    "        # squeeze output dim before passing train_Y to ExactGP\n",
    "        super().__init__(train_X, train_Y.squeeze(-1), GaussianLikelihood())\n",
    "        self.mean_module = ConstantMean()\n",
    "        if (Kernel == 'RBF'):\n",
    "            self.covar_module = ScaleKernel(\n",
    "                base_kernel = RBFKernel(),\n",
    "                )\n",
    "        elif (Kernel == 'Matern-0.5'):\n",
    "            self.covar_module = ScaleKernel(\n",
    "                base_kernel = MaternKernel(nu=0.5),\n",
    "                )\n",
    "        elif (Kernel == 'Matern-1.5'):\n",
    "            self.covar_module = ScaleKernel(\n",
    "                base_kernel = MaternKernel(nu=1.5),\n",
    "                )\n",
    "        elif (Kernel == 'Matern-2.5'):\n",
    "            self.covar_module = ScaleKernel(\n",
    "                base_kernel = MaternKernel(nu=2.5),\n",
    "                )\n",
    "        else:\n",
    "            print('Specify a valid Kernel.')\n",
    "        self.to(train_X)  \n",
    "\n",
    "    def forward(self, x):\n",
    "        mean_x = self.mean_module(x)\n",
    "        covar_x = self.covar_module(x)\n",
    "        return MultivariateNormal(mean_x, covar_x)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Build a model_constructor that instantiates and fits a model on data and optimize the parameters with RMSprop"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "def _get_and_fit_model(Xs, Ys, **kwargs):\n",
    "    \"\"\"\n",
    "    Args:\n",
    "    Xs (torch.Tensor) : training examples.\n",
    "    Ys (torch.Tensor) : testing examples.\n",
    "    \"\"\"\n",
    "    global TrainingSummary, best_loss, best_kernel\n",
    "    \n",
    "    setup_seed(Seed)\n",
    "    iteration = Iteration\n",
    "    RandomStates = Randomstates\n",
    "    train_X, test_X, train_Y, test_Y = train_test_split(\n",
    "        Xs[0], Ys[0].squeeze(1), \n",
    "        test_size=0.2, train_size=0.8, \n",
    "        random_state=40)\n",
    "    best_test_loss, best_train_loss = 0, 0\n",
    "    #choices: 'RBF','Matern-0.5','Matern-1.5','Matern-2.5'\n",
    "    for kernel in ['RBF', 'Matern-0.5', 'Matern-1.5', 'Matern-2.5']:\n",
    "\n",
    "        model = SimpleCustomGP(train_X=train_X, train_Y=train_Y, Kernel=kernel)\n",
    "\n",
    "        for i in range(RandomStates):\n",
    "            # Randomly initiate the parameters\n",
    "            hypers = {\n",
    "                'likelihood.noise_covar.noise':torch.rand(1).cuda()*5,\n",
    "                'covar_module.base_kernel.lengthscale': torch.rand(1).cuda()+0.05,\n",
    "                'covar_module.outputscale': torch.rand(1).cuda()*5,\n",
    "                'mean_module.constant': torch.tensor(0).cuda()\n",
    "            }\n",
    "            # Perform the optimization\n",
    "            model.initialize(**hypers)\n",
    "            mll = ExactMarginalLogLikelihood(model.likelihood, model).to(train_X)\n",
    "            optimizer = torch.optim.RMSprop([{'params': model.parameters()}], lr=LearningRate)\n",
    "            scheduler = ExponentialLR(optimizer, gamma=0.7) \n",
    "\n",
    "            for epoch in range(iteration):\n",
    "                model.train()\n",
    "                optimizer.zero_grad()\n",
    "                output_train = model(train_X)\n",
    "                loss_on_train = -mll(output_train, model.train_targets)\n",
    "                loss_on_train.backward()\n",
    "\n",
    "                if (epoch + 1) % 10 == 0:\n",
    "                    model.eval()\n",
    "                    output_test = model(test_X)\n",
    "                    loss_on_test = -mll(output_test, test_Y)\n",
    "                    #pick the best model based on the cost function of test set\n",
    "                    if (best_loss > loss_on_test):\n",
    "                        best_loss = loss_on_test\n",
    "                        torch.save(model.state_dict(), 'best_model_state.pth')\n",
    "                        best_test_loss = loss_on_test.item()\n",
    "                        best_train_loss = loss_on_train.item()\n",
    "                        best_kernel = kernel\n",
    "                optimizer.step()\n",
    "                scheduler.step()\n",
    "    # After parameter optimization, return the best model\n",
    "    state_dict = torch.load('best_model_state.pth')\n",
    "    model_final = SimpleCustomGP(train_X, train_Y, best_kernel)\n",
    "    model_final.load_state_dict(state_dict)\n",
    "    print('Done!')\n",
    "    # Append the optimization results to a global sheet for output\n",
    "    TrainingResults = pd.DataFrame(\n",
    "        {\n",
    "        'Random Seed': Seed,\n",
    "        'Learning Rate': LearningRate,\n",
    "        'Best Kernel': best_kernel,\n",
    "        'Length Scale': model_final.covar_module.base_kernel.lengthscale.item(),\n",
    "        'Noise': model_final.likelihood.noise.item(),\n",
    "        'Output Scale': model_final.covar_module.outputscale.item(),\n",
    "        'Best Loss': best_loss.cpu().detach().numpy()\n",
    "         },\n",
    "         index = [0]\n",
    "    )\n",
    "    TrainingSummary = pd.concat([TrainingSummary, TrainingResults], ignore_index = True)\n",
    "    return model_final"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Build acqf_constructor that creates an acquisition function from a fitted model  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_aquisition(\n",
    "    model,\n",
    "    objective_weights,\n",
    "    outcome_constraints=None,\n",
    "    X_observed=None,\n",
    "    X_pending=None,\n",
    "    **kwargs,\n",
    ")-> AcquisitionFunction:\n",
    "    objective_weights.to(device=device)\n",
    "    \n",
    "    r\"\"\"Instantiates an acquisition function.\n",
    "    choices: \n",
    "    \"qEI\":qExpectedImprovement\n",
    "    \"qPI\"：qProbabilityOfImprovement\n",
    "    \"qNEI\":qNoisyExpectedImprovement\n",
    "    \"qSR\":qSimpleRegret\n",
    "    \"qUCB\":qUpperConfidenceBound\n",
    "    \"qEHVI\":qExpectedHypervolumeImprovement\n",
    "    \"qNEHVI\":qNoisyExpectedHypervolumeImprovement\n",
    "    \"\"\"\n",
    "    setup_seed(Seed)\n",
    "    return _get_acquisition_func(\n",
    "        model=model,\n",
    "        acquisition_function_name=acqf_func,\n",
    "        objective_weights=objective_weights,\n",
    "        outcome_constraints=outcome_constraints,\n",
    "        X_observed=X_observed,\n",
    "        X_pending=X_pending,\n",
    "        **kwargs,\n",
    "    )"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Build an optimizer that optimizes the acquisition function"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [],
   "source": [
    "def optimize_aquisition(\n",
    "    acq_function,\n",
    "    bounds:torch.tensor,\n",
    "    n,\n",
    "    inequality_constraints=None,\n",
    "    equality_constraints=None,\n",
    "    fixed_features=None,\n",
    "    rounding_func=None,\n",
    "    **kwargs,\n",
    ")-> Tuple:\n",
    "    r\"\"\"Optimize an acquisition function.\n",
    "    \"\"\"\n",
    "    setup_seed(Seed)\n",
    "    return optimize_acqf(\n",
    "        acq_function=acq_function,\n",
    "        bounds=bounds,\n",
    "        q=n,\n",
    "        num_restarts=RestartNumber,\n",
    "        raw_samples=RawsampleNumber,\n",
    "        options=kwargs,\n",
    "        inequality_constraints=inequality_constraints,\n",
    "        equality_constraints=equality_constraints,\n",
    "        fixed_features=fixed_features,\n",
    "        sequential=False,\n",
    "        post_processing_func=rounding_func,\n",
    "    )"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Define a custom metric that could get the activity of the RHP from the RawData array"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [],
   "source": [
    "##Define a data_fetching function\n",
    "def GPx_datafetching(parameterization, *args):\n",
    "    '''\n",
    "    parameterization (pandas.DataFrame): \n",
    "    '''\n",
    "    global RawData\n",
    "    x=np.array([parameterization[f'x{i+1}'] for i in range(FeatureNumber)])\n",
    "    for i in range(RawData.shape[0]):\n",
    "        if ((RawData[i, :FeatureNumber] == x).all()) and (RawData[i, FeatureNumber+1] == 0):\n",
    "            # Label the fetched data, would be useful for experiments with replicated RHPs\n",
    "            RawData[i, FeatureNumber+1] = 1\n",
    "            # return (mean, standard error)\n",
    "            return {\"GPx\": (RawData[i, FeatureNumber], 0.0)}\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Print the RHPs that are chosen by the model with predicted activities"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "def prediction_result_output(candidates)->pd.DataFrame:\n",
    "\n",
    "    output=candidates.param_df.round(4)\n",
    "    prediction = pd.DataFrame(candidates.model_predictions_by_arm)\n",
    "    prediction = prediction.transpose()\n",
    "    mean_list = []\n",
    "    covar_list = []\n",
    "    # Match the signature with the mean and covar\n",
    "    for i in range(prediction.index.__len__()):\n",
    "        prediction[0][i] = prediction[0][i]['GPx']\n",
    "        prediction[1][i] = prediction[1][i]['GPx']['GPx']\n",
    "        if (output.index[i] in prediction.index[i]):\n",
    "            mean_list.append(prediction.iloc[i, 0])\n",
    "            covar_list.append(prediction.iloc[i, 1])\n",
    "    output['Predict_Mean'] = mean_list\n",
    "    output['Predict_Covar'] = covar_list\n",
    "    return output"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "Transform the chosen RHP compositions to csv file that is used to control the Janus workstation for liquid handling.  \n",
    "The first 13 wells were used for contorl experiments."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "##Transfer the prediction to Janus adding file\n",
    "def Janus_print(c,path):\n",
    "    \n",
    "    TotalVolume = 60    # Total volume of the organohalides in each well\n",
    "    RawMatrix = c.param_df.to_numpy()   \n",
    "    SaveAddMatrix = np.zeros([96, FeatureNumber])\n",
    "    AddMatrix = RawMatrix * TotalVolume # Transfer the RHPs composition to the volume of organohalides that should be added to each well\n",
    "    AddMatrix = np.round(AddMatrix, 1)\n",
    "    n=0\n",
    "    for i in range(6, 6+FeatureNumber):\n",
    "        SaveAddMatrix[i,n] = TotalVolume\n",
    "        n=n+1\n",
    "    for i in range(SaveAddMatrix.shape[0] - FeatureNumber - 6):\n",
    "        SaveAddMatrix[i+FeatureNumber+6,] = AddMatrix[i, ]\n",
    "    np.savetxt(RawMatrixPath, SaveAddMatrix, fmt = (\n",
    "        '%1.1f', '%1.1f', '%1.1f', '%1.1f', '%1.1f', '%1.1f', '%1.1f'\n",
    "        ), delimiter=',')\n",
    "    janus = open(path, 'w', newline='')\n",
    "    janusCreater = csv.writer(janus)\n",
    "    for r in range(SaveAddMatrix.shape[0]):\n",
    "        for c in range(SaveAddMatrix.shape[1]):\n",
    "            volume = SaveAddMatrix[r, c]\n",
    "            imputCSV = ['Source', c+1, 'Dest', r+1, volume]\n",
    "            janusCreater.writerow(imputCSV)\n",
    "    janus.close()\n",
    "    return"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 3. Setup the parameters for BO"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "FeatureNumber = 7   # Number of features in the study, in this paper it is 7.\n",
    "device = torch.device(\"cuda\")   # Device on which to perform the optimization\n",
    "\n",
    "# Initiate an Summary Table to record the optimization of Gaussian Process (GP) model\n",
    "pd.set_option('display.max_columns', None)\n",
    "TrainingSummary = pd.DataFrame(columns = ('Random Seed', 'Learning Rate', 'Best Kernel', 'Length Scale', 'Noise', 'Output Scale'))\n",
    "\n",
    "# Initiate the parameters for GP optimization\n",
    "best_loss = 10\n",
    "best_kernel = 'RBF'\n",
    "Iteration = 30 # Iteration number for GP hypermater optimization\n",
    "Randomstates = 50 # Number of restart during optimization of the GP model parameter\n",
    "\n",
    "# AF parameters\n",
    "acqf_func = 'qNEI' # Acquisition function (AF). See get_acquisition for choices\n",
    "RestartNumber = 5   # Number of restarts for acquisition function optimization\n",
    "RawsampleNumber = 100   # Number of samples used for initializing the acquisition function optimization\n",
    "\n",
    "# Output setting\n",
    "RawMatrixPath = 'Predict_volume.csv'    # Path for the csv file with volume of organohalides solution for each RHP\n",
    "PredictionPath = \"Predict_RHP_activity.csv\"   # Path for the csv file with composition of predicted RHPs and their predicted GPx-like activity\n",
    "JanusPath = 'JanusAddingFile_next_round.csv'          # Path for the file that control the Janus workstation"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Define the search space\n",
    "GPx_search_space = SearchSpace(\n",
    "    parameters=[\n",
    "        RangeParameter(\n",
    "            name='x1', parameter_type=ParameterType.FLOAT, lower=0.0, upper=1.0\n",
    "        ),\n",
    "        RangeParameter(\n",
    "            name='x2', parameter_type=ParameterType.FLOAT, lower=0.0, upper=1.0\n",
    "        ),\n",
    "        RangeParameter(\n",
    "            name='x3', parameter_type=ParameterType.FLOAT, lower=0.0, upper=1.0\n",
    "        ),\n",
    "        RangeParameter(\n",
    "            name='x4', parameter_type=ParameterType.FLOAT, lower=0.0, upper=1.0\n",
    "        ),\n",
    "        RangeParameter(\n",
    "            name='x5', parameter_type=ParameterType.FLOAT, lower=0.0, upper=1.0\n",
    "        ),\n",
    "        RangeParameter(\n",
    "            name='x6', parameter_type=ParameterType.FLOAT, lower=0.0, upper=0.5\n",
    "        ),\n",
    "        RangeParameter(\n",
    "            name='x7', parameter_type=ParameterType.FLOAT, lower=0.0, upper=1.0\n",
    "        )\n",
    "    ]\n",
    ")\n",
    "# Set sum constraints on the search space \n",
    "sum_constraint_upper = SumConstraint(\n",
    "    parameters = [GPx_search_space.parameters[f'x{i+1}'] for i in range(FeatureNumber)],\n",
    "    is_upper_bound = True,\n",
    "    bound = 1.001,\n",
    ")\n",
    "sum_constraint_lower = SumConstraint(\n",
    "    parameters = [GPx_search_space.parameters[f'x{i+1}'] for i in range(FeatureNumber)],\n",
    "    is_upper_bound = False,\n",
    "    bound = 0.999,\n",
    ")\n",
    "GPx_search_space.add_parameter_constraints([sum_constraint_upper])\n",
    "GPx_search_space.add_parameter_constraints([sum_constraint_lower])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 4. BO"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "exp = SimpleExperiment(\n",
    "    name = \"GPx_optimization\",\n",
    "    search_space = GPx_search_space,\n",
    "    evaluation_function = GPx_datafetching,\n",
    "    objective_name = \"GPx\",\n",
    "    minimize = False,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Fetching Repeated data...\n"
     ]
    }
   ],
   "source": [
    "# Read the data from csv file\n",
    "'''\n",
    "DomainPath is the path where the experimental results is stored. \n",
    "The first 7 rows are the mole fraction of the modifiers\n",
    "The last rows is the activity of the coresponding RHP\n",
    "'''\n",
    "DomainPath = 'ExperimentData.csv' \n",
    "f = open(DomainPath, 'r')\n",
    "RawData = np.genfromtxt(f, delimiter=\",\")\n",
    "y0 = np.zeros([RawData.shape[0]])   # add an additional column to label the chosen data\n",
    "RawData = np.c_[RawData, y0]\n",
    "\n",
    "#Fetching Data\n",
    "b = []\n",
    "print('Fetching Repeated data...')\n",
    "for i in range(RawData.shape[0]):\n",
    "    a = [Arm(parameters = {\n",
    "        \"x1\" : RawData[i,0], \n",
    "        \"x2\" : RawData[i,1],\n",
    "        \"x3\" : RawData[i,2],\n",
    "        \"x4\" : RawData[i,3],\n",
    "        \"x5\" : RawData[i,4],\n",
    "        \"x6\" : RawData[i,5],\n",
    "        \"x7\" : RawData[i,6]\n",
    "        }\n",
    "        )]\n",
    "    b = b+a\n",
    "\n",
    "gr = GeneratorRun(b)\n",
    "trial = exp.new_batch_trial(generator_run=gr)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Running optimization...\n",
      "Running  1/30 training\n",
      "Done!\n",
      "Running  2/30 training\n",
      "Done!\n",
      "Running  3/30 training\n",
      "Done!\n",
      "Running  4/30 training\n",
      "Done!\n",
      "Running  5/30 training\n",
      "Done!\n",
      "Running  6/30 training\n",
      "Done!\n",
      "Running  7/30 training\n",
      "Done!\n",
      "Running  8/30 training\n",
      "Done!\n",
      "Running  9/30 training\n",
      "Done!\n",
      "Running 10/30 training\n",
      "Done!\n",
      "Running 11/30 training\n",
      "Done!\n",
      "Running 12/30 training\n",
      "Done!\n",
      "Running 13/30 training\n",
      "Done!\n",
      "Running 14/30 training\n",
      "Done!\n",
      "Running 15/30 training\n",
      "Done!\n",
      "Running 16/30 training\n",
      "Done!\n",
      "Running 17/30 training\n",
      "Done!\n",
      "Running 18/30 training\n",
      "Done!\n",
      "Running 19/30 training\n",
      "Done!\n",
      "Running 20/30 training\n",
      "Done!\n",
      "Running 21/30 training\n",
      "Done!\n",
      "Running 22/30 training\n",
      "Done!\n",
      "Running 23/30 training\n",
      "Done!\n",
      "Running 24/30 training\n",
      "Done!\n",
      "Running 25/30 training\n",
      "Done!\n",
      "Running 26/30 training\n",
      "Done!\n",
      "Running 27/30 training\n",
      "Done!\n",
      "Running 28/30 training\n",
      "Done!\n",
      "Running 29/30 training\n",
      "Done!\n",
      "Running 30/30 training\n",
      "Done!\n",
      "   Random Seed  Learning Rate Best Kernel  Length Scale     Noise  \\\n",
      "0           12           0.01  Matern-2.5      0.858844  0.174173   \n",
      "1           12           0.02  Matern-2.5      0.858844  0.174173   \n",
      "2           12           0.20  Matern-2.5      0.910820  0.211767   \n",
      "3            3           0.01         RBF      0.443164  0.161654   \n",
      "4            3           0.02         RBF      0.356502  0.199423   \n",
      "5            3           0.20         RBF      0.356502  0.199423   \n",
      "6            5           0.01  Matern-2.5      0.870372  0.202475   \n",
      "7            5           0.02  Matern-2.5      0.870372  0.202475   \n",
      "8            5           0.20  Matern-2.5      0.870372  0.202475   \n",
      "9           78           0.01  Matern-2.5      0.870372  0.202475   \n",
      "10          78           0.02  Matern-2.5      0.870372  0.202475   \n",
      "11          78           0.20  Matern-2.5      0.870372  0.202475   \n",
      "12          49           0.01  Matern-2.5      0.870372  0.202475   \n",
      "13          49           0.02  Matern-2.5      0.870372  0.202475   \n",
      "14          49           0.20  Matern-2.5      0.870372  0.202475   \n",
      "15          44           0.01  Matern-2.5      0.870372  0.202475   \n",
      "16          44           0.02  Matern-2.5      0.870372  0.202475   \n",
      "17          44           0.20  Matern-2.5      0.870372  0.202475   \n",
      "18          55           0.01  Matern-2.5      0.870372  0.202475   \n",
      "19          55           0.02  Matern-2.5      0.870372  0.202475   \n",
      "20          55           0.20  Matern-2.5      0.870372  0.202475   \n",
      "21          81           0.01  Matern-2.5      0.870372  0.202475   \n",
      "22          81           0.02  Matern-2.5      0.870372  0.202475   \n",
      "23          81           0.20  Matern-2.5      0.870372  0.202475   \n",
      "24          91           0.01  Matern-2.5      0.870372  0.202475   \n",
      "25          91           0.02  Matern-2.5      0.870372  0.202475   \n",
      "26          91           0.20  Matern-2.5      0.870372  0.202475   \n",
      "27          47           0.01  Matern-2.5      0.870372  0.202475   \n",
      "28          47           0.02  Matern-2.5      0.870372  0.202475   \n",
      "29          47           0.20  Matern-2.5      0.870372  0.202475   \n",
      "\n",
      "    Output Scale  Best Loss  \n",
      "0       2.777409   0.680956  \n",
      "1       2.777409   0.680956  \n",
      "2       2.423419   0.664609  \n",
      "3       0.359401   0.648876  \n",
      "4       0.133799   0.646927  \n",
      "5       0.133799   0.646927  \n",
      "6       1.100514   0.646384  \n",
      "7       1.100514   0.646384  \n",
      "8       1.100514   0.646384  \n",
      "9       1.100514   0.646384  \n",
      "10      1.100514   0.646384  \n",
      "11      1.100514   0.646384  \n",
      "12      1.100514   0.646384  \n",
      "13      1.100514   0.646384  \n",
      "14      1.100514   0.646384  \n",
      "15      1.100514   0.646384  \n",
      "16      1.100514   0.646384  \n",
      "17      1.100514   0.646384  \n",
      "18      1.100514   0.646384  \n",
      "19      1.100514   0.646384  \n",
      "20      1.100514   0.646384  \n",
      "21      1.100514   0.646384  \n",
      "22      1.100514   0.646384  \n",
      "23      1.100514   0.646384  \n",
      "24      1.100514   0.646384  \n",
      "25      1.100514   0.646384  \n",
      "26      1.100514   0.646384  \n",
      "27      1.100514   0.646384  \n",
      "28      1.100514   0.646384  \n",
      "29      1.100514   0.646384  \n"
     ]
    }
   ],
   "source": [
    "print(\"Running optimization...\")\n",
    "# The model is trained on 10 random seeds with 3 different learning rate\n",
    "# The model with the lowest cost function on test set was chosen\n",
    "n = 0\n",
    "for i in [12, 3, 5, 78, 49, 44, 55, 81, 91, 47]:\n",
    "    '''[12, 3, 5, 78, 49, 44, 55, 81, 91, 47]'''\n",
    "    Seed = i\n",
    "    for j in [0.01, 0.02, 0.2]:\n",
    "        LearningRate = j\n",
    "        n = n+1\n",
    "        print(f\"Running {n:>2}/30 training\")\n",
    "        model = get_botorch(\n",
    "                    experiment=exp,\n",
    "                    data=exp.eval(),\n",
    "                    search_space=exp.search_space,\n",
    "                    model_constructor=_get_and_fit_model,\n",
    "                    acqf_constructor=get_aquisition,\n",
    "                    acqf_optimizer=optimize_aquisition,\n",
    "                    device=torch.device(\"cuda\"),\n",
    "                )"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(TrainingSummary)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Generate the candidate RHPs for next round\n",
    "c = model.gen(83)\n",
    "output = prediction_result_output(c)\n",
    "output.to_csv(PredictionPath,index=False,sep=',')\n",
    "Janus_print(c, JanusPath)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3.10.4 ('GPxnewAx')",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.4"
  },
  "orig_nbformat": 4,
  "vscode": {
   "interpreter": {
    "hash": "f174b701d96cf54e99d9c29899846cad1923d2912ed16485ddc762ad2a2656e8"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
