{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "11c007f2",
   "metadata": {},
   "outputs": [],
   "source": [
    "import openai\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "# Set your API key\n",
    "openai.api_key = 'API KEY'\n",
    "from tqdm import tqdm\n",
    "import GPy\n",
    "import re\n",
    "import copy\n",
    "import math\n",
    "import concurrent.futures"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "3797608e",
   "metadata": {},
   "outputs": [],
   "source": [
    "%run optimize.py\n",
    "%run make_prompt.py\n",
    "%run synthetic_reward_function.py\n",
    "%run get_response.py"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "ea6bc8f2",
   "metadata": {},
   "outputs": [],
   "source": [
    "def LLM_for_bandits_oracle(random_seed, d, K, N_init, num_iter, noise_intensity, delta):\n",
    "    \n",
    "    rewards = []\n",
    "    rewards_2 = []\n",
    "\n",
    "    all_xx = []\n",
    "    all_f = []\n",
    "    all_theta = []\n",
    "    all_x_init = []\n",
    "    all_y_init = []\n",
    "\n",
    "    X, Y = [], []\n",
    "    \n",
    "    np.random.seed(random_seed)\n",
    "    \n",
    "    # Generate features and rewards\n",
    "    # xx, f, theta = generate_xx_f_linear(d, K) \n",
    "    # xx, f, theta = generate_xx_f_square(d, K) \n",
    "    xx, f, theta = generate_xx_f_sin(d, K) \n",
    "    # xx, f = generate_xx_f_GP(d, K) \n",
    "    \n",
    "    all_xx.append(xx)\n",
    "    all_f.append(f)\n",
    "    # all_theta.append(theta)\n",
    "\n",
    "    # We first randomly select some arms\n",
    "    for i in range(N_init): \n",
    "        np.random.seed(random_seed + i)\n",
    "        init_idx = np.random.choice(np.arange(xx.shape[0]))  # Randomly select a row index\n",
    "        init = xx[init_idx, :]  # Select this row (corresponding to a specific arm)\n",
    "        X.append(init)  # Add to X\n",
    "        y_init = f[init_idx] + np.random.normal(0, np.sqrt(noise_intensity))  # Reward corresponding to X (with Gaussian noise)\n",
    "        y_init = round(y_init, 4)  # Keep four decimal places\n",
    "        Y.append(y_init) \n",
    "        print(\"x_init: \", init)\n",
    "        print(\"y_init: \", y_init)\n",
    "        all_x_init.append(init)\n",
    "        all_y_init.append(y_init)\n",
    "        rewards.append(f[init_idx])\n",
    "        \n",
    "    np.random.seed(random_seed)\n",
    "    \n",
    "    X = np.squeeze(X) \n",
    "    X = np.array(X)\n",
    "    Y = np.array(Y)\n",
    "    \n",
    "    # Iteration\n",
    "    rewards_2 = optimize_randomsearch(num_iter, xx, f, noise_intensity, K)\n",
    "    # rewards_2 = optimize_experiment(X, Y, K, num_iter, xx, f, noise_intensity, delta)\n",
    "    \n",
    "    rewards = np.array(rewards)\n",
    "    rewards_2 = np.array(rewards_2)\n",
    "    rewards = np.concatenate([rewards, rewards_2])\n",
    "    \n",
    "    return rewards, all_xx, all_f, all_theta, all_x_init, all_y_init"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e57bc3ed",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Parameters: random seed, feature dimension, number of arms, initial sample size, \n",
    "# number of iterations during sampling, Gaussian noise variance during sampling, \n",
    "# confidence level delta controlling high-probability regret bound\n",
    "\n",
    "# rewards, all_xx, all_f, all_theta, all_x_init, all_y_init = LLM_for_bandits_oracle()\n",
    "\n",
    "# Use ThreadPoolExecutor to execute threads\n",
    "gpt_model = \"gpt-3.5-turbo\"\n",
    "with concurrent.futures.ThreadPoolExecutor() as executor:\n",
    "    future1 = executor.submit(LLM_for_bandits_oracle, 41, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future2 = executor.submit(LLM_for_bandits_oracle, 42, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future3 = executor.submit(LLM_for_bandits_oracle, 43, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future4 = executor.submit(LLM_for_bandits_oracle, 44, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future5 = executor.submit(LLM_for_bandits_oracle, 45, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future6 = executor.submit(LLM_for_bandits_oracle, 46, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future7 = executor.submit(LLM_for_bandits_oracle, 47, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future8 = executor.submit(LLM_for_bandits_oracle, 48, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future9 = executor.submit(LLM_for_bandits_oracle, 49, 4, 16, 2, 98, 0.02, 0.05)\n",
    "    future0 = executor.submit(LLM_for_bandits_oracle, 50, 4, 16, 2, 98, 0.02, 0.05)\n",
    "\n",
    "    # Retrieve return values from the threads\n",
    "    result1 = future1.result()\n",
    "    result2 = future2.result()\n",
    "    result3 = future3.result()\n",
    "    result4 = future4.result()\n",
    "    result5 = future5.result()\n",
    "    result6 = future6.result()\n",
    "    result7 = future7.result()\n",
    "    result8 = future8.result()\n",
    "    result9 = future9.result()\n",
    "    result0 = future0.result()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
