{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "005fc085",
   "metadata": {},
   "outputs": [],
   "source": [
    "import openai\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "# Set your API key\n",
    "openai.api_key = 'API KEY'\n",
    "from tqdm import tqdm\n",
    "import math\n",
    "import concurrent.futures\n",
    "import copy\n",
    "import GPy"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "da06b5e9",
   "metadata": {},
   "outputs": [],
   "source": [
    "%run optimize.py\n",
    "%run make_prompt.py\n",
    "%run synthetic_reward_function.py\n",
    "%run get_response.py"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "914d97af",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Global Variables\n",
    "\n",
    "gpt_model = \"gpt-3.5-turbo\"\n",
    "\n",
    "using_difference = False  # True: use the difference of features; False: use feature concatenation\n",
    "\n",
    "f_type = 2  # Reward function type: 1: linear, 2: square, 3: sine, 4: Gaussian Process (GP)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "68a49837",
   "metadata": {},
   "outputs": [],
   "source": [
    "def LLM_for_dueling_bandits(random_seed, d, K, N_repeat_arm_1, N_init, num_iter, noise_intensity):\n",
    "    \n",
    "    rewards = []\n",
    "    rewards_2 = []\n",
    "    X, Y = [], []\n",
    "    \n",
    "    np.random.seed(random_seed)\n",
    "    \n",
    "    xx, theta = generate_xx_theta(d, K)\n",
    "\n",
    "    # We first randomly select some arms\n",
    "    for i in range(N_init):\n",
    "        np.random.seed(random_seed + i)\n",
    "        x_init = xx[np.random.choice(xx.shape[0], 2, replace=False), :]\n",
    "\n",
    "        if using_difference:\n",
    "            feature_diff = np.asarray([x_init[0] - x_init[1]])  # Compute the feature difference between two arms\n",
    "            X.append(feature_diff)\n",
    "        else:\n",
    "            concatenated_feature = np.concatenate((x_init[0], x_init[1]))\n",
    "            X.append(concatenated_feature)\n",
    "        y_init = observe_duel(xx, x_init[0], x_init[1], theta, noise_intensity, d)\n",
    "        Y.append(y_init)\n",
    "        rewards.append([compute_f(xx, x_init[0], theta, d), compute_f(xx, x_init[1], theta, d)])\n",
    "    \n",
    "    np.random.seed(None)\n",
    "    \n",
    "    X = np.squeeze(X) \n",
    "    X = np.array(X)\n",
    "    Y = np.array(Y)\n",
    "    \n",
    "    # Choose iteration method\n",
    "    # rewards_2 = optimize_experiment(X, Y, N_repeat_arm_1, xx, theta, num_iter, noise_intensity, d)\n",
    "    rewards_2 = random_search(X, Y, xx, theta, num_iter, noise_intensity, d)\n",
    "    \n",
    "    rewards = np.vstack((rewards, rewards_2))\n",
    "\n",
    "    return rewards, xx, theta, x_init, y_init"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4bd9f00b",
   "metadata": {},
   "outputs": [],
   "source": [
    "with concurrent.futures.ThreadPoolExecutor() as executor:\n",
    "    # Function, random seed, feature dimension, number of arms, number of times to randomly select arms in the acquisition function,\n",
    "    # number of initial acquisitions, number of subsequent iterations, noise variance\n",
    "    future1 = executor.submit(LLM_for_dueling_bandits, 41, 4, 16, 5, 2, 148, 0)\n",
    "    future2 = executor.submit(LLM_for_dueling_bandits, 42, 4, 16, 5, 2, 148, 0)\n",
    "    future3 = executor.submit(LLM_for_dueling_bandits, 43, 4, 16, 5, 2, 148, 0)\n",
    "    future4 = executor.submit(LLM_for_dueling_bandits, 44, 4, 16, 5, 2, 148, 0)\n",
    "    future5 = executor.submit(LLM_for_dueling_bandits, 45, 4, 16, 5, 2, 148, 0)\n",
    "\n",
    "    # Retrieve the return values from the threads\n",
    "    result1 = future1.result()\n",
    "    result2 = future2.result()\n",
    "    result3 = future3.result()\n",
    "    result4 = future4.result()\n",
    "    result5 = future5.result()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
