{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0e8d57b4-5022-42f5-8be9-389dacf8a5fd",
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "\n",
    "import pickle \n",
    "import torch\n",
    "import importlib\n",
    "import os\n",
    "\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "\n",
    "from envs import darkroom_env\n",
    "from tqdm.notebook import tqdm\n",
    "\n",
    "from utils import build_darkroom_data_filename\n",
    "from darkroom_data_generation import generate_darkroom_pref_histories"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "af1843ce-fe57-4e4d-8e90-84ed7b01f35e",
   "metadata": {},
   "outputs": [],
   "source": [
    "# n_hists: the number of trajectories to generate for 1 given environment \n",
    "# n_samples: the number of states (optimal actions) to query for 1 given trajectory \n",
    "# n_hists and n_samples default to be 1\n",
    "n_hists, n_samples, horizon = 1, 1, 100 \n",
    "\n",
    "# configuration file for data generation\n",
    "config = {\n",
    "        'n_hists': n_hists,  \n",
    "        'n_samples': n_samples,\n",
    "        'horizon': horizon, # length of each trajectory,\n",
    "        'in_traj':False\n",
    "}"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "0311772e-0af9-4f57-86e0-c1669f86ac39",
   "metadata": {},
   "outputs": [],
   "source": [
    "dim = 10 # size of DarkRoom is set to 10x10\n",
    "n_envs = 100000 \n",
    "\n",
    "# The 'rollin_type' item is not used if 'mode' is 'step'\n",
    "config.update({'dim': dim})\n",
    "# There are ( dim x dim ) possible goals\n",
    "goals = np.array([[(j, i) for i in range(dim)]\n",
    "                 for j in range(dim)]).reshape(-1, 2)\n",
    "\n",
    "np.random.RandomState(seed=0).shuffle(goals)\n",
    "train_test_split = int(.8 * len(goals))\n",
    "train_goals = goals[:train_test_split]\n",
    "test_goals = goals[train_test_split:]\n",
    "\n",
    "# construct the goals for training and testing: the goals in testing are different to those in training\n",
    "eval_goals = np.array(test_goals.tolist() *\n",
    "                      int(100 // len(test_goals)))\n",
    "train_goals = np.repeat(train_goals, n_envs // (dim * dim), axis=0)\n",
    "test_goals = np.repeat(test_goals, n_envs // (dim * dim), axis=0)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "27eda244-5a66-4758-9a32-6b2ef6db4088",
   "metadata": {},
   "source": [
    "## Generating Pretraining Data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "686d9519-4da4-4d3f-8ea3-3a78b794eed9",
   "metadata": {},
   "outputs": [],
   "source": [
    "random_p = (0.2,1.0)\n",
    "config['random_p']=random_p\n",
    "\n",
    "train_trajs = generate_darkroom_pref_histories(train_goals, **config)\n",
    "test_trajs = generate_darkroom_pref_histories(test_goals, **config)\n",
    "eval_trajs = generate_darkroom_pref_histories(eval_goals, **config)\n",
    "\n",
    "env = 'darkroom_pref_step'\n",
    "train_filepath = build_darkroom_data_filename(\n",
    "            env, n_envs, config, random_p, mode=0)\n",
    "test_filepath = build_darkroom_data_filename(\n",
    "    env, n_envs, config, random_p, mode=1)\n",
    "eval_filepath = build_darkroom_data_filename(env, 100, config, random_p, mode=2)\n",
    "\n",
    "# Saving Generated Trajectories\n",
    "if not os.path.exists('datasets'):\n",
    "    os.makedirs('datasets', exist_ok=True)\n",
    "\n",
    "with open(train_filepath, 'wb') as file:\n",
    "    pickle.dump(train_trajs, file)\n",
    "with open(test_filepath, 'wb') as file:\n",
    "    pickle.dump(test_trajs, file)\n",
    "with open(eval_filepath, 'wb') as file:\n",
    "    pickle.dump(eval_trajs, file)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "020b6c84-e2c1-455a-a66a-d7caa7432a92",
   "metadata": {},
   "source": [
    "## Generating Various Offline Testing Trajectories"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "deefa78e-a71b-4a7d-a45d-d80bb5d43d6c",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "n_envs = 10 #does not matter\n",
    "\n",
    "np.random.RandomState(seed=0).shuffle(goals)\n",
    "train_test_split = int(.8 * len(goals))\n",
    "train_goals = goals[:train_test_split]\n",
    "test_goals = goals[train_test_split:]\n",
    "\n",
    "eval_goals = np.array(test_goals.tolist() *\n",
    "                      int(100 // len(test_goals)))\n",
    "train_goals = np.repeat(train_goals, n_envs // (dim * dim), axis=0)\n",
    "test_goals = np.repeat(test_goals, n_envs // (dim * dim), axis=0)\n",
    "\n",
    "for random_p in [0.0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0]:\n",
    "    random_p = (random_p, 1.0)\n",
    "    print('Generating for random_p: ',random_p)\n",
    "    config['random_p']=random_p\n",
    "    # the 'rollin_type' option is not used\n",
    "    train_trajs = generate_darkroom_pref_histories(train_goals, **config)\n",
    "    test_trajs = generate_darkroom_pref_histories(test_goals, **config)\n",
    "    eval_trajs = generate_darkroom_pref_histories(eval_goals, **config)\n",
    "    \n",
    "    env = 'darkroom_pref_step'\n",
    "    train_filepath = build_darkroom_data_filename(\n",
    "                env, n_envs, config, random_p, mode=0)\n",
    "    test_filepath = build_darkroom_data_filename(\n",
    "        env, n_envs, config, random_p, mode=1)\n",
    "    eval_filepath = build_darkroom_data_filename(env, 100, config, random_p, mode=2)\n",
    "\n",
    "    with open('./'+train_filepath, 'wb') as file:\n",
    "        pickle.dump(train_trajs, file)\n",
    "    with open('./'+test_filepath, 'wb') as file:\n",
    "        pickle.dump(test_trajs, file)\n",
    "    with open('./'+eval_filepath, 'wb') as file:\n",
    "        pickle.dump(eval_trajs, file)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "in-context-learning",
   "language": "python",
   "name": "in-context-learning"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
