{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "4dfb58cd-b02a-4bf9-bb5a-a3cdff4e4187",
   "metadata": {},
   "source": [
    "# Generate synthetic yeast promoters using regLM"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a6a141f0-2570-4593-a40b-b1f263e67790",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "import os\n",
    "import importlib\n",
    "import sys\n",
    "import torch\n",
    "\n",
    "torch.backends.cuda.matmul.allow_tf32 = True\n",
    "torch.backends.cudnn.allow_tf32 = True\n",
    "\n",
    "sys.path.append(\"../../regLM/\")\n",
    "\n",
    "os.environ[\"CUDA_VISIBLE_DEVICES\"]=\"2\"\n",
    "import reglm.lightning"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "006dc325-15fe-4419-ad96-2023f7172468",
   "metadata": {},
   "outputs": [],
   "source": [
    "model = reglm.lightning.LightningModel.load_from_checkpoint(\n",
    "    'lightning_logs/version_10/checkpoints/epoch=9-step=580648.ckpt')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f9cb0486-55fc-4165-891d-85880521985b",
   "metadata": {},
   "outputs": [],
   "source": [
    "df = pd.DataFrame()\n",
    "for label in ['00', '11', '22', '33', '44']:\n",
    "    print(label)\n",
    "    seqs = []\n",
    "    for i in range(150):\n",
    "        seqs.append(model.generate(label=label, device=0, max_new_tokens=80, sample=True))\n",
    "    df = pd.concat([df, pd.DataFrame({'Sequence':seqs, 'label':tok})])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e2685bcd-5301-473c-8779-b25904fcad29",
   "metadata": {},
   "outputs": [],
   "source": [
    "df.reset_index(drop=True).to_csv('synthetic_promoters/lm.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "f764f741-d86a-4b45-b54b-c4846e83dd54",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.17"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
