{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "158976ac-e948-49a6-8460-f3ea004c8bed",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import pandas as pd\n",
    "import os\n",
    "import importlib\n",
    "import sys\n",
    "import torch\n",
    "from plotnine import *\n",
    "import anndata\n",
    "import itertools\n",
    "sys.path.insert(0, \"../../\")\n",
    "import scripts.evolve, scripts.regression"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "af11d635-3d9f-4175-bc4a-c5c0a495674a",
   "metadata": {},
   "outputs": [],
   "source": [
    "model = scripts.regression.LightningModel.load_from_checkpoint(\n",
    "    'reg_lm/lightning_logs/version_0/checkpoints/epoch=7-step=20968.ckpt')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "34426c8f-e36d-49d8-9cbf-f03dbe500b8f",
   "metadata": {},
   "outputs": [],
   "source": [
    "start_seqs = pd.read_csv('synthetic_enhancers/start_seqs.csv', index_col=0)"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "52020f99-2570-4a3b-bd41-ecd9e2d9cea5",
   "metadata": {},
   "source": [
    "## Ledidi"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "5a65976e-11ea-4107-82d1-ff4384d9b0ad",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "naa_df = pd.DataFrame()\n",
    "\n",
    "for i, seq in enumerate(start_seqs.iloc[:,0].tolist()):\n",
    "    out_seq = scripts.evolve.ledidi(seq, model, to_max=[0],to_min=[1,2], device=0, num_workers=8)\n",
    "    df = pd.DataFrame({'Sequence':out_seq})    \n",
    "    df['start_seq'] = i\n",
    "    naa_df = pd.concat([naa_df, df])\n",
    "\n",
    "naa_df.reset_index(drop=True).to_csv('synthetic_enhancers/LE_naa.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "63f5dcf9-3e1a-4f7d-9df7-3733e6e00930",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "ana_df = pd.DataFrame()\n",
    "\n",
    "for i, seq in enumerate(start_seqs.iloc[:, 0].tolist()):\n",
    "    out_seq = grelu.design.evolve.ledidi(\n",
    "    out_seq = scripts.evolve.ledidi(seq, model, to_max=[1],to_min=[0,2], device=0, num_workers=8)\n",
    "        max_iter=1000, device=5, l=20, lr=3.5e-3,\n",
    "    )\n",
    "    df = pd.DataFrame({'Sequence':out_seq})    \n",
    "    df['start_seq'] = i\n",
    "    ana_df = pd.concat([ana_df, df])\n",
    "\n",
    "ana_df.reset_index(drop=True).to_csv('synthetic_enhancers/LE_ana.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "71cfee7b-46f0-461f-9bfd-162ab1596d5e",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "aan_df = pd.DataFrame()\n",
    "\n",
    "for i, seq in enumerate(start_seqs.iloc[:, 0].tolist()):\n",
    "    out_seq = grelu.design.evolve.ledidi(\n",
    "    out_seq = scripts.evolve.ledidi(seq, model, to_max=[2],to_min=[1,0], device=0, num_workers=8)\n",
    "        max_iter=1000, device=5, l=20, lr=3.5e-3,\n",
    "    )\n",
    "    df = pd.DataFrame({'Sequence':out_seq})    \n",
    "    df['start_seq'] = i\n",
    "    aan_df = pd.concat([aan_df, df])\n",
    "\n",
    "aan_df.reset_index(drop=True).to_csv('synthetic_enhancers/LE_aan.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7ff1bd99-b327-4bb2-8a82-a5131988fef6",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.17"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
