{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%env CUDA_VISIBLE_DEVICES=0\n",
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "\n",
    "import matplotlib.pyplot as plt\n",
    "%matplotlib inline\n",
    "\n",
    "from tqdm.notebook import tqdm\n",
    "import os\n",
    "from utils import write_ivecs, write_dvecs, read_ivecs, read_dvecs\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "n = 1010000\n",
    "k = 100\n",
    "d = 6\n",
    "X = (float(n) ** (1 / (d-1))) / d\n",
    "_p = lambda x: (float(x) ** 2 - 1) ** (d - 2)\n",
    "print(X)\n",
    "X = 1.8\n",
    "print(np.arccosh(X))\n",
    "\n",
    "set_path = f'gbnns_theory/data/hyperbolic_d{d}_X{X}'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "accepted = []\n",
    "counter = 0\n",
    "while len(accepted) < n:\n",
    "    candidate = np.random.uniform(1, X)\n",
    "    thr = _p(candidate)\n",
    "    if np.random.uniform(0, _p(X)) < thr:\n",
    "        accepted.append(candidate)\n",
    "    else:\n",
    "        counter += 1\n",
    "\n",
    "accepted = np.array(accepted)[:, None].astype('float64')\n",
    "plt.hist(accepted, bins=100)\n",
    "plt.show()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "x = np.random.randn(n, d).astype('float64')\n",
    "x = (x / np.linalg.norm(x, axis=1)[:, None]) * (accepted ** 2 - 1) ** 0.5\n",
    "x = np.concatenate([accepted, x], axis=1) \n",
    "base = x[:-10000]\n",
    "queries = x[-10000:]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "os.makedirs(set_path, exist_ok=True)\n",
    "\n",
    "write_dvecs(os.path.join(set_path, 'base.1M.dvecs'), base)\n",
    "write_dvecs(os.path.join(set_path, 'query.10K.dvecs'), queries)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Uniform sphere"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Parameters\n",
    "n = 1010000\n",
    "k = 100\n",
    "d = 6\n",
    "\n",
    "# Generate points\n",
    "x = np.random.randn(n, d + 1).astype('float64')\n",
    "x = x / np.linalg.norm(x, axis=1)[:, None]\n",
    "query = x[-10000:] \n",
    "base = x[:-10000]\n",
    "# dists = -1 * query.astype('float64') @ base.transpose().astype('float64')\n",
    "\n",
    "# # Compute gt\n",
    "# step = 100\n",
    "# gt = np.zeros((len(dists), k))\n",
    "# for i in tqdm(range(0, len(dists), step)):\n",
    "#     gt[i:i+step] = np.argsort(dists[i: i + step], axis=1)[:, :k]\n",
    "    \n",
    "    \n",
    "# Save points\n",
    "set_path = f'gbnns_theory/data/sphere_d{d}'\n",
    "os.makedirs(set_path, exist_ok=True)\n",
    "write_dvecs(os.path.join(set_path, 'base.1M.dvecs'), base)\n",
    "write_dvecs(os.path.join(set_path, 'query.10K.dvecs'), query)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.4"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
