{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "f848f016",
   "metadata": {},
   "source": [
    "# Sampling Mixture of two gaussians\n",
    "\n",
    "For $a \\in \\mathcal{R}^{d}$ and a positive definite matrix $\\Sigma \\in \\mathcal{R}^{{d \\times d}}$,\n",
    "we consider the mixture of two gaussian $\\mathcal{N}(a,\\Sigma)$ and $\\mathcal{N}(-a,\\Sigma)$ with equal weights. Denote $b = \\Sigma^{{-1}} a$ and $\\Lambda = \\Sigma^{{-1}}$.\n",
    "The potential and gradient can be written as\n",
    "\\begin{equation}\n",
    "\\begin{split}\n",
    "f(x)  & = \\frac{1}{2} \\| x - a  \\|^2_{\\Lambda} - \\log ( 1 + \\exp( -2 x^\\top b)  )\n",
    "\\\\ \\nabla f(x) & = \\Lambda x- b + 2 b ( 1+\\exp(-2 x^\\top b) )^{-1}.\n",
    "\\end{split}\n",
    "\\end{equation}\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "62372a47",
   "metadata": {},
   "outputs": [],
   "source": [
    "import numpy as np\n",
    "import matplotlib\n",
    "import matplotlib.pyplot as plt\n",
    "import arviz\n",
    "import argparse\n",
    "import os\n",
    "import time\n",
    "from typing import Callable\n",
    "\n",
    "import scipy.stats as spst\n",
    "import scipy.special as spsp\n",
    "import tqdm\n",
    "\n",
    "import hmc\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a43175d4",
   "metadata": {},
   "outputs": [],
   "source": [
    "def Chebyroot(k, alpha=1.0, beta=10):\n",
    "   assert beta > alpha\n",
    "   a = np.arange(1,k+1)\n",
    "   return (alpha+beta)/2.0  - (beta-alpha)/2.0*np.cos( (a -0.5)*np.pi / k  )  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "71165af3",
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "parser = argparse.ArgumentParser(description='Bias in Hamiltonian Monte Carlo when using the implicit midpoint integrator')\n",
    "parser.add_argument('--step-size', type=float, default=0.1, help='Integration step-size')\n",
    "parser.add_argument('--num-samples', type=int, default=10000, help='Number of samples to generate')\n",
    "parser.add_argument('--thresh', type=float, default=1e-6, help='Convergence tolerance for fixed-point iterations')\n",
    "parser.add_argument('--method', type=str, default='lf', help='Which integrator to use in proposal operator')\n",
    "parser.add_argument('--use-Cheby', type=bool, default=True, help='Whether use Chebyshev integration time')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "adc49c7d",
   "metadata": {},
   "outputs": [],
   "source": [
    "args = parser.parse_args(args=[])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "83294c73",
   "metadata": {},
   "outputs": [],
   "source": [
    "def experiment(method: str, step_size: float, num_samples: int, proposal: Callable, if_use_Cheby: bool, alpha: float, beta: float) -> np.ndarray:\n",
    "    \"\"\"Experiment to examine the use of different integrators for sampling from a\n",
    "    Gaussian distribution. Given a proposal operator, attempts to draw samples\n",
    "    and computes performance metrics for the sampler.\n",
    "    Args:\n",
    "        method: String identifier for the proposal method.\n",
    "        step_size: Integration step-size.\n",
    "        num_samples: Number of samples to generate.\n",
    "        proposal: Proposal function that will yield the next state of the Markov\n",
    "            chain.\n",
    "    Returns:\n",
    "        samples: Samples from the Markov chain generated using the proposal\n",
    "            operator.\n",
    "    \"\"\"\n",
    "    integration_time = np.zeros(num_samples+1)\n",
    "    if if_use_Cheby:\n",
    "        tmp = Chebyroot(num_samples+1, alpha, beta)\n",
    "        integration_time = np.pi/ 2 / np.sqrt(2*np.random.permutation(tmp))\n",
    "    else:\n",
    "        integration_time = np.pi/ 2 / np.sqrt(2*beta)* np.ones(num_samples+1);\n",
    "    sampler = hmc.sample(mu, step_size, integration_time, hamiltonian, proposal, sample_momentum, use_Cheby= if_use_Cheby, check_prob=0.0001)\n",
    "    samples = np.zeros((num_samples, dim))\n",
    "    acc = 0\n",
    "    _ = next(sampler)\n",
    "    start = time.time()\n",
    "    for i in range(num_samples):\n",
    "        samples[i], isacc, nsteps = next(sampler)\n",
    "        acc += isacc\n",
    "    elapsed = time.time() - start\n",
    "    accprob = acc / num_samples\n",
    "    \n",
    "    return samples, elapsed, accprob, nsteps\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "064824aa",
   "metadata": {},
   "outputs": [],
   "source": [
    "dim = 10\n",
    "a1  = np.arange(dim) + 1.0 \n",
    "mu  = np.sqrt(a1) / (2*dim)\n",
    "Sigma = np.diag( a1 / dim )\n",
    "iSigma= np.linalg.inv(Sigma)\n",
    "evals = np.linalg.eigvals(iSigma)\n",
    "alpha = min(evals)\n",
    "beta  = max(evals)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "16e4b908",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "runs  = 10 #number of runs\n",
    "array_stepsize = np.array( [0.001, 0.005, 0.01, 0.05, 0.1] )\n",
    "\n",
    "distr = hmc.applications.gaussian_mixture\n",
    "log_posterior, grad_log_posterior, metric = distr.posterior_factory(mu, Sigma)\n",
    "hamiltonian, grad_pos_hamiltonian, grad_mom_hamiltonian, vector_field, sample_momentum = hmc.integrators.vector_fields.euclidean_hamiltonian_vector_field(log_posterior, grad_log_posterior, metric)\n",
    "\n",
    "proposal = hmc.proposals.leapfrog_proposal_factory(grad_pos_hamiltonian, grad_mom_hamiltonian)\n",
    "name = 'l.f.'\n",
    "args.thresh = 0.0\n",
    "coef = ['beta-{}'.format(i+1) for i in range(dim)]\n",
    "\n",
    "\n",
    "#Use Cheby Integration time\n",
    "Cheby_mean_es = np.zeros( [runs, len(array_stepsize)] )\n",
    "Cheby_min_ess = np.zeros( [runs, len(array_stepsize)] )\n",
    "Cheby_nsteps  = np.zeros( [runs, len(array_stepsize)] )\n",
    "Cheby_elapsed = np.zeros( [runs, len(array_stepsize)])\n",
    "Cheby_accprob = np.zeros( [runs, len(array_stepsize)])\n",
    "\n",
    "for it in range(runs):\n",
    "    for idd in range( len(array_stepsize) ):\n",
    "        samples, Cheby_elapsed[it,idd],  Cheby_accprob[it,idd], Cheby_nsteps[it,idd] = experiment(name, array_stepsize[idd], args.num_samples, proposal, True, alpha, beta)\n",
    "        print('covariance {:} {:}'.format(it,idd))\n",
    "        #print(np.cov(samples.T))\n",
    "        print(np.diag(np.cov(samples.T) ))\n",
    "        metrics = hmc.summarize(samples, coef)\n",
    "        Cheby_mean_es[it,idd] = metrics['ess'].mean()\n",
    "        Cheby_min_ess[it,idd] = metrics['ess'].min()\n",
    "\n",
    "#Use constant Integration time\n",
    "Cst_mean_es = np.zeros( [runs, len(array_stepsize)])\n",
    "Cst_min_ess = np.zeros( [runs, len(array_stepsize)])\n",
    "Cst_nsteps  = np.zeros( [runs, len(array_stepsize)])\n",
    "Cst_elapsed  = np.zeros([runs, len(array_stepsize)])\n",
    "Cst_accprob = np.zeros( [runs, len(array_stepsize)])\n",
    "\n",
    "for it in range(runs):\n",
    "    for idd in range( len(array_stepsize) ):\n",
    "        samples, Cst_elapsed[it,idd],  Cst_accprob[it,idd], Cst_nsteps[it,idd] = experiment(name, array_stepsize[idd], args.num_samples, proposal, False, alpha, beta)\n",
    "        print('covariance {:} {:}'.format(it,idd))\n",
    "        #print(np.cov(samples.T))\n",
    "        print(np.diag(np.cov(samples.T) ))\n",
    "        metrics = hmc.summarize(samples, coef)\n",
    "        Cst_mean_es[it,idd] = metrics['ess'].mean()\n",
    "        Cst_min_ess[it,idd] = metrics['ess'].min()\n",
    "\n",
    "\n",
    "for idd in range( len(array_stepsize) ):\n",
    "    print(\"=== Using Step Size = {:3e}  \".format(array_stepsize[idd]))\n",
    "    print('=== Chebyshev Integration-Time ===')\n",
    "    \n",
    "    print('average of mean ESS in {:} runs: {:5.5f}'.format(runs, np.mean(Cheby_mean_es[:,idd])))\n",
    "    print('std of mean ESS in {:} runs:     {:5.5f}'.format(runs, np.std(Cheby_mean_es[:,idd])))\n",
    "    print('average of min ESS in {:} runs:  {:5.5f}'.format(runs, np.mean(Cheby_min_ess[:,idd])))\n",
    "    print('std of min ESS in {:} runs:      {:5.5f}'.format(runs, np.std(Cheby_min_ess[:,idd])))\n",
    "\n",
    "    print('average of mean ESS/Sec. in {:} runs: {:5.5f}'.format(runs, np.mean(Cheby_mean_es[:,idd]/Cheby_elapsed[:,idd])) )\n",
    "    print('std of mean ESS/Sec. in {:} runs:     {:5.5f}'.format(runs, np.std(Cheby_mean_es[:,idd]/Cheby_elapsed[:,idd]) ))\n",
    "    print('average of min ESS/Sec. in {:} runs:  {:5.5f}'.format(runs, np.mean(Cheby_min_ess[:,idd]/Cheby_elapsed[:,idd])) )\n",
    "    print('std of min ESS/Sec. in {:} runs:      {:5.5f}'.format(runs, np.std(Cheby_min_ess[:,idd]/Cheby_elapsed[:,idd]) ))\n",
    "\n",
    "    print('average of acceptance prob. in {:} runs: {:5.5f}'.format(runs, np.mean(Cheby_accprob[:,idd])))\n",
    "    print('std of acceptance prob. in {:} runs: {:5.5f}'.format(runs, np.std(Cheby_accprob[:,idd])))\n",
    "\n",
    "    print('average of mean ESS per grad. in {:} runs: {:5.5f}'.format(runs, np.mean(Cheby_mean_es[:,idd]/Cheby_nsteps[:,idd]))) \n",
    "    print('std of mean ESS per grad. in {:} runs:     {:5.5f}'.format(runs, np.std(Cheby_mean_es[:,idd]/Cheby_nsteps[:,idd])))\n",
    "    print('average of min per grad in {:} runs:  {:5.5f}'.format(runs, np.mean(Cheby_min_ess[:,idd]/Cheby_nsteps[:,idd])))\n",
    "    print('std of min per grad in {:} runs:      {:5.5f}'.format(runs, np.std(Cheby_min_ess[:,idd]/Cheby_nsteps[:,idd])))\n",
    "\n",
    "    print('=== Const Integration-Time ===')\n",
    "    print('average of mean ESS in {:} runs: {:5.5f}'.format(runs, np.mean(Cst_mean_es[:,idd])))\n",
    "    print('std of mean ESS in {:} runs:     {:5.5f}'.format(runs, np.std(Cst_mean_es[:,idd])))\n",
    "    print('average of min ESS in {:} runs:  {:5.5f}'.format(runs, np.mean(Cst_min_ess[:,idd])))\n",
    "    print('std of min ESS in {:} runs:      {:5.5f}'.format(runs, np.std(Cst_min_ess[:,idd])))\n",
    "\n",
    "    print('average of mean ESS/Sec. in {:} runs: {:5.5f}'.format(runs, np.mean(Cst_mean_es[:,idd]/Cst_elapsed[:,idd])))\n",
    "    print('std of mean ESS/Sec. in {:} runs:     {:5.5f}'.format(runs, np.std(Cst_mean_es[:,idd]/Cst_elapsed[:,idd])))\n",
    "    print('average of min ESS/Sec. in {:} runs:  {:5.5f}'.format(runs, np.mean(Cst_min_ess[:,idd]/Cst_elapsed[:,idd])))\n",
    "    print('std of min ESS/Sec. in {:} runs:      {:5.5f}'.format(runs, np.std(Cst_min_ess[:,idd]/Cst_elapsed[:,idd])))          \n",
    "    \n",
    "    print('average of acceptance prob. in {:} runs: {:5.5f}'.format(runs, np.mean(Cst_accprob[:,idd])))\n",
    "    print('std of acceptance prob. in {:} runs: {:5.5f}'.format(runs, np.std(Cst_accprob[:,idd])))\n",
    "\n",
    "    print('average of mean ESS per grad. in {:} runs: {:5.5f}'.format(runs, np.mean(Cst_mean_es[:,idd]/Cst_nsteps[:,idd]))) \n",
    "    print('std of mean ESS per grad. in {:} runs:     {:5.5f}'.format(runs, np.std(Cst_mean_es[:,idd]/Cst_nsteps[:,idd])))\n",
    "    print('average of min per grad in {:} runs:  {:5.5f}'.format(runs, np.mean(Cst_min_ess[:,idd]/Cst_nsteps[:,idd])))\n",
    "    print('std of min per grad in {:} runs:      {:5.5f}'.format(runs, np.std(Cst_min_ess[:,idd]/Cst_nsteps[:,idd])))\n",
    "\n",
    "    print(\"=============================\")\n",
    "    print(\"=============================\")\n",
    "\n",
    "\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "b6f6ce39",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "rec = np.zeros( [len(array_stepsize), 20] )\n",
    "\n",
    "for idd in range( len(array_stepsize) ):\n",
    "    rec[idd,0] = np.mean(Cheby_mean_es[:,idd])\n",
    "    rec[idd,1] = np.std(Cheby_mean_es[:,idd])\n",
    "    rec[idd,2] = np.mean(Cheby_min_ess[:,idd])\n",
    "    rec[idd,3] = np.std(Cheby_min_ess[:,idd])\n",
    "    rec[idd,4] = np.mean(Cheby_mean_es[:,idd]/Cheby_elapsed[:,idd])\n",
    "    rec[idd,5] = np.std(Cheby_mean_es[:,idd]/Cheby_elapsed[:,idd])\n",
    "    rec[idd,6] = np.mean(Cheby_min_ess[:,idd]/Cheby_elapsed[:,idd])\n",
    "    rec[idd,7] = np.std(Cheby_min_ess[:,idd]/Cheby_elapsed[:,idd])\n",
    "    \n",
    "    rec[idd,8] = np.mean(Cst_mean_es[:,idd])\n",
    "    rec[idd,9] = np.std(Cst_mean_es[:,idd])\n",
    "    rec[idd,10] = np.mean(Cst_min_ess[:,idd])\n",
    "    rec[idd,11] = np.std(Cst_min_ess[:,idd])\n",
    "    rec[idd,12] = np.mean(Cst_mean_es[:,idd]/Cst_elapsed[:,idd])\n",
    "    rec[idd,13] = np.std(Cst_mean_es[:,idd]/Cst_elapsed[:,idd])\n",
    "    rec[idd,14] = np.mean(Cst_min_ess[:,idd]/Cst_elapsed[:,idd])\n",
    "    rec[idd,15] = np.std(Cst_min_ess[:,idd]/Cst_elapsed[:,idd])\n",
    "\n",
    "    rec[idd,16] = np.mean(Cheby_accprob[:,idd])\n",
    "    rec[idd,17] = np.std(Cheby_accprob[:,idd])\n",
    "    rec[idd,18] = np.mean(Cst_accprob[:,idd])\n",
    "    rec[idd,19] = np.std(Cst_accprob[:,idd])\n",
    "\n",
    "filepath='./mixture.csv'\n",
    "np.savetxt(filepath, rec, delimiter=',')\n",
    "data = np.loadtxt(filepath, delimiter=',')\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
