{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "%matplotlib inline\n",
    "import sys, os\n",
    "sys.path.append(\"../\")\n",
    "import numpy as np\n",
    "import numpy.linalg as nla\n",
    "import scipy.linalg as sla\n",
    "import numba as nb\n",
    "import matplotlib as mpl\n",
    "import matplotlib.pyplot as plt\n",
    "from timeit import timeit\n",
    "import matplotlib.pylab as pl\n",
    "%load_ext autoreload\n",
    "%autoreload 2"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from numba import types\n",
    "from numba.extending import overload\n",
    "from numba import config, njit, threading_layer, set_num_threads\n",
    "\n",
    "@overload(np.maximum)\n",
    "def impl_clip(x, a):\n",
    "    # In numba type checking happens at *compile time*. We check the types of\n",
    "    # the arguments here, and return a proper implementation based on those\n",
    "    # types (or error accordingly).\n",
    "\n",
    "    # Check that `a` is a scalar\n",
    "    if not isinstance(a, (types.Integer, types.Float, types.NoneType)):\n",
    "        raise TypingError(\"a must be a scalar int/float\")\n",
    "\n",
    "    if isinstance(x, (types.Integer, types.Float)):\n",
    "        # x is a scalar with a valid type\n",
    "        def impl(x, a):\n",
    "            return max(x, a)    \n",
    "    elif (\n",
    "        isinstance(x, types.Array) and\n",
    "        x.ndim == 1 and\n",
    "        isinstance(x.dtype, (types.Integer, types.Float))\n",
    "    ):\n",
    "        # x is a 1D array of the proper type\n",
    "        def impl(x, a):\n",
    "            # Allocate an output array using standard numpy functions\n",
    "#             out = np.empty_like(x)\n",
    "            # Iterate over x, calling `np.clip` on every element\n",
    "            for i in numba.prange(x.size):\n",
    "                # This will dispatch to the proper scalar implementation (as\n",
    "                # defined above) at *compile time*. There should have no\n",
    "                # overhead at runtime.\n",
    "                x[i] = impl(x[i], 0)\n",
    "            return x\n",
    "    elif ( \n",
    "        isinstance(x, types.Array) and\n",
    "        x.ndim == 2 and\n",
    "        isinstance(x.dtype, (types.Integer, types.Float))\n",
    "    ):   \n",
    "        def impl(x, a):\n",
    "            return impl(x.reshape(-1), a)\n",
    "    else:\n",
    "        raise TypingError(\"x must be an int/float or a 1D/2D array of ints/floats\")\n",
    "\n",
    "    return impl\n",
    "\n",
    "# @overload(np.maximum)\n",
    "# def my_clip(x, a):\n",
    "#     # In numba type checking happens at *compile time*. We check the types of\n",
    "#     # the arguments here, and return a proper implementation based on those\n",
    "#     # types (or error accordingly).\n",
    "\n",
    "#     # Check that `a` is a scalar\n",
    "#     if not isinstance(a, (types.Integer, types.Float, types.NoneType)):\n",
    "#         raise TypingError(\"a must be a scalar int/float\")\n",
    "\n",
    "#     if isinstance(x, (types.Integer, types.Float)):\n",
    "#         # x is a scalar with a valid type\n",
    "#         def impl(x, a):\n",
    "#             return max(x, a)    \n",
    "#     elif (\n",
    "#         isinstance(x, types.Array) and\n",
    "#         x.ndim == 1 and\n",
    "#         isinstance(x.dtype, (types.Integer, types.Float))\n",
    "#     ):\n",
    "#         # x is a 1D array of the proper type\n",
    "#         def impl(x, a):\n",
    "#             # Allocate an output array using standard numpy functions\n",
    "# #             out = np.empty_like(x)\n",
    "#             # Iterate over x, calling `np.clip` on every element\n",
    "#             for i in range(x.size):\n",
    "#                 # This will dispatch to the proper scalar implementation (as\n",
    "#                 # defined above) at *compile time*. There should have no\n",
    "#                 # overhead at runtime.\n",
    "#                 x[i] = impl(x[i], 0)\n",
    "#             return x\n",
    "#     elif ( \n",
    "#         isinstance(x, types.Array) and\n",
    "#         x.ndim == 2 and\n",
    "#         isinstance(x.dtype, (types.Integer, types.Float))\n",
    "#     ):   \n",
    "#         def impl(x, a):\n",
    "#             for i in range(x.shape[0]):\n",
    "#                 np.maximum(x[i, :], a, out=x[i, :])\n",
    "#             return x\n",
    "#     else:\n",
    "#         raise TypingError(\"x must be an int/float or a 1D/2D array of ints/floats\")\n",
    "\n",
    "#     return impl\n",
    "\n",
    "# config.THREADING_LAYER = 'threadsafe'\n",
    "# print(\"Threading layer chosen: %s\" % threading_layer())\n",
    "\n",
    "@nb.jit(nopython=True, fastmath=False, parallel=True)\n",
    "def proxgrad(x, C, step):\n",
    "    x_ = 0\n",
    "    for i in nb.prange(x.size):\n",
    "#         x_ = x[i]\n",
    "        x[i] = max(x[i] - step * C[i], 0.0)\n",
    "    return x\n",
    "\n",
    "@nb.njit (cache=True, fastmath=True, parallel=True)\n",
    "def test_clip(x, amin):\n",
    "    return np.maximum(x, amin)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 189,
   "metadata": {},
   "outputs": [],
   "source": [
    "import scipy as sp\n",
    "import numba as nb\n",
    "\n",
    "@nb.jit(cache=True, nopython=True, fastmath=False, parallel=True)\n",
    "def trace_nonnegative_prox_nb_new(x, C, a, b, step=1.0):\n",
    "    nrows = a.size\n",
    "    tmp = 0.0\n",
    "    for i in nb.prange(x.size):\n",
    "        tmp = a[i % nrows] + b[i // nrows] - step * C[i]\n",
    "        if tmp > 0 or x[i] > 0:\n",
    "            x[i] = max(x[i] + tmp, 0.0)    \n",
    "#         x[i] = max(x[i] + a[i % nrows] + b[i // nrows] - step * C[i], 0.0)\n",
    "    return x\n",
    "\n",
    "@nb.jit(cache=True, nopython=True, fastmath=False, parallel=True)\n",
    "def trace_nonnegative_prox_nb(x, C, step=1.0):\n",
    "    for i in nb.prange(x.size):\n",
    "        x[i] = max(x[i] - step * C[i], 0.0)\n",
    "    return x\n",
    "\n",
    "def apply_adjoint_operator_and_override(e, f, y, x, T, alpha=1.0, beta=None):\n",
    "    \"\"\"\n",
    "        T <- T + alpha * y e^T + beta* f x^T\n",
    "    \"\"\"\n",
    "    assert T.flags['F_CONTIGUOUS']\n",
    "    assert e.size == x.size, \"Dimension mismatch\"\n",
    "    assert f.size == y.size, \"Dimension mismatch\"\n",
    "    if beta is None:\n",
    "        beta = alpha\n",
    "    sp.linalg.blas.dger(alpha, y, e, a=T, overwrite_a=1)\n",
    "    sp.linalg.blas.dger(beta, f, x, a=T, overwrite_a=1)\n",
    "    return T\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# F-Order"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "m, n = 3, 4\n",
    "A = np.random.randn(m, n)\n",
    "C = np.random.randn(m, n)\n",
    "e = np.ones(n)\n",
    "f = np.ones(m)\n",
    "s = np.random.rand(n)\n",
    "r = np.random.rand(m)\n",
    "s, r = r / np.sum(r), s / np.sum(s)\n",
    "\n",
    "A = np.array(A, order='F')\n",
    "B = np.array(A, order='F')\n",
    "C = np.array(C, order='F')\n",
    "\n",
    "assert np.allclose(A, B)            \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 190,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0.066798"
      ]
     },
     "execution_count": 190,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "m, n = 2000, 5000\n",
    "x_ = np.random.randn(m, n) - 1.5\n",
    "C = np.random.randn(m, n)**2\n",
    "\n",
    "a = np.random.randn(m) \n",
    "b = np.random.randn(n)\n",
    "e = np.ones(n)\n",
    "f = np.ones(m)\n",
    "\n",
    "x = np.maximum(x_, 0.0, order='F')\n",
    "y = np.array(x, order='F')\n",
    "\n",
    "assert np.allclose(x, y)    \n",
    "\n",
    "np.sum(x > 0) / (m * n)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array([[-3.22531379, -0.49389807,  1.67878408,  0.46846923],\n",
       "       [-3.21394236,  0.93822252,  2.27044393,  0.63612745],\n",
       "       [-2.64526201,  0.59295122,  2.63207077,  2.0292389 ]])"
      ]
     },
     "execution_count": 74,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# y + np.outer(a, e) + np.outer(f, b)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 191,
   "metadata": {},
   "outputs": [],
   "source": [
    "apply_adjoint_operator_and_override(e, f, a, b, y, alpha=1.0)\n",
    "trace_nonnegative_prox_nb(y.T.reshape(-1), C.T.reshape(-1), step=5.0)\n",
    "\n",
    "trace_nonnegative_prox_nb_new(x.T.reshape(-1), C.T.reshape(-1), a, b, step=5.0)\n",
    "\n",
    "assert np.allclose(x, y)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 192,
   "metadata": {},
   "outputs": [],
   "source": [
    "def run(): \n",
    "    apply_adjoint_operator_and_override(e, f, a, b, y, alpha=1.0)\n",
    "    trace_nonnegative_prox_nb(y.T.reshape(-1), C.T.reshape(-1), step=5.0)\n",
    "    return e"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 193,
   "metadata": {},
   "outputs": [],
   "source": [
    "def run_():\n",
    "    trace_nonnegative_prox_nb_new(x.T.reshape(-1), C.T.reshape(-1), a, b, step=5.0)\n",
    "    return e"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 194,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "85.7 ms ± 1.31 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)\n"
     ]
    }
   ],
   "source": [
    "%timeit run()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 195,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "92.2 ms ± 1.05 ms per loop (mean ± std. dev. of 7 runs, 10 loops each)\n"
     ]
    }
   ],
   "source": [
    "%timeit run_()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Test rank-one update"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[True, True, True, True]"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "m, n = 4, 20\n",
    "A = np.random.randn(m, n)\n",
    "e = np.ones(n)\n",
    "f = np.ones(m)\n",
    "yy = np.random.randn(m,1)\n",
    "xx = np.random.randn(n)\n",
    "\n",
    "assert np.allclose(A - np.outer(yy, e) - np.outer(f, xx), A - yy - xx)\n",
    "D = np.outer(yy, e) + np.outer(f, xx)\n",
    "[np.allclose(D[i, j], yy[i] + xx[j]) for i, j in zip(range(yy.size), range(xx.size))]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Test Ye"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "m, n = 20000, 20000\n",
    "e = np.ones(n)\n",
    "f = np.ones(m)\n",
    "\n",
    "t1 = np.random.randn(m)\n",
    "t2 = np.random.randn(n)\n",
    "\n",
    "c1 = 0.8\n",
    "c2 = 0.9 \n",
    "\n",
    "def run(t1, t2, c1, c2, e , f):\n",
    "    return t1 - c1 * f, t2 - c2 * e\n",
    "\n",
    "# Broadcasting\n",
    "def run_(t1, t2, c1, c2):\n",
    "    return t1 - c1, t2 - c2\n",
    "\n",
    "yy, xx = run(t1, t2, c1, c2, e , f)\n",
    "yy_, xx_ = run_(t1, t2, c1, c2)\n",
    "\n",
    "assert np.allclose(yy, yy_)\n",
    "assert np.allclose(xx, xx_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit run(t1, t2, c1, c2, e , f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit run_(t1, t2, c1, c2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Test trace nonnegative prox "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "proxgrad(A.T.reshape(-1), C.T.reshape(-1), 1.0)\n",
    "np.maximum(B - C, 0.0, out=B, order='F')\n",
    "\n",
    "assert np.allclose(A, B)\n",
    "assert A.flags['F_CONTIGUOUS']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit proxgrad(A.T.reshape(-1), C.T.reshape(-1), 1.0)   "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "%timeit proxgrad(A.reshape(-1), C.reshape(-1), 1.0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit np.maximum(B - C, 0.0, out=B, order='F')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": false
   },
   "outputs": [],
   "source": [
    "%timeit global B; B-=A"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit sla.blas.daxpy(A, B, a=-2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Test rank one update"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit B = sla.blas.dger(1.4, s, e, a=A, overwrite_a=0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit np.subtract(A, 1.4*np.outer(s, e), out=A, order='F')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "%timeit sla.blas.dger(-1.4, s, e, a=B, overwrite_a=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## Test matrix-vector multiplication"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "b = np.sum(A, axis=0)\n",
    "c = A.T.dot(f)\n",
    "d = sla.blas.dgemv(1, A, f, trans=1)\n",
    "\n",
    "assert np.allclose(b,c)\n",
    "assert np.allclose(c,d)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit A.T.dot(f)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit sla.blas.dgemv(1, A, f, trans=1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# C-Order"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "m, n = 10000, 5000\n",
    "A = np.random.randn(m, n)\n",
    "C = np.random.randn(m, n)\n",
    "B = A.copy()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "nb.config.NUMBA_DEFAULT_NUM_THREADS, nb.config.NUMBA_NUM_THREADS"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit test_clip(C, 0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit np.maximum(B-C, 0, out=B)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "scrolled": true
   },
   "outputs": [],
   "source": [
    "%timeit proxgrad(A.reshape(-1), C.reshape(-1), 1.0)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit A - B"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit global B; B -=A "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "assert np.allclose(A, B)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "e = np.ones(A.shape[1])\n",
    "f = np.ones(A.shape[0])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit A.T.dot(f)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Test prox functions"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import scipy\n",
    "m, n = 10000, 5000\n",
    "A = np.random.randn(m, n)\n",
    "x = np.random.randn(m)\n",
    "y = np.random.randn(n)\n",
    "r = np.random.rand(n)\n",
    "s = np.random.rand(m)\n",
    "r, s = r / np.sum(r), s / np.sum(s)\n",
    "\n",
    "B = np.array(A, order='F')\n",
    "assert np.allclose(A, B)\n",
    "\n",
    "# def numpy_run1(A):\n",
    "#     A_ = A.copy()\n",
    "#     A_ += np.outer(x, y)\n",
    "\n",
    "# def scipy_run(A):\n",
    "#     B = np.array(A, order='F')\n",
    "#     assert B.flags['F_CONTIGUOUS']\n",
    "#     scipy.linalg.blas.dger(1, x, y, a=B, overwrite_a=1)\n",
    "\n",
    "# f1 = lambda: numpy_run1(A)\n",
    "# ts_md = timeit(f1, number=1)\n",
    "# print(ts_md)\n",
    "\n",
    "# f2 = lambda: scipy_run(B)\n",
    "# ts_md = timeit(f2, number=1)\n",
    "# print(ts_md)\n",
    "\n",
    "# assert np.allclose(A, A_)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%timeit A.dot(y)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "m, n = 5000, 5000\n",
    "A = np.random.randn(m, n)\n",
    "x = np.random.randn(m)\n",
    "y = np.random.randn(n)\n",
    "r = np.random.rand(n)\n",
    "s = np.random.rand(m)\n",
    "r, s = r / np.sum(r), s / np.sum(s)\n",
    "e = np.ones(n)\n",
    "f = np.ones(m)\n",
    "\n",
    "B = np.array(A, order='F')\n",
    "C = np.zeros((m,n))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "f1 = lambda: projection_1(A, s, r)\n",
    "ts_md = timeit(f1, number=1)\n",
    "print(ts_md)\n",
    "\n",
    "f2 = lambda: projection_2(B, s, r)\n",
    "ts_md = timeit(f2, number=1)\n",
    "print(ts_md)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def Sinkhorn(C, reg, a, b, delta=1e-9, lam=1e-6):\n",
    "\n",
    "    K = np.exp(-C / reg)\n",
    "    u = np.ones(np.shape(a)[0])\n",
    "    v = np.ones(np.shape(b)[0])\n",
    "\n",
    "    u_trans = np.dot(K, v) + lam  # add regularization to avoid divide 0\n",
    "    v_trans = np.dot(K.T, u) + lam  # add regularization to avoid divide 0\n",
    "\n",
    "    err_1 = np.sum(np.abs(u * u_trans - a))\n",
    "    err_2 = np.sum(np.abs(v * v_trans - b))\n",
    "\n",
    "    while True:\n",
    "        if err_1 + err_2 > delta:\n",
    "            u = a / u_trans\n",
    "            v_trans = np.dot(K.T, u) + lam\n",
    "\n",
    "            v = b / v_trans\n",
    "            u_trans = np.dot(K, v) + lam\n",
    "\n",
    "            err_1 = np.sum(np.abs(u * u_trans - a))\n",
    "            err_2 = np.sum(np.abs(v * v_trans - b))\n",
    "        else:\n",
    "            return u, v\n",
    "\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(nb.__version__)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# np.show_config()\n",
    "# print(np.__version__)\n",
    "# # np.__config__.show()\n",
    "# from numpy.distutils.system_info import get_info\n",
    "# info = get_info('blas_opt')\n",
    "# print(info)\n",
    "# config.THREADING_LAYER = 'threadsafe'\n",
    "# print(\"Threading layer chosen: %s\" % threading_layer())\n",
    "\n",
    "# nb.set_num_threads(16)\n",
    "# nb.config.NUMBA_DEFAULT_NUM_THREADS, nb.config.NUMBA_NUM_THREADS"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# proxf_ = lambda x: nonneg_projection(x -  step * C_)\n",
    "# proxg_ = lambda x: generalized_doubly_stochastic_matrices_projection_(x, p, q)"
   ]
  }
 ],
 "metadata": {
  "interpreter": {
   "hash": "d5ba264c5f4101a9468be457e73710a096a733042fc21294adfce058d6ef15df"
  },
  "kernelspec": {
   "display_name": "Python [conda env:common]",
   "language": "python",
   "name": "conda-env-common-py"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.10"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
