

<!DOCTYPE html>
<html class="writer-html5" lang="en" >
<head>
  <meta charset="utf-8">
  
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  
  <title>deeprobust.image.optimizer &mdash; DeepRobust 0.1.1 documentation</title>
  

  
  <link rel="stylesheet" href="../../../_static/css/theme.css" type="text/css" />
  <link rel="stylesheet" href="../../../_static/pygments.css" type="text/css" />

  
  
  
  

  
  <!--[if lt IE 9]>
    <script src="../../../_static/js/html5shiv.min.js"></script>
  <![endif]-->
  
    
      <script type="text/javascript" id="documentation_options" data-url_root="../../../" src="../../../_static/documentation_options.js"></script>
        <script type="text/javascript" src="../../../_static/jquery.js"></script>
        <script type="text/javascript" src="../../../_static/underscore.js"></script>
        <script type="text/javascript" src="../../../_static/doctools.js"></script>
        <script type="text/javascript" src="../../../_static/language_data.js"></script>
        <script async="async" type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/latest.js?config=TeX-AMS-MML_HTMLorMML"></script>
    
    <script type="text/javascript" src="../../../_static/js/theme.js"></script>

    
    <link rel="index" title="Index" href="../../../genindex.html" />
    <link rel="search" title="Search" href="../../../search.html" /> 
</head>

<body class="wy-body-for-nav">

   
  <div class="wy-grid-for-nav">
    
    <nav data-toggle="wy-nav-shift" class="wy-nav-side">
      <div class="wy-side-scroll">
        <div class="wy-side-nav-search" >
          

          
            <a href="../../../index.html" class="icon icon-home" alt="Documentation Home"> DeepRobust
          

          
          </a>

          
            
            
          

          
<div role="search">
  <form id="rtd-search-form" class="wy-form" action="../../../search.html" method="get">
    <input type="text" name="q" placeholder="Search docs" />
    <input type="hidden" name="check_keywords" value="yes" />
    <input type="hidden" name="area" value="default" />
  </form>
</div>

          
        </div>

        
        <div class="wy-menu wy-menu-vertical" data-spy="affix" role="navigation" aria-label="main navigation">
          
            
            
              
            
            
              <p class="caption"><span class="caption-text">Installation</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../notes/installation.html">Installation</a></li>
</ul>
<p class="caption"><span class="caption-text">Graph Package</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../graph/data.html">Graph Dataset</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../graph/attack.html">Introduction to Graph Attack with Examples</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../graph/defense.html">Introduction to Graph Defense with Examples</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../graph/pyg.html">Using PyTorch Geometric in DeepRobust</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../graph/node_embedding.html">Node Embedding Attack and Defense</a></li>
</ul>
<p class="caption"><span class="caption-text">Image Package</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../image/example.html">Image Attack and Defense</a></li>
</ul>
<p class="caption"><span class="caption-text">Image Package</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.image.attack.html">deeprobust.image.attack package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.image.defense.html">deeprobust.image.defense package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.image.netmodels.html">deeprobust.image.netmodels package</a></li>
</ul>
<p class="caption"><span class="caption-text">Graph Package</span></p>
<ul>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.graph.global_attack.html">deeprobust.graph.global_attack package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.graph.targeted_attack.html">deeprobust.graph.targeted_attack package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.graph.defense.html">deeprobust.graph.defense package</a></li>
<li class="toctree-l1"><a class="reference internal" href="../../../source/deeprobust.graph.data.html">deeprobust.graph.data package</a></li>
</ul>

            
          
        </div>
        
      </div>
    </nav>

    <section data-toggle="wy-nav-shift" class="wy-nav-content-wrap">

      
      <nav class="wy-nav-top" aria-label="top navigation">
        
          <i data-toggle="wy-nav-top" class="fa fa-bars"></i>
          <a href="../../../index.html">DeepRobust</a>
        
      </nav>


      <div class="wy-nav-content">
        
        <div class="rst-content">
        
          















<div role="navigation" aria-label="breadcrumbs navigation">

  <ul class="wy-breadcrumbs">
    
      <li><a href="../../../index.html" class="icon icon-home"></a> &raquo;</li>
        
          <li><a href="../../index.html">Module code</a> &raquo;</li>
        
      <li>deeprobust.image.optimizer</li>
    
    
      <li class="wy-breadcrumbs-aside">
        
      </li>
    
  </ul>

  
  <hr/>
</div>
          <div role="main" class="document" itemscope="itemscope" itemtype="http://schema.org/Article">
           <div itemprop="articleBody">
            
  <h1>Source code for deeprobust.image.optimizer</h1><div class="highlight"><pre>
<span></span><span class="sd">&quot;&quot;&quot;</span>
<span class="sd">This module include the following optimizer:</span>
<span class="sd">1. differential_evolution:</span>
<span class="sd">The differential evolution global optimization algorithm</span>
<span class="sd">https://github.com/scipy/scipy/blob/70e61dee181de23fdd8d893eaa9491100e2218d7/scipy/optimize/_differentialevolution.py</span>

<span class="sd">modified by:</span>
<span class="sd">https://github.com/DebangLi/one-pixel-attack-pytorch/blob/master/differential_evolution.py</span>

<span class="sd">2. Basic Adam Optimizer</span>

<span class="sd">&quot;&quot;&quot;</span>

<span class="kn">from</span> <span class="nn">__future__</span> <span class="kn">import</span> <span class="n">division</span><span class="p">,</span> <span class="n">print_function</span><span class="p">,</span> <span class="n">absolute_import</span>
<span class="kn">import</span> <span class="nn">numpy</span> <span class="k">as</span> <span class="nn">np</span>
<span class="kn">from</span> <span class="nn">scipy.optimize</span> <span class="kn">import</span> <span class="n">OptimizeResult</span><span class="p">,</span> <span class="n">minimize</span>
<span class="kn">from</span> <span class="nn">scipy.optimize.optimize</span> <span class="kn">import</span> <span class="n">_status_message</span>
<span class="kn">from</span> <span class="nn">scipy._lib._util</span> <span class="kn">import</span> <span class="n">check_random_state</span>
<span class="kn">import</span> <span class="nn">warnings</span>


<span class="n">__all__</span> <span class="o">=</span> <span class="p">[</span><span class="s1">&#39;differential_evolution&#39;</span><span class="p">,</span> <span class="s1">&#39;AdamOptimizer&#39;</span><span class="p">]</span>

<span class="n">_MACHEPS</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">finfo</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">float64</span><span class="p">)</span><span class="o">.</span><span class="n">eps</span>


<div class="viewcode-block" id="differential_evolution"><a class="viewcode-back" href="../../../source/deeprobust.image.html#deeprobust.image.optimizer.differential_evolution">[docs]</a><span class="k">def</span> <span class="nf">differential_evolution</span><span class="p">(</span><span class="n">func</span><span class="p">,</span> <span class="n">bounds</span><span class="p">,</span> <span class="n">args</span><span class="o">=</span><span class="p">(),</span> <span class="n">strategy</span><span class="o">=</span><span class="s1">&#39;best1bin&#39;</span><span class="p">,</span>
                           <span class="n">maxiter</span><span class="o">=</span><span class="mi">1000</span><span class="p">,</span> <span class="n">popsize</span><span class="o">=</span><span class="mi">15</span><span class="p">,</span> <span class="n">tol</span><span class="o">=</span><span class="mf">0.01</span><span class="p">,</span>
                           <span class="n">mutation</span><span class="o">=</span><span class="p">(</span><span class="mf">0.5</span><span class="p">,</span> <span class="mi">1</span><span class="p">),</span> <span class="n">recombination</span><span class="o">=</span><span class="mf">0.7</span><span class="p">,</span> <span class="n">seed</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span>
                           <span class="n">callback</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span> <span class="n">disp</span><span class="o">=</span><span class="kc">False</span><span class="p">,</span> <span class="n">polish</span><span class="o">=</span><span class="kc">True</span><span class="p">,</span>
                           <span class="n">init</span><span class="o">=</span><span class="s1">&#39;latinhypercube&#39;</span><span class="p">,</span> <span class="n">atol</span><span class="o">=</span><span class="mi">0</span><span class="p">):</span>
    <span class="sd">&quot;&quot;&quot;Finds the global minimum of a multivariate function.</span>
<span class="sd">    Differential Evolution is stochastic in nature (does not use gradient</span>
<span class="sd">    methods) to find the minimium, and can search large areas of candidate</span>
<span class="sd">    space, but often requires larger numbers of function evaluations than</span>
<span class="sd">    conventional gradient based techniques.</span>
<span class="sd">    The algorithm is due to Storn and Price [1]_.</span>
<span class="sd">    Parameters</span>
<span class="sd">    ----------</span>
<span class="sd">    func : callable</span>
<span class="sd">        The objective function to be minimized.  Must be in the form</span>
<span class="sd">        ``f(x, *args)``, where ``x`` is the argument in the form of a 1-D array</span>
<span class="sd">        and ``args`` is a  tuple of any additional fixed parameters needed to</span>
<span class="sd">        completely specify the function.</span>
<span class="sd">    bounds : sequence</span>
<span class="sd">        Bounds for variables.  ``(min, max)`` pairs for each element in ``x``,</span>
<span class="sd">        defining the lower and upper bounds for the optimizing argument of</span>
<span class="sd">        `func`. It is required to have ``len(bounds) == len(x)``.</span>
<span class="sd">        ``len(bounds)`` is used to determine the number of parameters in ``x``.</span>
<span class="sd">    args : tuple, optional</span>
<span class="sd">        Any additional fixed parameters needed to</span>
<span class="sd">        completely specify the objective function.</span>
<span class="sd">    strategy : str, optional</span>
<span class="sd">        The differential evolution strategy to use. Should be one of:</span>
<span class="sd">            - &#39;best1bin&#39;</span>
<span class="sd">            - &#39;best1exp&#39;</span>
<span class="sd">            - &#39;rand1exp&#39;</span>
<span class="sd">            - &#39;randtobest1exp&#39;</span>
<span class="sd">            - &#39;currenttobest1exp&#39;</span>
<span class="sd">            - &#39;best2exp&#39;</span>
<span class="sd">            - &#39;rand2exp&#39;</span>
<span class="sd">            - &#39;randtobest1bin&#39;</span>
<span class="sd">            - &#39;currenttobest1bin&#39;</span>
<span class="sd">            - &#39;best2bin&#39;</span>
<span class="sd">            - &#39;rand2bin&#39;</span>
<span class="sd">            - &#39;rand1bin&#39;</span>
<span class="sd">        The default is &#39;best1bin&#39;.</span>
<span class="sd">    maxiter : int, optional</span>
<span class="sd">        The maximum number of generations over which the entire population is</span>
<span class="sd">        evolved. The maximum number of function evaluations (with no polishing)</span>
<span class="sd">        is: ``(maxiter + 1) * popsize * len(x)``</span>
<span class="sd">    popsize : int, optional</span>
<span class="sd">        A multiplier for setting the total population size.  The population has</span>
<span class="sd">        ``popsize * len(x)`` individuals (unless the initial population is</span>
<span class="sd">        supplied via the `init` keyword).</span>
<span class="sd">    tol : float, optional</span>
<span class="sd">        Relative tolerance for convergence, the solving stops when</span>
<span class="sd">        ``np.std(pop) &lt;= atol + tol * np.abs(np.mean(population_energies))``,</span>
<span class="sd">        where and `atol` and `tol` are the absolute and relative tolerance</span>
<span class="sd">        respectively.</span>
<span class="sd">    mutation : float or tuple(float, float), optional</span>
<span class="sd">        The mutation constant. In the literature this is also known as</span>
<span class="sd">        differential weight, being denoted by F.</span>
<span class="sd">        If specified as a float it should be in the range [0, 2].</span>
<span class="sd">        If specified as a tuple ``(min, max)`` dithering is employed. Dithering</span>
<span class="sd">        randomly changes the mutation constant on a generation by generation</span>
<span class="sd">        basis. The mutation constant for that generation is taken from</span>
<span class="sd">        ``U[min, max)``. Dithering can help speed convergence significantly.</span>
<span class="sd">        Increasing the mutation constant increases the search radius, but will</span>
<span class="sd">        slow down convergence.</span>
<span class="sd">    recombination : float, optional</span>
<span class="sd">        The recombination constant, should be in the range [0, 1]. In the</span>
<span class="sd">        literature this is also known as the crossover probability, being</span>
<span class="sd">        denoted by CR. Increasing this value allows a larger number of mutants</span>
<span class="sd">        to progress into the next generation, but at the risk of population</span>
<span class="sd">        stability.</span>
<span class="sd">    seed : int or `np.random.RandomState`, optional</span>
<span class="sd">        If `seed` is not specified the `np.RandomState` singleton is used.</span>
<span class="sd">        If `seed` is an int, a new `np.random.RandomState` instance is used,</span>
<span class="sd">        seeded with seed.</span>
<span class="sd">        If `seed` is already a `np.random.RandomState instance`, then that</span>
<span class="sd">        `np.random.RandomState` instance is used.</span>
<span class="sd">        Specify `seed` for repeatable minimizations.</span>
<span class="sd">    disp : bool, optional</span>
<span class="sd">        Display status messages</span>
<span class="sd">    callback : callable, `callback(xk, convergence=val)`, optional</span>
<span class="sd">        A function to follow the progress of the minimization. ``xk`` is</span>
<span class="sd">        the current value of ``x0``. ``val`` represents the fractional</span>
<span class="sd">        value of the population convergence.  When ``val`` is greater than one</span>
<span class="sd">        the function halts. If callback returns `True`, then the minimization</span>
<span class="sd">        is halted (any polishing is still carried out).</span>
<span class="sd">    polish : bool, optional</span>
<span class="sd">        If True (default), then `scipy.optimize.minimize` with the `L-BFGS-B`</span>
<span class="sd">        method is used to polish the best population member at the end, which</span>
<span class="sd">        can improve the minimization slightly.</span>
<span class="sd">    init : str or array-like, optional</span>
<span class="sd">        Specify which type of population initialization is performed. Should be</span>
<span class="sd">        one of:</span>
<span class="sd">            - &#39;latinhypercube&#39;</span>
<span class="sd">            - &#39;random&#39;</span>
<span class="sd">            - array specifying the initial population. The array should have</span>
<span class="sd">              shape ``(M, len(x))``, where len(x) is the number of parameters.</span>
<span class="sd">              `init` is clipped to `bounds` before use.</span>
<span class="sd">        The default is &#39;latinhypercube&#39;. Latin Hypercube sampling tries to</span>
<span class="sd">        maximize coverage of the available parameter space. &#39;random&#39;</span>
<span class="sd">        initializes the population randomly - this has the drawback that</span>
<span class="sd">        clustering can occur, preventing the whole of parameter space being</span>
<span class="sd">        covered. Use of an array to specify a population subset could be used,</span>
<span class="sd">        for example, to create a tight bunch of initial guesses in an location</span>
<span class="sd">        where the solution is known to exist, thereby reducing time for</span>
<span class="sd">        convergence.</span>
<span class="sd">    atol : float, optional</span>
<span class="sd">        Absolute tolerance for convergence, the solving stops when</span>
<span class="sd">        ``np.std(pop) &lt;= atol + tol * np.abs(np.mean(population_energies))``,</span>
<span class="sd">        where and `atol` and `tol` are the absolute and relative tolerance</span>
<span class="sd">        respectively.</span>
<span class="sd">    Returns</span>
<span class="sd">    -------</span>
<span class="sd">    res : OptimizeResult</span>
<span class="sd">        The optimization result represented as a `OptimizeResult` object.</span>
<span class="sd">        Important attributes are: ``x`` the solution array, ``success`` a</span>
<span class="sd">        Boolean flag indicating if the optimizer exited successfully and</span>
<span class="sd">        ``message`` which describes the cause of the termination. See</span>
<span class="sd">        `OptimizeResult` for a description of other attributes.  If `polish`</span>
<span class="sd">        was employed, and a lower minimum was obtained by the polishing, then</span>
<span class="sd">        OptimizeResult also contains the ``jac`` attribute.</span>
<span class="sd">    Notes</span>
<span class="sd">    -----</span>
<span class="sd">    Differential evolution is a stochastic population based method that is</span>
<span class="sd">    useful for global optimization problems. At each pass through the population</span>
<span class="sd">    the algorithm mutates each candidate solution by mixing with other candidate</span>
<span class="sd">    solutions to create a trial candidate. There are several strategies [2]_ for</span>
<span class="sd">    creating trial candidates, which suit some problems more than others. The</span>
<span class="sd">    &#39;best1bin&#39; strategy is a good starting point for many systems. In this</span>
<span class="sd">    strategy two members of the population are randomly chosen. Their difference</span>
<span class="sd">    is used to mutate the best member (the `best` in `best1bin`), :math:`b_0`,</span>
<span class="sd">    so far:</span>
<span class="sd">    .. math::</span>
<span class="sd">        b&#39; = b_0 + mutation * (population[rand0] - population[rand1])</span>
<span class="sd">    A trial vector is then constructed. Starting with a randomly chosen &#39;i&#39;th</span>
<span class="sd">    parameter the trial is sequentially filled (in modulo) with parameters from</span>
<span class="sd">    `b&#39;` or the original candidate. The choice of whether to use `b&#39;` or the</span>
<span class="sd">    original candidate is made with a binomial distribution (the &#39;bin&#39; in</span>
<span class="sd">    &#39;best1bin&#39;) - a random number in [0, 1) is generated.  If this number is</span>
<span class="sd">    less than the `recombination` constant then the parameter is loaded from</span>
<span class="sd">    `b&#39;`, otherwise it is loaded from the original candidate.  The final</span>
<span class="sd">    parameter is always loaded from `b&#39;`.  Once the trial candidate is built</span>
<span class="sd">    its fitness is assessed. If the trial is better than the original candidate</span>
<span class="sd">    then it takes its place. If it is also better than the best overall</span>
<span class="sd">    candidate it also replaces that.</span>
<span class="sd">    To improve your chances of finding a global minimum use higher `popsize`</span>
<span class="sd">    values, with higher `mutation` and (dithering), but lower `recombination`</span>
<span class="sd">    values. This has the effect of widening the search radius, but slowing</span>
<span class="sd">    convergence.</span>
<span class="sd">    .. versionadded:: 0.15.0</span>

<span class="sd">    References</span>
<span class="sd">    ----------</span>
<span class="sd">    .. [1] Storn, R and Price, K, Differential Evolution - a Simple and</span>
<span class="sd">           Efficient Heuristic for Global Optimization over Continuous Spaces,</span>
<span class="sd">           Journal of Global Optimization, 1997, 11, 341 - 359.</span>
<span class="sd">    .. [2] http://www1.icsi.berkeley.edu/~storn/code.html</span>
<span class="sd">    .. [3] http://en.wikipedia.org/wiki/Differential_evolution</span>
<span class="sd">    &quot;&quot;&quot;</span>

    <span class="n">solver</span> <span class="o">=</span> <span class="n">DifferentialEvolutionSolver</span><span class="p">(</span><span class="n">func</span><span class="p">,</span> <span class="n">bounds</span><span class="p">,</span> <span class="n">args</span><span class="o">=</span><span class="n">args</span><span class="p">,</span>
                                         <span class="n">strategy</span><span class="o">=</span><span class="n">strategy</span><span class="p">,</span> <span class="n">maxiter</span><span class="o">=</span><span class="n">maxiter</span><span class="p">,</span>
                                         <span class="n">popsize</span><span class="o">=</span><span class="n">popsize</span><span class="p">,</span> <span class="n">tol</span><span class="o">=</span><span class="n">tol</span><span class="p">,</span>
                                         <span class="n">mutation</span><span class="o">=</span><span class="n">mutation</span><span class="p">,</span>
                                         <span class="n">recombination</span><span class="o">=</span><span class="n">recombination</span><span class="p">,</span>
                                         <span class="n">seed</span><span class="o">=</span><span class="n">seed</span><span class="p">,</span> <span class="n">polish</span><span class="o">=</span><span class="n">polish</span><span class="p">,</span>
                                         <span class="n">callback</span><span class="o">=</span><span class="n">callback</span><span class="p">,</span>
                                         <span class="n">disp</span><span class="o">=</span><span class="n">disp</span><span class="p">,</span> <span class="n">init</span><span class="o">=</span><span class="n">init</span><span class="p">,</span> <span class="n">atol</span><span class="o">=</span><span class="n">atol</span><span class="p">)</span>
    <span class="k">return</span> <span class="n">solver</span><span class="o">.</span><span class="n">solve</span><span class="p">()</span></div>


<span class="k">class</span> <span class="nc">DifferentialEvolutionSolver</span><span class="p">(</span><span class="nb">object</span><span class="p">):</span>

    <span class="sd">&quot;&quot;&quot;This class implements the differential evolution solver</span>
<span class="sd">    Parameters</span>
<span class="sd">    ----------</span>
<span class="sd">    func : callable</span>
<span class="sd">        The objective function to be minimized.  Must be in the form</span>
<span class="sd">        ``f(x, *args)``, where ``x`` is the argument in the form of a 1-D array</span>
<span class="sd">        and ``args`` is a  tuple of any additional fixed parameters needed to</span>
<span class="sd">        completely specify the function.</span>
<span class="sd">    bounds : sequence</span>
<span class="sd">        Bounds for variables.  ``(min, max)`` pairs for each element in ``x``,</span>
<span class="sd">        defining the lower and upper bounds for the optimizing argument of</span>
<span class="sd">        `func`. It is required to have ``len(bounds) == len(x)``.</span>
<span class="sd">        ``len(bounds)`` is used to determine the number of parameters in ``x``.</span>
<span class="sd">    args : tuple, optional</span>
<span class="sd">        Any additional fixed parameters needed to</span>
<span class="sd">        completely specify the objective function.</span>
<span class="sd">    strategy : str, optional</span>
<span class="sd">        The differential evolution strategy to use. Should be one of:</span>
<span class="sd">            - &#39;best1bin&#39;</span>
<span class="sd">            - &#39;best1exp&#39;</span>
<span class="sd">            - &#39;rand1exp&#39;</span>
<span class="sd">            - &#39;randtobest1exp&#39;</span>
<span class="sd">            - &#39;currenttobest1exp&#39;</span>
<span class="sd">            - &#39;best2exp&#39;</span>
<span class="sd">            - &#39;rand2exp&#39;</span>
<span class="sd">            - &#39;randtobest1bin&#39;</span>
<span class="sd">            - &#39;currenttobest1bin&#39;</span>
<span class="sd">            - &#39;best2bin&#39;</span>
<span class="sd">            - &#39;rand2bin&#39;</span>
<span class="sd">            - &#39;rand1bin&#39;</span>
<span class="sd">        The default is &#39;best1bin&#39;</span>
<span class="sd">    maxiter : int, optional</span>
<span class="sd">        The maximum number of generations over which the entire population is</span>
<span class="sd">        evolved. The maximum number of function evaluations (with no polishing)</span>
<span class="sd">        is: ``(maxiter + 1) * popsize * len(x)``</span>
<span class="sd">    popsize : int, optional</span>
<span class="sd">        A multiplier for setting the total population size.  The population has</span>
<span class="sd">        ``popsize * len(x)`` individuals (unless the initial population is</span>
<span class="sd">        supplied via the `init` keyword).</span>
<span class="sd">    tol : float, optional</span>
<span class="sd">        Relative tolerance for convergence, the solving stops when</span>
<span class="sd">        ``np.std(pop) &lt;= atol + tol * np.abs(np.mean(population_energies))``,</span>
<span class="sd">        where and `atol` and `tol` are the absolute and relative tolerance</span>
<span class="sd">        respectively.</span>
<span class="sd">    mutation : float or tuple(float, float), optional</span>
<span class="sd">        The mutation constant. In the literature this is also known as</span>
<span class="sd">        differential weight, being denoted by F.</span>
<span class="sd">        If specified as a float it should be in the range [0, 2].</span>
<span class="sd">        If specified as a tuple ``(min, max)`` dithering is employed. Dithering</span>
<span class="sd">        randomly changes the mutation constant on a generation by generation</span>
<span class="sd">        basis. The mutation constant for that generation is taken from</span>
<span class="sd">        U[min, max). Dithering can help speed convergence significantly.</span>
<span class="sd">        Increasing the mutation constant increases the search radius, but will</span>
<span class="sd">        slow down convergence.</span>
<span class="sd">    recombination : float, optional</span>
<span class="sd">        The recombination constant, should be in the range [0, 1]. In the</span>
<span class="sd">        literature this is also known as the crossover probability, being</span>
<span class="sd">        denoted by CR. Increasing this value allows a larger number of mutants</span>
<span class="sd">        to progress into the next generation, but at the risk of population</span>
<span class="sd">        stability.</span>
<span class="sd">    seed : int or `np.random.RandomState`, optional</span>
<span class="sd">        If `seed` is not specified the `np.random.RandomState` singleton is</span>
<span class="sd">        used.</span>
<span class="sd">        If `seed` is an int, a new `np.random.RandomState` instance is used,</span>
<span class="sd">        seeded with `seed`.</span>
<span class="sd">        If `seed` is already a `np.random.RandomState` instance, then that</span>
<span class="sd">        `np.random.RandomState` instance is used.</span>
<span class="sd">        Specify `seed` for repeatable minimizations.</span>
<span class="sd">    disp : bool, optional</span>
<span class="sd">        Display status messages</span>
<span class="sd">    callback : callable, `callback(xk, convergence=val)`, optional</span>
<span class="sd">        A function to follow the progress of the minimization. ``xk`` is</span>
<span class="sd">        the current value of ``x0``. ``val`` represents the fractional</span>
<span class="sd">        value of the population convergence.  When ``val`` is greater than one</span>
<span class="sd">        the function halts. If callback returns `True`, then the minimization</span>
<span class="sd">        is halted (any polishing is still carried out).</span>
<span class="sd">    polish : bool, optional</span>
<span class="sd">        If True, then `scipy.optimize.minimize` with the `L-BFGS-B` method</span>
<span class="sd">        is used to polish the best population member at the end. This requires</span>
<span class="sd">        a few more function evaluations.</span>
<span class="sd">    maxfun : int, optional</span>
<span class="sd">        Set the maximum number of function evaluations. However, it probably</span>
<span class="sd">        makes more sense to set `maxiter` instead.</span>
<span class="sd">    init : str or array-like, optional</span>
<span class="sd">        Specify which type of population initialization is performed. Should be</span>
<span class="sd">        one of:</span>
<span class="sd">            - &#39;latinhypercube&#39;</span>
<span class="sd">            - &#39;random&#39;</span>
<span class="sd">            - array specifying the initial population. The array should have</span>
<span class="sd">              shape ``(M, len(x))``, where len(x) is the number of parameters.</span>
<span class="sd">              `init` is clipped to `bounds` before use.</span>
<span class="sd">        The default is &#39;latinhypercube&#39;. Latin Hypercube sampling tries to</span>
<span class="sd">        maximize coverage of the available parameter space. &#39;random&#39;</span>
<span class="sd">        initializes the population randomly - this has the drawback that</span>
<span class="sd">        clustering can occur, preventing the whole of parameter space being</span>
<span class="sd">        covered. Use of an array to specify a population could be used, for</span>
<span class="sd">        example, to create a tight bunch of initial guesses in an location</span>
<span class="sd">        where the solution is known to exist, thereby reducing time for</span>
<span class="sd">        convergence.</span>
<span class="sd">    atol : float, optional</span>
<span class="sd">        Absolute tolerance for convergence, the solving stops when</span>
<span class="sd">        ``np.std(pop) &lt;= atol + tol * np.abs(np.mean(population_energies))``,</span>
<span class="sd">        where and `atol` and `tol` are the absolute and relative tolerance</span>
<span class="sd">        respectively.</span>
<span class="sd">    &quot;&quot;&quot;</span>

    <span class="c1"># Dispatch of mutation strategy method (binomial or exponential).</span>
    <span class="n">_binomial</span> <span class="o">=</span> <span class="p">{</span><span class="s1">&#39;best1bin&#39;</span><span class="p">:</span> <span class="s1">&#39;_best1&#39;</span><span class="p">,</span>
                 <span class="s1">&#39;randtobest1bin&#39;</span><span class="p">:</span> <span class="s1">&#39;_randtobest1&#39;</span><span class="p">,</span>
                 <span class="s1">&#39;currenttobest1bin&#39;</span><span class="p">:</span> <span class="s1">&#39;_currenttobest1&#39;</span><span class="p">,</span>
                 <span class="s1">&#39;best2bin&#39;</span><span class="p">:</span> <span class="s1">&#39;_best2&#39;</span><span class="p">,</span>
                 <span class="s1">&#39;rand2bin&#39;</span><span class="p">:</span> <span class="s1">&#39;_rand2&#39;</span><span class="p">,</span>
                 <span class="s1">&#39;rand1bin&#39;</span><span class="p">:</span> <span class="s1">&#39;_rand1&#39;</span><span class="p">}</span>
    <span class="n">_exponential</span> <span class="o">=</span> <span class="p">{</span><span class="s1">&#39;best1exp&#39;</span><span class="p">:</span> <span class="s1">&#39;_best1&#39;</span><span class="p">,</span>
                    <span class="s1">&#39;rand1exp&#39;</span><span class="p">:</span> <span class="s1">&#39;_rand1&#39;</span><span class="p">,</span>
                    <span class="s1">&#39;randtobest1exp&#39;</span><span class="p">:</span> <span class="s1">&#39;_randtobest1&#39;</span><span class="p">,</span>
                    <span class="s1">&#39;currenttobest1exp&#39;</span><span class="p">:</span> <span class="s1">&#39;_currenttobest1&#39;</span><span class="p">,</span>
                    <span class="s1">&#39;best2exp&#39;</span><span class="p">:</span> <span class="s1">&#39;_best2&#39;</span><span class="p">,</span>
                    <span class="s1">&#39;rand2exp&#39;</span><span class="p">:</span> <span class="s1">&#39;_rand2&#39;</span><span class="p">}</span>

    <span class="n">__init_error_msg</span> <span class="o">=</span> <span class="p">(</span><span class="s2">&quot;The population initialization method must be one of &quot;</span>
                        <span class="s2">&quot;&#39;latinhypercube&#39; or &#39;random&#39;, or an array of shape &quot;</span>
                        <span class="s2">&quot;(M, N) where N is the number of parameters and M&gt;5&quot;</span><span class="p">)</span>

    <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">func</span><span class="p">,</span> <span class="n">bounds</span><span class="p">,</span> <span class="n">args</span><span class="o">=</span><span class="p">(),</span>
                 <span class="n">strategy</span><span class="o">=</span><span class="s1">&#39;best1bin&#39;</span><span class="p">,</span> <span class="n">maxiter</span><span class="o">=</span><span class="mi">1000</span><span class="p">,</span> <span class="n">popsize</span><span class="o">=</span><span class="mi">15</span><span class="p">,</span>
                 <span class="n">tol</span><span class="o">=</span><span class="mf">0.01</span><span class="p">,</span> <span class="n">mutation</span><span class="o">=</span><span class="p">(</span><span class="mf">0.5</span><span class="p">,</span> <span class="mi">1</span><span class="p">),</span> <span class="n">recombination</span><span class="o">=</span><span class="mf">0.7</span><span class="p">,</span> <span class="n">seed</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span>
                 <span class="n">maxfun</span><span class="o">=</span><span class="n">np</span><span class="o">.</span><span class="n">inf</span><span class="p">,</span> <span class="n">callback</span><span class="o">=</span><span class="kc">None</span><span class="p">,</span> <span class="n">disp</span><span class="o">=</span><span class="kc">False</span><span class="p">,</span> <span class="n">polish</span><span class="o">=</span><span class="kc">True</span><span class="p">,</span>
                 <span class="n">init</span><span class="o">=</span><span class="s1">&#39;latinhypercube&#39;</span><span class="p">,</span> <span class="n">atol</span><span class="o">=</span><span class="mi">0</span><span class="p">):</span>

        <span class="k">if</span> <span class="n">strategy</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">_binomial</span><span class="p">:</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">mutation_func</span> <span class="o">=</span> <span class="nb">getattr</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">_binomial</span><span class="p">[</span><span class="n">strategy</span><span class="p">])</span>
        <span class="k">elif</span> <span class="n">strategy</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">_exponential</span><span class="p">:</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">mutation_func</span> <span class="o">=</span> <span class="nb">getattr</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">_exponential</span><span class="p">[</span><span class="n">strategy</span><span class="p">])</span>
        <span class="k">else</span><span class="p">:</span>
            <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="s2">&quot;Please select a valid mutation strategy&quot;</span><span class="p">)</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">strategy</span> <span class="o">=</span> <span class="n">strategy</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">callback</span> <span class="o">=</span> <span class="n">callback</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">polish</span> <span class="o">=</span> <span class="n">polish</span>

        <span class="c1"># relative and absolute tolerances for convergence</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">tol</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">atol</span> <span class="o">=</span> <span class="n">tol</span><span class="p">,</span> <span class="n">atol</span>

        <span class="c1"># Mutation constant should be in [0, 2). If specified as a sequence</span>
        <span class="c1"># then dithering is performed.</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">=</span> <span class="n">mutation</span>
        <span class="k">if</span> <span class="p">(</span><span class="ow">not</span> <span class="n">np</span><span class="o">.</span><span class="n">all</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">isfinite</span><span class="p">(</span><span class="n">mutation</span><span class="p">))</span> <span class="ow">or</span>
                <span class="n">np</span><span class="o">.</span><span class="n">any</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">(</span><span class="n">mutation</span><span class="p">)</span> <span class="o">&gt;=</span> <span class="mi">2</span><span class="p">)</span> <span class="ow">or</span>
                <span class="n">np</span><span class="o">.</span><span class="n">any</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">(</span><span class="n">mutation</span><span class="p">)</span> <span class="o">&lt;</span> <span class="mi">0</span><span class="p">)):</span>
            <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="s1">&#39;The mutation constant must be a float in &#39;</span>
                             <span class="s1">&#39;U[0, 2), or specified as a tuple(min, max)&#39;</span>
                             <span class="s1">&#39; where min &lt; max and min, max are in U[0, 2).&#39;</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">dither</span> <span class="o">=</span> <span class="kc">None</span>
        <span class="k">if</span> <span class="nb">hasattr</span><span class="p">(</span><span class="n">mutation</span><span class="p">,</span> <span class="s1">&#39;__iter__&#39;</span><span class="p">)</span> <span class="ow">and</span> <span class="nb">len</span><span class="p">(</span><span class="n">mutation</span><span class="p">)</span> <span class="o">&gt;</span> <span class="mi">1</span><span class="p">:</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">dither</span> <span class="o">=</span> <span class="p">[</span><span class="n">mutation</span><span class="p">[</span><span class="mi">0</span><span class="p">],</span> <span class="n">mutation</span><span class="p">[</span><span class="mi">1</span><span class="p">]]</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">dither</span><span class="o">.</span><span class="n">sort</span><span class="p">()</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">cross_over_probability</span> <span class="o">=</span> <span class="n">recombination</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">func</span> <span class="o">=</span> <span class="n">func</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">args</span> <span class="o">=</span> <span class="n">args</span>

        <span class="c1"># convert tuple of lower and upper bounds to limits</span>
        <span class="c1"># [(low_0, high_0), ..., (low_n, high_n]</span>
        <span class="c1">#     -&gt; [[low_0, ..., low_n], [high_0, ..., high_n]]</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">limits</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">(</span><span class="n">bounds</span><span class="p">,</span> <span class="n">dtype</span><span class="o">=</span><span class="s1">&#39;float&#39;</span><span class="p">)</span><span class="o">.</span><span class="n">T</span>
        <span class="k">if</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">size</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">,</span> <span class="mi">0</span><span class="p">)</span> <span class="o">!=</span> <span class="mi">2</span> <span class="ow">or</span> <span class="ow">not</span>
                <span class="n">np</span><span class="o">.</span><span class="n">all</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">isfinite</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">))):</span>
            <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="s1">&#39;bounds should be a sequence containing &#39;</span>
                             <span class="s1">&#39;real valued (min, max) pairs for each value&#39;</span>
                             <span class="s1">&#39; in x&#39;</span><span class="p">)</span>

        <span class="k">if</span> <span class="n">maxiter</span> <span class="ow">is</span> <span class="kc">None</span><span class="p">:</span>  <span class="c1"># the default used to be None</span>
            <span class="n">maxiter</span> <span class="o">=</span> <span class="mi">1000</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">maxiter</span> <span class="o">=</span> <span class="n">maxiter</span>
        <span class="k">if</span> <span class="n">maxfun</span> <span class="ow">is</span> <span class="kc">None</span><span class="p">:</span>  <span class="c1"># the default used to be None</span>
            <span class="n">maxfun</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">inf</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">maxfun</span> <span class="o">=</span> <span class="n">maxfun</span>

        <span class="c1"># population is scaled to between [0, 1].</span>
        <span class="c1"># We have to scale between parameter &lt;-&gt; population</span>
        <span class="c1"># save these arguments for _scale_parameter and</span>
        <span class="c1"># _unscale_parameter. This is an optimization</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">__scale_arg1</span> <span class="o">=</span> <span class="mf">0.5</span> <span class="o">*</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">[</span><span class="mi">1</span><span class="p">])</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">__scale_arg2</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">fabs</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">[</span><span class="mi">1</span><span class="p">])</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">size</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="p">,</span> <span class="mi">1</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span> <span class="o">=</span> <span class="n">check_random_state</span><span class="p">(</span><span class="n">seed</span><span class="p">)</span>

        <span class="c1"># default population initialization is a latin hypercube design, but</span>
        <span class="c1"># there are other population initializations possible.</span>
        <span class="c1"># the minimum is 5 because &#39;best2bin&#39; requires a population that&#39;s at</span>
        <span class="c1"># least 5 long</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span> <span class="o">=</span> <span class="nb">max</span><span class="p">(</span><span class="mi">5</span><span class="p">,</span> <span class="n">popsize</span> <span class="o">*</span> <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">population_shape</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">,</span>
                                 <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">=</span> <span class="mi">0</span>
        <span class="k">if</span> <span class="nb">isinstance</span><span class="p">(</span><span class="n">init</span><span class="p">,</span> <span class="nb">str</span><span class="p">):</span>
            <span class="k">if</span> <span class="n">init</span> <span class="o">==</span> <span class="s1">&#39;latinhypercube&#39;</span><span class="p">:</span>
                <span class="bp">self</span><span class="o">.</span><span class="n">init_population_lhs</span><span class="p">()</span>
            <span class="k">elif</span> <span class="n">init</span> <span class="o">==</span> <span class="s1">&#39;random&#39;</span><span class="p">:</span>
                <span class="bp">self</span><span class="o">.</span><span class="n">init_population_random</span><span class="p">()</span>
            <span class="k">else</span><span class="p">:</span>
                <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">__init_error_msg</span><span class="p">)</span>
        <span class="k">else</span><span class="p">:</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">init_population_array</span><span class="p">(</span><span class="n">init</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">disp</span> <span class="o">=</span> <span class="n">disp</span>

    <span class="k">def</span> <span class="nf">init_population_lhs</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Initializes the population with Latin Hypercube Sampling.</span>
<span class="sd">        Latin Hypercube Sampling ensures that each parameter is uniformly</span>
<span class="sd">        sampled over its range.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">rng</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span>

        <span class="c1"># Each parameter range needs to be sampled uniformly. The scaled</span>
        <span class="c1"># parameter range ([0, 1)) needs to be split into</span>
        <span class="c1"># `self.num_population_members` segments, each of which has the following</span>
        <span class="c1"># size:</span>
        <span class="n">segsize</span> <span class="o">=</span> <span class="mf">1.0</span> <span class="o">/</span> <span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span>

        <span class="c1"># Within each segment we sample from a uniform random distribution.</span>
        <span class="c1"># We need to do this sampling for each parameter.</span>
        <span class="n">samples</span> <span class="o">=</span> <span class="p">(</span><span class="n">segsize</span> <span class="o">*</span> <span class="n">rng</span><span class="o">.</span><span class="n">random_sample</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_shape</span><span class="p">)</span>

        <span class="c1"># Offset each segment to cover the entire parameter range [0, 1)</span>
                   <span class="o">+</span> <span class="n">np</span><span class="o">.</span><span class="n">linspace</span><span class="p">(</span><span class="mf">0.</span><span class="p">,</span> <span class="mf">1.</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">,</span>
                                 <span class="n">endpoint</span><span class="o">=</span><span class="kc">False</span><span class="p">)[:,</span> <span class="n">np</span><span class="o">.</span><span class="n">newaxis</span><span class="p">])</span>

        <span class="c1"># Create an array for population of candidate solutions.</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">zeros_like</span><span class="p">(</span><span class="n">samples</span><span class="p">)</span>

        <span class="c1"># Initialize population of candidate solutions by permutation of the</span>
        <span class="c1"># random samples.</span>
        <span class="k">for</span> <span class="n">j</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span><span class="p">):</span>
            <span class="n">order</span> <span class="o">=</span> <span class="n">rng</span><span class="o">.</span><span class="n">permutation</span><span class="p">(</span><span class="nb">range</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">))</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[:,</span> <span class="n">j</span><span class="p">]</span> <span class="o">=</span> <span class="n">samples</span><span class="p">[</span><span class="n">order</span><span class="p">,</span> <span class="n">j</span><span class="p">]</span>

        <span class="c1"># reset population energies</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span> <span class="o">=</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">ones</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">)</span> <span class="o">*</span>
                                    <span class="n">np</span><span class="o">.</span><span class="n">inf</span><span class="p">)</span>

        <span class="c1"># reset number of function evaluations counter</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">=</span> <span class="mi">0</span>

    <span class="k">def</span> <span class="nf">init_population_random</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Initialises the population at random.  This type of initialization</span>
<span class="sd">        can possess clustering, Latin Hypercube sampling is generally better.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">rng</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population</span> <span class="o">=</span> <span class="n">rng</span><span class="o">.</span><span class="n">random_sample</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_shape</span><span class="p">)</span>

        <span class="c1"># reset population energies</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span> <span class="o">=</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">ones</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">)</span> <span class="o">*</span>
                                    <span class="n">np</span><span class="o">.</span><span class="n">inf</span><span class="p">)</span>

        <span class="c1"># reset number of function evaluations counter</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">=</span> <span class="mi">0</span>

    <span class="k">def</span> <span class="nf">init_population_array</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">init</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Initialises the population with a user specified population.</span>
<span class="sd">        Parameters</span>
<span class="sd">        ----------</span>
<span class="sd">        init : np.ndarray</span>
<span class="sd">            Array specifying subset of the initial population. The array should</span>
<span class="sd">            have shape (M, len(x)), where len(x) is the number of parameters.</span>
<span class="sd">            The population is clipped to the lower and upper `bounds`.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="c1"># make sure you&#39;re using a float array</span>
        <span class="n">popn</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">asfarray</span><span class="p">(</span><span class="n">init</span><span class="p">)</span>

        <span class="k">if</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">size</span><span class="p">(</span><span class="n">popn</span><span class="p">,</span> <span class="mi">0</span><span class="p">)</span> <span class="o">&lt;</span> <span class="mi">5</span> <span class="ow">or</span>
                <span class="n">popn</span><span class="o">.</span><span class="n">shape</span><span class="p">[</span><span class="mi">1</span><span class="p">]</span> <span class="o">!=</span> <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span> <span class="ow">or</span>
                <span class="nb">len</span><span class="p">(</span><span class="n">popn</span><span class="o">.</span><span class="n">shape</span><span class="p">)</span> <span class="o">!=</span> <span class="mi">2</span><span class="p">):</span>
            <span class="k">raise</span> <span class="ne">ValueError</span><span class="p">(</span><span class="s2">&quot;The population supplied needs to have shape&quot;</span>
                             <span class="s2">&quot; (M, len(x)), where M &gt; 4.&quot;</span><span class="p">)</span>

        <span class="c1"># scale values and clip to bounds, assigning to population</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">clip</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">_unscale_parameters</span><span class="p">(</span><span class="n">popn</span><span class="p">),</span> <span class="mi">0</span><span class="p">,</span> <span class="mi">1</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">size</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">,</span> <span class="mi">0</span><span class="p">)</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">population_shape</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">,</span>
                                 <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span><span class="p">)</span>

        <span class="c1"># reset population energies</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span> <span class="o">=</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">ones</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">)</span> <span class="o">*</span>
                                    <span class="n">np</span><span class="o">.</span><span class="n">inf</span><span class="p">)</span>

        <span class="c1"># reset number of function evaluations counter</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">=</span> <span class="mi">0</span>

    <span class="nd">@property</span>
    <span class="k">def</span> <span class="nf">x</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        The best solution from the solver</span>
<span class="sd">        Returns</span>
<span class="sd">        -------</span>
<span class="sd">        x : ndarray</span>
<span class="sd">            The best solution from the solver.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">_scale_parameters</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">])</span>

    <span class="nd">@property</span>
    <span class="k">def</span> <span class="nf">convergence</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        The standard deviation of the population energies divided by their</span>
<span class="sd">        mean.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="k">return</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">std</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)</span> <span class="o">/</span>
                <span class="n">np</span><span class="o">.</span><span class="n">abs</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)</span> <span class="o">+</span> <span class="n">_MACHEPS</span><span class="p">))</span>

    <span class="k">def</span> <span class="nf">solve</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Runs the DifferentialEvolutionSolver.</span>
<span class="sd">        Returns</span>
<span class="sd">        -------</span>
<span class="sd">        res : OptimizeResult</span>
<span class="sd">            The optimization result represented as a ``OptimizeResult`` object.</span>
<span class="sd">            Important attributes are: ``x`` the solution array, ``success`` a</span>
<span class="sd">            Boolean flag indicating if the optimizer exited successfully and</span>
<span class="sd">            ``message`` which describes the cause of the termination. See</span>
<span class="sd">            `OptimizeResult` for a description of other attributes.  If `polish`</span>
<span class="sd">            was employed, and a lower minimum was obtained by the polishing,</span>
<span class="sd">            then OptimizeResult also contains the ``jac`` attribute.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">nit</span><span class="p">,</span> <span class="n">warning_flag</span> <span class="o">=</span> <span class="mi">0</span><span class="p">,</span> <span class="kc">False</span>
        <span class="n">status_message</span> <span class="o">=</span> <span class="n">_status_message</span><span class="p">[</span><span class="s1">&#39;success&#39;</span><span class="p">]</span>

        <span class="c1"># The population may have just been initialized (all entries are</span>
        <span class="c1"># np.inf). If it has you have to calculate the initial energies.</span>
        <span class="c1"># Although this is also done in the evolve generator it&#39;s possible</span>
        <span class="c1"># that someone can set maxiter=0, at which point we still want the</span>
        <span class="c1"># initial energies to be calculated (the following loop isn&#39;t run).</span>
        <span class="k">if</span> <span class="n">np</span><span class="o">.</span><span class="n">all</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">isinf</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)):</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">_calculate_population_energies</span><span class="p">()</span>

        <span class="c1"># do the optimisation.</span>
        <span class="k">for</span> <span class="n">nit</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="mi">1</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">maxiter</span> <span class="o">+</span> <span class="mi">1</span><span class="p">):</span>
            <span class="c1"># evolve the population by a generation</span>
            <span class="k">try</span><span class="p">:</span>
                <span class="nb">next</span><span class="p">(</span><span class="bp">self</span><span class="p">)</span>
            <span class="k">except</span> <span class="ne">StopIteration</span><span class="p">:</span>
                <span class="n">warning_flag</span> <span class="o">=</span> <span class="kc">True</span>
                <span class="n">status_message</span> <span class="o">=</span> <span class="n">_status_message</span><span class="p">[</span><span class="s1">&#39;maxfev&#39;</span><span class="p">]</span>
                <span class="k">break</span>

            <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">disp</span><span class="p">:</span>
                <span class="nb">print</span><span class="p">(</span><span class="s2">&quot;differential_evolution step </span><span class="si">%d</span><span class="s2">: f(x)= </span><span class="si">%g</span><span class="s2">&quot;</span>
                      <span class="o">%</span> <span class="p">(</span><span class="n">nit</span><span class="p">,</span>
                         <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]))</span>

            <span class="c1"># should the solver terminate?</span>
            <span class="n">convergence</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">convergence</span>

            <span class="k">if</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">callback</span> <span class="ow">and</span>
                    <span class="bp">self</span><span class="o">.</span><span class="n">callback</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">_scale_parameters</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]),</span>
                                  <span class="n">convergence</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">tol</span> <span class="o">/</span> <span class="n">convergence</span><span class="p">)</span> <span class="ow">is</span> <span class="kc">True</span><span class="p">):</span>

                <span class="n">warning_flag</span> <span class="o">=</span> <span class="kc">True</span>
                <span class="n">status_message</span> <span class="o">=</span> <span class="p">(</span><span class="s1">&#39;callback function requested stop early &#39;</span>
                                  <span class="s1">&#39;by returning True&#39;</span><span class="p">)</span>
                <span class="k">break</span>

            <span class="n">intol</span> <span class="o">=</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">std</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)</span> <span class="o">&lt;=</span>
                     <span class="bp">self</span><span class="o">.</span><span class="n">atol</span> <span class="o">+</span>
                     <span class="bp">self</span><span class="o">.</span><span class="n">tol</span> <span class="o">*</span> <span class="n">np</span><span class="o">.</span><span class="n">abs</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">mean</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)))</span>
            <span class="k">if</span> <span class="n">warning_flag</span> <span class="ow">or</span> <span class="n">intol</span><span class="p">:</span>
                <span class="k">break</span>

        <span class="k">else</span><span class="p">:</span>
            <span class="n">status_message</span> <span class="o">=</span> <span class="n">_status_message</span><span class="p">[</span><span class="s1">&#39;maxiter&#39;</span><span class="p">]</span>
            <span class="n">warning_flag</span> <span class="o">=</span> <span class="kc">True</span>

        <span class="n">DE_result</span> <span class="o">=</span> <span class="n">OptimizeResult</span><span class="p">(</span>
            <span class="n">x</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">x</span><span class="p">,</span>
            <span class="n">fun</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">],</span>
            <span class="n">nfev</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span><span class="p">,</span>
            <span class="n">nit</span><span class="o">=</span><span class="n">nit</span><span class="p">,</span>
            <span class="n">message</span><span class="o">=</span><span class="n">status_message</span><span class="p">,</span>
            <span class="n">success</span><span class="o">=</span><span class="p">(</span><span class="n">warning_flag</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">True</span><span class="p">))</span>

        <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">polish</span><span class="p">:</span>
            <span class="n">result</span> <span class="o">=</span> <span class="n">minimize</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">func</span><span class="p">,</span>
                              <span class="n">np</span><span class="o">.</span><span class="n">copy</span><span class="p">(</span><span class="n">DE_result</span><span class="o">.</span><span class="n">x</span><span class="p">),</span>
                              <span class="n">method</span><span class="o">=</span><span class="s1">&#39;L-BFGS-B&#39;</span><span class="p">,</span>
                              <span class="n">bounds</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">limits</span><span class="o">.</span><span class="n">T</span><span class="p">,</span>
                              <span class="n">args</span><span class="o">=</span><span class="bp">self</span><span class="o">.</span><span class="n">args</span><span class="p">)</span>

            <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">+=</span> <span class="n">result</span><span class="o">.</span><span class="n">nfev</span>
            <span class="n">DE_result</span><span class="o">.</span><span class="n">nfev</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span>

            <span class="k">if</span> <span class="n">result</span><span class="o">.</span><span class="n">fun</span> <span class="o">&lt;</span> <span class="n">DE_result</span><span class="o">.</span><span class="n">fun</span><span class="p">:</span>
                <span class="n">DE_result</span><span class="o">.</span><span class="n">fun</span> <span class="o">=</span> <span class="n">result</span><span class="o">.</span><span class="n">fun</span>
                <span class="n">DE_result</span><span class="o">.</span><span class="n">x</span> <span class="o">=</span> <span class="n">result</span><span class="o">.</span><span class="n">x</span>
                <span class="n">DE_result</span><span class="o">.</span><span class="n">jac</span> <span class="o">=</span> <span class="n">result</span><span class="o">.</span><span class="n">jac</span>
                <span class="c1"># to keep internal state consistent</span>
                <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">=</span> <span class="n">result</span><span class="o">.</span><span class="n">fun</span>
                <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">_unscale_parameters</span><span class="p">(</span><span class="n">result</span><span class="o">.</span><span class="n">x</span><span class="p">)</span>

        <span class="k">return</span> <span class="n">DE_result</span>

    <span class="k">def</span> <span class="nf">_calculate_population_energies</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Calculate the energies of all the population members at the same time.</span>
<span class="sd">        Puts the best member in first place. Useful if the population has just</span>
<span class="sd">        been initialised.</span>
<span class="sd">        &quot;&quot;&quot;</span>

        <span class="c1">##############</span>
        <span class="c1">## CHANGES: self.func operates on the entire parameters array</span>
        <span class="c1">##############</span>
        <span class="n">itersize</span> <span class="o">=</span> <span class="nb">max</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="nb">min</span><span class="p">(</span><span class="nb">len</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">),</span> <span class="bp">self</span><span class="o">.</span><span class="n">maxfun</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">+</span> <span class="mi">1</span><span class="p">))</span>
        <span class="n">candidates</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[:</span><span class="n">itersize</span><span class="p">]</span>
        <span class="n">parameters</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="bp">self</span><span class="o">.</span><span class="n">_scale_parameters</span><span class="p">(</span><span class="n">c</span><span class="p">)</span> <span class="k">for</span> <span class="n">c</span> <span class="ow">in</span> <span class="n">candidates</span><span class="p">])</span> <span class="c1"># TODO: vectorize</span>
        <span class="n">energies</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">func</span><span class="p">(</span><span class="n">parameters</span><span class="p">,</span> <span class="o">*</span><span class="bp">self</span><span class="o">.</span><span class="n">args</span><span class="p">)</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span> <span class="o">=</span> <span class="n">energies</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">+=</span> <span class="n">itersize</span>

        <span class="c1"># for index, candidate in enumerate(self.population):</span>
        <span class="c1">#     if self._nfev &gt; self.maxfun:</span>
        <span class="c1">#         break</span>

        <span class="c1">#     parameters = self._scale_parameters(candidate)</span>
        <span class="c1">#     self.population_energies[index] = self.func(parameters,</span>
        <span class="c1">#                                                 *self.args)</span>
        <span class="c1">#     self._nfev += 1</span>

        <span class="c1">##############</span>
        <span class="c1">##############</span>



        <span class="n">minval</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">argmin</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)</span>

        <span class="c1"># put the lowest energy into the best solution position.</span>
        <span class="n">lowest_energy</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="n">minval</span><span class="p">]</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="n">minval</span><span class="p">]</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">=</span> <span class="n">lowest_energy</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[[</span><span class="mi">0</span><span class="p">,</span> <span class="n">minval</span><span class="p">],</span> <span class="p">:]</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[[</span><span class="n">minval</span><span class="p">,</span> <span class="mi">0</span><span class="p">],</span> <span class="p">:]</span>

    <span class="k">def</span> <span class="fm">__iter__</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="k">return</span> <span class="bp">self</span>

    <span class="k">def</span> <span class="fm">__next__</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Evolve the population by a single generation</span>
<span class="sd">        Returns</span>
<span class="sd">        -------</span>
<span class="sd">        x : ndarray</span>
<span class="sd">            The best solution from the solver.</span>
<span class="sd">        fun : float</span>
<span class="sd">            Value of objective function obtained from the best solution.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="c1"># the population may have just been initialized (all entries are</span>
        <span class="c1"># np.inf). If it has you have to calculate the initial energies</span>
        <span class="k">if</span> <span class="n">np</span><span class="o">.</span><span class="n">all</span><span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">isinf</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">)):</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">_calculate_population_energies</span><span class="p">()</span>

        <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">dither</span> <span class="ow">is</span> <span class="ow">not</span> <span class="kc">None</span><span class="p">:</span>
            <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span><span class="o">.</span><span class="n">rand</span><span class="p">()</span>
                          <span class="o">*</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">dither</span><span class="p">[</span><span class="mi">1</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">dither</span><span class="p">[</span><span class="mi">0</span><span class="p">])</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">dither</span><span class="p">[</span><span class="mi">0</span><span class="p">])</span>

        <span class="c1">##############</span>
        <span class="c1">## CHANGES: self.func operates on the entire parameters array</span>
        <span class="c1">##############</span>

        <span class="n">itersize</span> <span class="o">=</span> <span class="nb">max</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="nb">min</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">maxfun</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">+</span> <span class="mi">1</span><span class="p">))</span>
        <span class="n">trials</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="bp">self</span><span class="o">.</span><span class="n">_mutate</span><span class="p">(</span><span class="n">c</span><span class="p">)</span> <span class="k">for</span> <span class="n">c</span> <span class="ow">in</span> <span class="nb">range</span><span class="p">(</span><span class="n">itersize</span><span class="p">)])</span> <span class="c1"># TODO: vectorize</span>
        <span class="k">for</span> <span class="n">trial</span> <span class="ow">in</span> <span class="n">trials</span><span class="p">:</span> <span class="bp">self</span><span class="o">.</span><span class="n">_ensure_constraint</span><span class="p">(</span><span class="n">trial</span><span class="p">)</span>
        <span class="n">parameters</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">array</span><span class="p">([</span><span class="bp">self</span><span class="o">.</span><span class="n">_scale_parameters</span><span class="p">(</span><span class="n">trial</span><span class="p">)</span> <span class="k">for</span> <span class="n">trial</span> <span class="ow">in</span> <span class="n">trials</span><span class="p">])</span>
        <span class="n">energies</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">func</span><span class="p">(</span><span class="n">parameters</span><span class="p">,</span> <span class="o">*</span><span class="bp">self</span><span class="o">.</span><span class="n">args</span><span class="p">)</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">_nfev</span> <span class="o">+=</span> <span class="n">itersize</span>

        <span class="k">for</span> <span class="n">candidate</span><span class="p">,(</span><span class="n">energy</span><span class="p">,</span><span class="n">trial</span><span class="p">)</span> <span class="ow">in</span> <span class="nb">enumerate</span><span class="p">(</span><span class="nb">zip</span><span class="p">(</span><span class="n">energies</span><span class="p">,</span> <span class="n">trials</span><span class="p">)):</span>
            <span class="c1"># if the energy of the trial candidate is lower than the</span>
            <span class="c1"># original population member then replace it</span>
            <span class="k">if</span> <span class="n">energy</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="n">candidate</span><span class="p">]:</span>
                <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">candidate</span><span class="p">]</span> <span class="o">=</span> <span class="n">trial</span>
                <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="n">candidate</span><span class="p">]</span> <span class="o">=</span> <span class="n">energy</span>

                <span class="c1"># if the trial candidate also has a lower energy than the</span>
                <span class="c1"># best solution then replace that as well</span>
                <span class="k">if</span> <span class="n">energy</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]:</span>
                    <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">=</span> <span class="n">energy</span>
                    <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">=</span> <span class="n">trial</span>

        <span class="c1"># for candidate in range(self.num_population_members):</span>
        <span class="c1">#     if self._nfev &gt; self.maxfun:</span>
        <span class="c1">#         raise StopIteration</span>

        <span class="c1">#     # create a trial solution</span>
        <span class="c1">#     trial = self._mutate(candidate)</span>

        <span class="c1">#     # ensuring that it&#39;s in the range [0, 1)</span>
        <span class="c1">#     self._ensure_constraint(trial)</span>

        <span class="c1">#     # scale from [0, 1) to the actual parameter value</span>
        <span class="c1">#     parameters = self._scale_parameters(trial)</span>

        <span class="c1">#     # determine the energy of the objective function</span>
        <span class="c1">#     energy = self.func(parameters, *self.args)</span>
        <span class="c1">#     self._nfev += 1</span>

        <span class="c1">#     # if the energy of the trial candidate is lower than the</span>
        <span class="c1">#     # original population member then replace it</span>
        <span class="c1">#     if energy &lt; self.population_energies[candidate]:</span>
        <span class="c1">#         self.population[candidate] = trial</span>
        <span class="c1">#         self.population_energies[candidate] = energy</span>

        <span class="c1">#         # if the trial candidate also has a lower energy than the</span>
        <span class="c1">#         # best solution then replace that as well</span>
        <span class="c1">#         if energy &lt; self.population_energies[0]:</span>
        <span class="c1">#             self.population_energies[0] = energy</span>
        <span class="c1">#             self.population[0] = trial</span>

        <span class="c1">##############</span>
        <span class="c1">##############</span>

        <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">x</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">population_energies</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span>

    <span class="k">def</span> <span class="nf">next</span><span class="p">(</span><span class="bp">self</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        Evolve the population by a single generation</span>
<span class="sd">        Returns</span>
<span class="sd">        -------</span>
<span class="sd">        x : ndarray</span>
<span class="sd">            The best solution from the solver.</span>
<span class="sd">        fun : float</span>
<span class="sd">            Value of objective function obtained from the best solution.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="c1"># next() is required for compatibility with Python2.7.</span>
        <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="fm">__next__</span><span class="p">()</span>

    <span class="k">def</span> <span class="nf">_scale_parameters</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">trial</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        scale from a number between 0 and 1 to parameters.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="k">return</span> <span class="bp">self</span><span class="o">.</span><span class="n">__scale_arg1</span> <span class="o">+</span> <span class="p">(</span><span class="n">trial</span> <span class="o">-</span> <span class="mf">0.5</span><span class="p">)</span> <span class="o">*</span> <span class="bp">self</span><span class="o">.</span><span class="n">__scale_arg2</span>

    <span class="k">def</span> <span class="nf">_unscale_parameters</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">parameters</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        scale from parameters to a number between 0 and 1.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="k">return</span> <span class="p">(</span><span class="n">parameters</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">__scale_arg1</span><span class="p">)</span> <span class="o">/</span> <span class="bp">self</span><span class="o">.</span><span class="n">__scale_arg2</span> <span class="o">+</span> <span class="mf">0.5</span>

    <span class="k">def</span> <span class="nf">_ensure_constraint</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">trial</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        make sure the parameters lie between the limits</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="k">for</span> <span class="n">index</span> <span class="ow">in</span> <span class="n">np</span><span class="o">.</span><span class="n">where</span><span class="p">((</span><span class="n">trial</span> <span class="o">&lt;</span> <span class="mi">0</span><span class="p">)</span> <span class="o">|</span> <span class="p">(</span><span class="n">trial</span> <span class="o">&gt;</span> <span class="mi">1</span><span class="p">))[</span><span class="mi">0</span><span class="p">]:</span>
            <span class="n">trial</span><span class="p">[</span><span class="n">index</span><span class="p">]</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span><span class="o">.</span><span class="n">rand</span><span class="p">()</span>

    <span class="k">def</span> <span class="nf">_mutate</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">candidate</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        create a trial vector based on a mutation strategy</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">trial</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">copy</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">candidate</span><span class="p">])</span>

        <span class="n">rng</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span>

        <span class="n">fill_point</span> <span class="o">=</span> <span class="n">rng</span><span class="o">.</span><span class="n">randint</span><span class="p">(</span><span class="mi">0</span><span class="p">,</span> <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span><span class="p">)</span>

        <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">strategy</span> <span class="ow">in</span> <span class="p">[</span><span class="s1">&#39;currenttobest1exp&#39;</span><span class="p">,</span> <span class="s1">&#39;currenttobest1bin&#39;</span><span class="p">]:</span>
            <span class="n">bprime</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">mutation_func</span><span class="p">(</span><span class="n">candidate</span><span class="p">,</span>
                                        <span class="bp">self</span><span class="o">.</span><span class="n">_select_samples</span><span class="p">(</span><span class="n">candidate</span><span class="p">,</span> <span class="mi">5</span><span class="p">))</span>
        <span class="k">else</span><span class="p">:</span>
            <span class="n">bprime</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">mutation_func</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">_select_samples</span><span class="p">(</span><span class="n">candidate</span><span class="p">,</span> <span class="mi">5</span><span class="p">))</span>

        <span class="k">if</span> <span class="bp">self</span><span class="o">.</span><span class="n">strategy</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">_binomial</span><span class="p">:</span>
            <span class="n">crossovers</span> <span class="o">=</span> <span class="n">rng</span><span class="o">.</span><span class="n">rand</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span><span class="p">)</span>
            <span class="n">crossovers</span> <span class="o">=</span> <span class="n">crossovers</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">cross_over_probability</span>
            <span class="c1"># the last one is always from the bprime vector for binomial</span>
            <span class="c1"># If you fill in modulo with a loop you have to set the last one to</span>
            <span class="c1"># true. If you don&#39;t use a loop then you can have any random entry</span>
            <span class="c1"># be True.</span>
            <span class="n">crossovers</span><span class="p">[</span><span class="n">fill_point</span><span class="p">]</span> <span class="o">=</span> <span class="kc">True</span>
            <span class="n">trial</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">where</span><span class="p">(</span><span class="n">crossovers</span><span class="p">,</span> <span class="n">bprime</span><span class="p">,</span> <span class="n">trial</span><span class="p">)</span>
            <span class="k">return</span> <span class="n">trial</span>

        <span class="k">elif</span> <span class="bp">self</span><span class="o">.</span><span class="n">strategy</span> <span class="ow">in</span> <span class="bp">self</span><span class="o">.</span><span class="n">_exponential</span><span class="p">:</span>
            <span class="n">i</span> <span class="o">=</span> <span class="mi">0</span>
            <span class="k">while</span> <span class="p">(</span><span class="n">i</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span> <span class="ow">and</span>
                   <span class="n">rng</span><span class="o">.</span><span class="n">rand</span><span class="p">()</span> <span class="o">&lt;</span> <span class="bp">self</span><span class="o">.</span><span class="n">cross_over_probability</span><span class="p">):</span>

                <span class="n">trial</span><span class="p">[</span><span class="n">fill_point</span><span class="p">]</span> <span class="o">=</span> <span class="n">bprime</span><span class="p">[</span><span class="n">fill_point</span><span class="p">]</span>
                <span class="n">fill_point</span> <span class="o">=</span> <span class="p">(</span><span class="n">fill_point</span> <span class="o">+</span> <span class="mi">1</span><span class="p">)</span> <span class="o">%</span> <span class="bp">self</span><span class="o">.</span><span class="n">parameter_count</span>
                <span class="n">i</span> <span class="o">+=</span> <span class="mi">1</span>

            <span class="k">return</span> <span class="n">trial</span>

    <span class="k">def</span> <span class="nf">_best1</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        best1bin, best1exp</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">r0</span><span class="p">,</span> <span class="n">r1</span> <span class="o">=</span> <span class="n">samples</span><span class="p">[:</span><span class="mi">2</span><span class="p">]</span>
        <span class="k">return</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span>
                <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r0</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r1</span><span class="p">]))</span>

    <span class="k">def</span> <span class="nf">_rand1</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        rand1bin, rand1exp</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">r0</span><span class="p">,</span> <span class="n">r1</span><span class="p">,</span> <span class="n">r2</span> <span class="o">=</span> <span class="n">samples</span><span class="p">[:</span><span class="mi">3</span><span class="p">]</span>
        <span class="k">return</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r0</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span>
                <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r1</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r2</span><span class="p">]))</span>

    <span class="k">def</span> <span class="nf">_randtobest1</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        randtobest1bin, randtobest1exp</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">r0</span><span class="p">,</span> <span class="n">r1</span><span class="p">,</span> <span class="n">r2</span> <span class="o">=</span> <span class="n">samples</span><span class="p">[:</span><span class="mi">3</span><span class="p">]</span>
        <span class="n">bprime</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">copy</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r0</span><span class="p">])</span>
        <span class="n">bprime</span> <span class="o">+=</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">-</span> <span class="n">bprime</span><span class="p">)</span>
        <span class="n">bprime</span> <span class="o">+=</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r1</span><span class="p">]</span> <span class="o">-</span>
                                <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r2</span><span class="p">])</span>
        <span class="k">return</span> <span class="n">bprime</span>

    <span class="k">def</span> <span class="nf">_currenttobest1</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">candidate</span><span class="p">,</span> <span class="n">samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        currenttobest1bin, currenttobest1exp</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">r0</span><span class="p">,</span> <span class="n">r1</span> <span class="o">=</span> <span class="n">samples</span><span class="p">[:</span><span class="mi">2</span><span class="p">]</span>
        <span class="n">bprime</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">candidate</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span>
                  <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">candidate</span><span class="p">]</span> <span class="o">+</span>
                   <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r0</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r1</span><span class="p">]))</span>
        <span class="k">return</span> <span class="n">bprime</span>

    <span class="k">def</span> <span class="nf">_best2</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        best2bin, best2exp</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">r0</span><span class="p">,</span> <span class="n">r1</span><span class="p">,</span> <span class="n">r2</span><span class="p">,</span> <span class="n">r3</span> <span class="o">=</span> <span class="n">samples</span><span class="p">[:</span><span class="mi">4</span><span class="p">]</span>
        <span class="n">bprime</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="mi">0</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span>
                  <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r0</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r1</span><span class="p">]</span> <span class="o">-</span>
                   <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r2</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r3</span><span class="p">]))</span>

        <span class="k">return</span> <span class="n">bprime</span>

    <span class="k">def</span> <span class="nf">_rand2</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        rand2bin, rand2exp</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">r0</span><span class="p">,</span> <span class="n">r1</span><span class="p">,</span> <span class="n">r2</span><span class="p">,</span> <span class="n">r3</span><span class="p">,</span> <span class="n">r4</span> <span class="o">=</span> <span class="n">samples</span>
        <span class="n">bprime</span> <span class="o">=</span> <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r0</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">scale</span> <span class="o">*</span>
                  <span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r1</span><span class="p">]</span> <span class="o">+</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r2</span><span class="p">]</span> <span class="o">-</span>
                   <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r3</span><span class="p">]</span> <span class="o">-</span> <span class="bp">self</span><span class="o">.</span><span class="n">population</span><span class="p">[</span><span class="n">r4</span><span class="p">]))</span>

        <span class="k">return</span> <span class="n">bprime</span>

    <span class="k">def</span> <span class="nf">_select_samples</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">candidate</span><span class="p">,</span> <span class="n">number_samples</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;</span>
<span class="sd">        obtain random integers from range(self.num_population_members),</span>
<span class="sd">        without replacement.  You can&#39;t have the original candidate either.</span>
<span class="sd">        &quot;&quot;&quot;</span>
        <span class="n">idxs</span> <span class="o">=</span> <span class="nb">list</span><span class="p">(</span><span class="nb">range</span><span class="p">(</span><span class="bp">self</span><span class="o">.</span><span class="n">num_population_members</span><span class="p">))</span>
        <span class="n">idxs</span><span class="o">.</span><span class="n">remove</span><span class="p">(</span><span class="n">candidate</span><span class="p">)</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">random_number_generator</span><span class="o">.</span><span class="n">shuffle</span><span class="p">(</span><span class="n">idxs</span><span class="p">)</span>
        <span class="n">idxs</span> <span class="o">=</span> <span class="n">idxs</span><span class="p">[:</span><span class="n">number_samples</span><span class="p">]</span>
        <span class="k">return</span> <span class="n">idxs</span>

<div class="viewcode-block" id="AdamOptimizer"><a class="viewcode-back" href="../../../source/deeprobust.image.html#deeprobust.image.optimizer.AdamOptimizer">[docs]</a><span class="k">class</span> <span class="nc">AdamOptimizer</span><span class="p">:</span>
    <span class="sd">&quot;&quot;&quot;Basic Adam optimizer implementation that can minimize w.r.t.</span>
<span class="sd">    a single variable.</span>
<span class="sd">    Parameters</span>
<span class="sd">    ----------</span>
<span class="sd">    shape : tuple</span>
<span class="sd">        shape of the variable w.r.t. which the loss should be minimized</span>
<span class="sd">    &quot;&quot;&quot;</span>
    <span class="c1">#TODO Add reference or rewrite the function.</span>
    <span class="k">def</span> <span class="fm">__init__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">shape</span><span class="p">):</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">m</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span><span class="n">shape</span><span class="p">)</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">v</span> <span class="o">=</span> <span class="n">np</span><span class="o">.</span><span class="n">zeros</span><span class="p">(</span><span class="n">shape</span><span class="p">)</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">t</span> <span class="o">=</span> <span class="mi">0</span>

    <span class="k">def</span> <span class="fm">__call__</span><span class="p">(</span><span class="bp">self</span><span class="p">,</span> <span class="n">gradient</span><span class="p">,</span> <span class="n">learning_rate</span><span class="p">,</span> <span class="n">beta1</span><span class="o">=</span><span class="mf">0.9</span><span class="p">,</span> <span class="n">beta2</span><span class="o">=</span><span class="mf">0.999</span><span class="p">,</span> <span class="n">epsilon</span><span class="o">=</span><span class="mf">1e-8</span><span class="p">):</span>
        <span class="sd">&quot;&quot;&quot;Updates internal parameters of the optimizer and returns</span>
<span class="sd">        the change that should be applied to the variable.</span>
<span class="sd">        Parameters</span>
<span class="sd">        ----------</span>
<span class="sd">        gradient : `np.ndarray`</span>
<span class="sd">            the gradient of the loss w.r.t. to the variable</span>
<span class="sd">        learning_rate: float</span>
<span class="sd">            the learning rate in the current iteration</span>
<span class="sd">        beta1: float</span>
<span class="sd">            decay rate for calculating the exponentially</span>
<span class="sd">            decaying average of past gradients</span>
<span class="sd">        beta2: float</span>
<span class="sd">            decay rate for calculating the exponentially</span>
<span class="sd">            decaying average of past squared gradients</span>
<span class="sd">        epsilon: float</span>
<span class="sd">            small value to avoid division by zero</span>
<span class="sd">        &quot;&quot;&quot;</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">t</span> <span class="o">+=</span> <span class="mi">1</span>

        <span class="bp">self</span><span class="o">.</span><span class="n">m</span> <span class="o">=</span> <span class="n">beta1</span> <span class="o">*</span> <span class="bp">self</span><span class="o">.</span><span class="n">m</span> <span class="o">+</span> <span class="p">(</span><span class="mi">1</span> <span class="o">-</span> <span class="n">beta1</span><span class="p">)</span> <span class="o">*</span> <span class="n">gradient</span>
        <span class="bp">self</span><span class="o">.</span><span class="n">v</span> <span class="o">=</span> <span class="n">beta2</span> <span class="o">*</span> <span class="bp">self</span><span class="o">.</span><span class="n">v</span> <span class="o">+</span> <span class="p">(</span><span class="mi">1</span> <span class="o">-</span> <span class="n">beta2</span><span class="p">)</span> <span class="o">*</span> <span class="n">gradient</span> <span class="o">**</span> <span class="mi">2</span>

        <span class="n">bias_correction_1</span> <span class="o">=</span> <span class="mi">1</span> <span class="o">-</span> <span class="n">beta1</span> <span class="o">**</span> <span class="bp">self</span><span class="o">.</span><span class="n">t</span>
        <span class="n">bias_correction_2</span> <span class="o">=</span> <span class="mi">1</span> <span class="o">-</span> <span class="n">beta2</span> <span class="o">**</span> <span class="bp">self</span><span class="o">.</span><span class="n">t</span>

        <span class="n">m_hat</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">m</span> <span class="o">/</span> <span class="n">bias_correction_1</span>
        <span class="n">v_hat</span> <span class="o">=</span> <span class="bp">self</span><span class="o">.</span><span class="n">v</span> <span class="o">/</span> <span class="n">bias_correction_2</span>

        <span class="k">return</span> <span class="o">-</span><span class="n">learning_rate</span> <span class="o">*</span> <span class="n">m_hat</span> <span class="o">/</span> <span class="p">(</span><span class="n">np</span><span class="o">.</span><span class="n">sqrt</span><span class="p">(</span><span class="n">v_hat</span><span class="p">)</span> <span class="o">+</span> <span class="n">epsilon</span><span class="p">)</span></div>
</pre></div>

           </div>
           
          </div>
          <footer>
  

  <hr/>

  <div role="contentinfo">
    <p>
        
        &copy; Copyright 

    </p>
  </div>
    
    
    
    Built with <a href="http://sphinx-doc.org/">Sphinx</a> using a
    
    <a href="https://github.com/rtfd/sphinx_rtd_theme">theme</a>
    
    provided by <a href="https://readthedocs.org">Read the Docs</a>. 

</footer>

        </div>
      </div>

    </section>

  </div>
  

  <script type="text/javascript">
      jQuery(function () {
          SphinxRtdTheme.Navigation.enable(true);
      });
  </script>

  
  
    
   

</body>
</html>