{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 14,
   "id": "e1f061a3",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Using matplotlib backend: MacOSX\n"
     ]
    }
   ],
   "source": [
    "#Extra_MWU\n",
    "\n",
    "from scipy.linalg import expm, sinm, cosm\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import math\n",
    "from mpl_toolkits.mplot3d import Axes3D\n",
    "%matplotlib inline\n",
    "%matplotlib auto\n",
    "\n",
    "plt.style.use('seaborn-white')\n",
    "%config InlineBackend.figure_format = 'svg'\n",
    "\n",
    "\n",
    "#training steps\n",
    "T =200\n",
    "\n",
    "#step size\n",
    "s = 0.8\n",
    "eta = 0.1\n",
    "\n",
    "# x,y\n",
    "x = np.zeros((T,2))\n",
    "y = np.zeros((T,2))\n",
    "\n",
    "x_hat = np.zeros((T,2))\n",
    "y_hat = np.zeros((T,2))\n",
    "\n",
    "\n",
    "# k use to store immediate strategy\n",
    "k_1 = np.zeros(T)\n",
    "k_2 = np.zeros(T)\n",
    "\n",
    "\n",
    "#define initial conditions on accumulated strategy / payoff\n",
    "\n",
    "\n",
    "\n",
    "x[0] = [0.8, 0.2]\n",
    "y[0] = [0.3, 0.7]\n",
    "\n",
    "\n",
    "\n",
    "k_1[0] = y[0][0]\n",
    "k_2[0] = y[0][1]\n",
    "\n",
    "\n",
    "def A(t):\n",
    "    if(t%2 == 0):\n",
    "        return np.array([[-1,1],[1,-1]])\n",
    "    else:\n",
    "        return np.array([[1,-1],[-1,1]])\n",
    "\n",
    "def A_21(t):\n",
    "    return np.array([[-1*A(t)[0][0],-1*A(t)[1][0]], [-1*A(t)[0][1],-1*A(t)[1][1]]])\n",
    "\n",
    "for t in range(0,T-1):\n",
    "        \n",
    "    \n",
    "    z = np.dot(A_21(t),x[t].T).T\n",
    "    d_1 = y[t][0] * math.exp(s*z[0]) + y[t][1] * math.exp(s*z[1]) \n",
    "    y_hat[t+1][0] = y[t][0] * math.exp(s*z[0])/d_1\n",
    "    y_hat[t+1][1] = y[t][1] * math.exp(s*z[1])/d_1\n",
    "    \n",
    "    w = np.dot(A(t),y[t].T).T\n",
    "    d_2 = x[t][0] * math.exp(s*w[0]) + x[t][1] * math.exp(s*w[1]) \n",
    "    x_hat[t+1][0] = x[t][0] * math.exp(s*w[0])/d_2\n",
    "    x_hat[t+1][1] = x[t][1] * math.exp(s*w[1])/d_2\n",
    "    \n",
    "    z_2 = np.dot(A_21(t),x_hat[t+1].T).T\n",
    "    d_3 = y[t][0] * math.exp(eta*z_2[0]) + y[t][1] * math.exp(eta*z_2[1])\n",
    "    y[t+1][0] = y[t][0] * math.exp(eta*z_2[0])/d_3\n",
    "    y[t+1][1] = y[t][1] * math.exp(eta*z_2[1])/d_3\n",
    "    \n",
    "    k_1[t+1] = y[t+1][0] \n",
    "    k_2[t+1] = y[t+1][1] \n",
    "    \n",
    "    w_2 = np.dot(A(t),y_hat[t+1].T).T\n",
    "    d_4 = x[t][0] * math.exp(eta*w_2[0]) + x[t][1] * math.exp(eta*w_2[1]) \n",
    "    x[t+1][0] = x[t][0] * math.exp(eta*w_2[0])/d_4\n",
    "    x[t+1][1] = x[t][1] * math.exp(eta*w_2[1])/d_4\n",
    "    \n",
    "plt.figure()\n",
    "\n",
    "plt.plot(k_1)\n",
    "plt.plot(k_2)\n",
    "\n",
    "plt.legend([\"Strategy 1\",\"Strategy 2\"])\n",
    "#plt.legend([\"Strategy 2\"])\n",
    "plt.show()  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "482422c2",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-2-bec91da08084>:112: RuntimeWarning: divide by zero encountered in double_scalars\n",
      "  return 1/2 * math.log(1/(2*x1)) + 1/2 * math.log(1/(2*x2)) + 1/2 * math.log(1/(2*y1)) + 1/2 * math.log(1/(2*y2))\n",
      "No handles with labels found to put in legend.\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Using matplotlib backend: MacOSX\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "<matplotlib.legend.Legend at 0x7fc889c80f10>"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# OMWU，Min_x Max_y\n",
    "\n",
    "from scipy.linalg import expm, sinm, cosm\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
    "import math\n",
    "from mpl_toolkits.mplot3d import Axes3D\n",
    "%matplotlib inline\n",
    "%matplotlib auto\n",
    "\n",
    "plt.style.use('seaborn-white')\n",
    "%config InlineBackend.figure_format = 'svg'\n",
    "\n",
    "#training steps\n",
    "T = 3000\n",
    "\n",
    "#step size\n",
    "s = 0.1\n",
    "\n",
    "# x,y\n",
    "x = np.zeros((T,2))\n",
    "y = np.zeros((T,2))\n",
    "\n",
    "Y = np.zeros((T,4))\n",
    "X = np.zeros((T,4))\n",
    "# k use to store immediate strategy\n",
    "k_1 = np.zeros(T)\n",
    "k_2 = np.zeros(T)\n",
    "\n",
    "k_3 = np.zeros(T)\n",
    "k_4 = np.zeros(T)\n",
    "\n",
    "m = np.zeros(T)\n",
    "\n",
    "\n",
    "x[0] = [0.3, 0.7]\n",
    "y[0] = [0.3, 0.7]\n",
    "\n",
    "x[1] = [0.3, 0.7]\n",
    "y[1] = [0.3, 0.7]\n",
    "\n",
    "\n",
    "k_1[0] = y[0][0]\n",
    "k_2[0] = y[1][0]\n",
    "\n",
    "k_3[0] = x[0][0]\n",
    "k_4[0] = x[1][0]\n",
    "\n",
    "value3 = np.zeros(T)\n",
    "value4 = np.zeros(T)\n",
    "value5 = np.zeros(T)\n",
    "\n",
    "\n",
    "def A(t):\n",
    "    if(t%2 == 0):\n",
    "        return np.array([[0,-1],[-1,0]])\n",
    "    else:\n",
    "       # return np.array([[0,1],[1,0]])\n",
    "        return np.array([[0,1],[1,0]])\n",
    "    \n",
    "def A_21(t):\n",
    "    return - A(t).T\n",
    "\n",
    "for t in range(1,T-1):\n",
    "    \n",
    "    z =  2*s*np.dot(x[t],A(t)) - s*np.dot(x[t-1],A(t-1))\n",
    "    d_1 = y[t][0] * math.exp(z[0]) + y[t][1] * math.exp(z[1]) \n",
    "    y[t+1][0] = y[t][0] * math.exp(z[0])/d_1\n",
    "    y[t+1][1] = y[t][1] * math.exp(z[1])/d_1\n",
    "    \n",
    "    \n",
    "    w =  - 2*s*np.dot(y[t],A(t).T) + s*np.dot(y[t-1],A(t-1).T)\n",
    "    d_2 = x[t][0] * math.exp(w[0]) + x[t][1] * math.exp(w[1]) \n",
    "    x[t+1][0] = x[t][0] * math.exp(w[0])/d_2\n",
    "    x[t+1][1] = x[t][1] * math.exp(w[1])/d_2\n",
    "    \n",
    "    Y[t] = [ w[0],w[1],z[0],z[1] ]\n",
    "    X[t+1] = [ x[t+1][0], x[t+1][1] , y[t+1][0] , y[t+1][1] ]\n",
    "    \n",
    "    k_1[t+1] = y[t+1][0] \n",
    "    k_2[t+1] = y[t+1][1] \n",
    "    \n",
    "    k_3[t+1] = x[t+1][0] \n",
    "    k_4[t+1] = x[t+1][1]\n",
    "    equi = [ 1/2, 1/2 , 1/2 , 1/2 ]\n",
    "    \n",
    "\n",
    "        \n",
    "k_1[0] = k_1[1]\n",
    "k_2[0] = k_2[1]\n",
    "    \n",
    "k_3[0] = k_3[1]\n",
    "k_4[0] = k_4[1]    \n",
    "\n",
    "def kl(x1,x2,y1,y2):\n",
    "    return 1/2 * math.log(1/(2*x1)) + 1/2 * math.log(1/(2*x2)) + 1/2 * math.log(1/(2*y1)) + 1/2 * math.log(1/(2*y2))\n",
    "\n",
    "    \n",
    "\n",
    "value = np.zeros(T)\n",
    "\n",
    "for t in range(0,T-1):\n",
    "    value[t] = kl( k_3[t] , k_4[t] , k_1[t] , k_2[t])\n",
    "    \n",
    "#for t in range(0,T-1):\n",
    "#    print( value[t+1] - value[t] ) \n",
    "    \n",
    "    \n",
    "value[T-1] = value[T-2]\n",
    "\n",
    "step = range(T)\n",
    "plt.scatter(step,value,s=4) \n",
    "plt.show()\n",
    "\n",
    "plt.title(\" \")\n",
    "plt.legend()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "522268f1",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "tensorflow",
   "language": "python",
   "name": "tensorflow"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
