{"metadata":{"kernelspec":{"language":"python","display_name":"Python 3","name":"python3"},"language_info":{"name":"python","version":"3.10.12","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"code","source":"!git clone https://github.com/zysophia/Doubly_Adaptive_MCMC.git\n%cd  Doubly_Adaptive_MCMC/src\nfrom gibbsChains import * \nfrom algorithms import * \nfrom meanEstimator import * \n\n\nimport torch\nfrom torch import nn\nimport numpy as np \nimport torch.autograd.functional as F\nfrom torch.autograd import Variable\nimport time \nimport pandas as pd ","metadata":{"_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","execution":{"iopub.status.busy":"2023-08-07T06:14:11.899482Z","iopub.execute_input":"2023-08-07T06:14:11.900025Z","iopub.status.idle":"2023-08-07T06:14:19.443679Z","shell.execute_reply.started":"2023-08-07T06:14:11.899998Z","shell.execute_reply":"2023-08-07T06:14:19.442608Z"},"trusted":true},"execution_count":1,"outputs":[{"name":"stdout","text":"Cloning into 'Doubly_Adaptive_MCMC'...\nremote: Enumerating objects: 92, done.\u001b[K\nremote: Counting objects: 100% (92/92), done.\u001b[K\nremote: Compressing objects: 100% (72/72), done.\u001b[K\nremote: Total 92 (delta 26), reused 81 (delta 19), pack-reused 0\u001b[K\nReceiving objects: 100% (92/92), 5.06 MiB | 10.15 MiB/s, done.\nResolving deltas: 100% (26/26), done.\n/kaggle/working/Doubly_Adaptive_MCMC/src\n","output_type":"stream"}]},{"cell_type":"code","source":"class CFG:\n    n = 4\n    beta = 0.02\n\n    \n    flag1 = 'w'\n    flag2 = 'v'\n    \n    times= 1\n\n    d = n**2\n\n    \n    M= 4\n    h = 0.01\n    N = 500\n    \n    epoch_stage_1=700\n    epoch_stage_2=50\n    \n    \n    optim = ['SGD','Adam'][1]\n    lr = 0.001\n    seed = 44\n    hidden_size = 108\n    \n    \n    lambda1 =1\n    lambda2 =1\n    \n    \n    print_step = 100\n    ","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:28:10.083158Z","iopub.execute_input":"2023-08-07T06:28:10.083532Z","iopub.status.idle":"2023-08-07T06:28:10.090490Z","shell.execute_reply.started":"2023-08-07T06:28:10.083501Z","shell.execute_reply":"2023-08-07T06:28:10.089538Z"},"trusted":true},"execution_count":34,"outputs":[]},{"cell_type":"code","source":"def get_values(T,n,beta):\n    chain = IsingChainLattice(n = n)\n    chain.beta= beta\n    uniform_mixing = chain.get_uniform_mixing()\n    chain.restart_and_sample(steps =uniform_mixing)\n    chainvals = [0 for _ in range(T)]\n    for t in range(T):\n        chain.step()\n        chainvals[t] = chain.current\n    return chainvals\n\n'''\ndef get_values():\n    gibbsChain1 = IsingChainLattice(n = CFG.n)\n    T=1\n    chain1vals = [0 for _ in range(T)]\n    for t in range(T):\n        gibbsChain1.step()\n        chain1vals[t] = gibbsChain1.current\n    return chain1vals\n'''\nchain = IsingChainLattice(n = CFG.n)\n## true_values\ndef get_true_values():\n    # MCMC-B\n    cs1 = [get_values(1,CFG.n,-0.02) for  i in range(100)]\n    cs2 = [get_values(1,CFG.n, 0) for  i in range(100)]\n    cs1 = np.array(cs1).reshape(100,CFG.n**2)\n    cs2 = np.array(cs2).reshape(100,CFG.n**2)\n\n    \n    ture1 = [np.exp(-CFG.beta/2*chain.get_Hamiltonian(cs1[i])) for i in range(cs1.shape[0])]\n    ture2 = [np.exp(CFG.beta/2*chain.get_Hamiltonian(cs2[i])) for i in range(cs2.shape[0])]\n    \n    wi = np.mean(ture1)\n    vi = np.mean(ture2)\n    z = vi/wi\n    return np.round(wi,decimals=7),np.round(vi,decimals=7),np.round(z,decimals=7)\n\nw_true,v_true,z_true = get_true_values()\nprint('w_true',w_true)\nprint('v_true',v_true)\nprint('z_true',z_true)\n\n## train chain \ncs1 = [get_values(1,CFG.n,-0.02) for  i in range(CFG.N)]\ncs1 = np.array(cs1).reshape(CFG.N,CFG.n**2)\n\ncs2 = [get_values(1,CFG.n,0) for  i in range(CFG.N)]\ncs2 = np.array(cs2).reshape(CFG.N,CFG.n**2)\n\n## MCMC-B-est\n\nwc1 = np.mean([np.exp(-CFG.beta/2*chain.get_Hamiltonian(cs1[i])) for i in range(cs1.shape[0])])# f\nvc1 = np.mean([np.exp(CFG.beta/2*chain.get_Hamiltonian(cs2[i])) for i in range(cs2.shape[0])])# g\nprint('wc1',wc1)\nprint('vc1',vc1)\nprint('zc1',vc1/wc1)\n\n\n\ndef get_Hamiltonian(X):\n    X_reshaped = X.view(CFG.n, CFG.n)\n    match = torch.zeros(1).cuda()\n    for p in range(CFG.n ** 2):\n        neighbors = [p + 1, p + CFG.n]\n        for neighbor in neighbors:\n            if 0 <= neighbor < CFG.n ** 2:\n                match += torch.where((X_reshaped.view(-1)[p] - X_reshaped.view(-1)[neighbor])==0,1,0)\n    return 1 + match\n\ndef seed_torch(seed):\n    torch.manual_seed(seed)\n    torch.cuda.manual_seed(seed)\n    torch.backends.cudnn.deterministic = True\nseed_torch(seed = CFG.seed)\n\ndef deltaW(N, m, h, seed,generator=None):\n    if generator is None:\n        generator = np.random.default_rng(seed=seed)\n    return generator.normal(0.0, np.sqrt(h), (N, m))\n\ndef get_wt(CFG,seed=1):\n    n,h,N,d = CFG.M,CFG.h,CFG.N,CFG.d\n    ts = np.array([i*h for i in range(n)])\n    w_t_increments = np.array([deltaW(N=n-1, m=d, h=h, generator=None,seed=int(i+seed)) for i in range(N)])\n    w_t = np.array([np.insert(np.cumsum(i.T),0,np.zeros(1)) for i in w_t_increments])\n    return w_t,ts,w_t_increments#.reshape(CFG.N,CFG.M-1)\n\ndef sinkhorn_loss(x, y, epsilon, n, niter):\n    C = cost_matrix(x, y)\n    mu = Variable(1. / n * torch.FloatTensor(n).fill_(1), requires_grad=False)\n    nu = Variable(1. / n * torch.FloatTensor(n).fill_(1), requires_grad=False)\n    rho = 1 \n    tau = -.8  \n    lam = rho / (rho + epsilon)  \n    thresh = 10**(-1) \n    def ave(u, u1):\n        return tau * u + (1 - tau) * u1\n    def M(u, v):\n        return (-C + u.unsqueeze(1) + v.unsqueeze(0)) / epsilon\n    def lse(A):\n        return torch.log(torch.exp(A).sum(1, keepdim=True) + 1e-6)\n    u, v, err = 0. * mu, 0. * nu, 0.\n    actual_nits = 0  \n    for i in range(niter):\n        u1 = u  \n        u = epsilon * (torch.log(mu) - lse(M(u, v)).squeeze()) + u\n        v = epsilon * (torch.log(nu) - lse(M(u, v).t()).squeeze()) + v\n        err = (u - u1).abs().sum()\n        actual_nits += 1\n        if (err < thresh).data.numpy():\n            break\n    U, V = u, v\n    pi = torch.exp(M(U, V))  \n    cost = torch.sum(pi * C)\n    return cost\n\ndef cost_matrix(x, y, p=2):\n    x_col = x.unsqueeze(1)\n    y_lin = y.unsqueeze(0)\n    c = torch.sum((torch.abs(x_col - y_lin)) ** p, 2)\n    return c   \n\n\nclass wasserstein_loss(nn.Module):\n    def __init__(self, **kwargs):\n        super(wasserstein_loss, self).__init__(**kwargs)\n    def forward(self,x,y):\n        return sinkhorn_loss(x.t(),y.t(),epsilon=1e-5,n=N,niter=1000)\n    \ndef gradients(u, x, order=1):  \n    if order == 1:  \n        return torch.autograd.grad(u, x,grad_outputs=torch.ones_like(u),  create_graph=True,only_inputs=True,)[0]  \n    else:  \n        return gradients(gradients(u, x), x,order=order-1)\n\nclass F_model(nn.Module):\n    def __init__(self):\n        super(F_model, self).__init__()\n        self.hidden_layer1 = torch.nn.Linear(CFG.d, CFG.hidden_size)\n        self.hidden_layer2 = torch.nn.Linear(CFG.hidden_size, CFG.hidden_size)\n        self.output_layer = torch.nn.Linear(CFG.hidden_size, CFG.d)\n        self.tanh = nn.Tanh()\n    def forward(self, x):\n        x = self.hidden_layer1(x)\n        x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.hidden_layer2(x)\n        x = self.hidden_layer2(x)\n        #x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.output_layer(x)\n        return x\n    \nclass G_model(nn.Module):\n    def __init__(self):\n        super(G_model, self).__init__()\n        self.hidden_layer1 = torch.nn.Linear(CFG.d, CFG.hidden_size)\n        self.hidden_layer2 = torch.nn.Linear(CFG.hidden_size, CFG.hidden_size)\n        self.output_layer = torch.nn.Linear(CFG.hidden_size, CFG.d)\n        self.tanh = nn.Tanh()\n    def forward(self, x):\n        x = self.hidden_layer1(x)\n        x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.hidden_layer2(x)\n        x = self.hidden_layer2(x)\n        #x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.output_layer(x)\n        x = torch.diag_embed(x)#.view(x.shape[0],CFG.d,CFG.d)\n        return x\n    \nclass X_0_model(nn.Module):\n    def __init__(self):\n        super(X_0_model, self).__init__()\n        self.hidden_layer1 = torch.nn.Linear(CFG.d, CFG.hidden_size)\n        self.hidden_layer2 = torch.nn.Linear(CFG.hidden_size, CFG.hidden_size)\n        self.output_layer = torch.nn.Linear(CFG.hidden_size, CFG.d)\n        self.tanh = nn.Tanh()\n    def forward(self, x):\n        x = self.hidden_layer1(x)\n        x = self.output_layer(x)\n        return x #torch.mean(x)#.view(CFG.N,1)\n    \n\n    \nclass Pde_model(nn.Module):\n    def __init__(self):\n        super(Pde_model, self).__init__()\n        self.hidden_layer1 = torch.nn.Linear(CFG.d+1, CFG.hidden_size)\n        self.hidden_layer2 = torch.nn.Linear(CFG.hidden_size, CFG.hidden_size)\n        self.output_layer = torch.nn.Linear(CFG.hidden_size, 1)\n        self.tanh = nn.Tanh()\n        self.initialize_weights()\n    def forward(self,x):\n        x = self.hidden_layer1(x)\n        x =  self.tanh(x)\n        x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.output_layer(x)\n        return x\n    \n    def initialize_weights(self):\n        for m in self.modules():\n            if isinstance(m, nn.Linear):\n                torch.nn.init.normal_(m.weight.data, 0, 0.01)\n                m.bias.data.zero_()\n                \n\n    \nclass loss_function(nn.Module):\n    def __init__(self, **kwargs):\n        super(loss_function, self).__init__(**kwargs)\n        \n    def get_1d_wasserstein(self,u_values, v_values):\n        u_sorter = torch.argsort(u_values)\n        v_sorter = torch.argsort(v_values)\n        all_values =torch.cat((u_values, v_values))\n        all_values= torch.sort(all_values)[0]\n        deltas = torch.diff(all_values)\n        u_cdf_indices = torch.searchsorted(u_values[u_sorter],all_values[:-1],right=True)\n        v_cdf_indices = torch.searchsorted(v_values[v_sorter],all_values[:-1],right=True)\n        u_cdf = u_cdf_indices / len(u_values)\n        v_cdf = v_cdf_indices / len(v_values)\n        return torch.sum(torch.multiply(torch.abs(u_cdf - v_cdf), deltas))\n    \n    def get_wasserstein(self,x,y):\n        return sinkhorn_loss(x, y,epsilon=1e-2,n=CFG.N,niter=2000)\n    \n    def get_1d_wasserstein_sum(self,x,y):\n        for i in range(CFG.d):\n            if i == 0 :\n                sums = self.get_1d_wasserstein(x[:,i],y[:,i])\n            else:\n                sums = sums + self.get_1d_wasserstein(x[:,i],y[:,i])\n        return sums\n    \n    def get_out(self,t,yt,w_t_increments,par,model_list):\n        xt = model_list[2](par)\n        xt_l = []\n        for i in range(CFG.M):\n            if i == 0 :\n                xt_l.append(xt)\n                xt1 =xt\n            else:\n                xt1 =xt1+ model_list[0](xt)*CFG.h + (model_list[1](xt) @ w_t_increments[:,i-1,:].unsqueeze(-1)).view(CFG.N,CFG.d)\n                xt_l.append(xt1)\n\n        f= [model_list[0](xt_l[j])for j in range(CFG.M)]\n        l =[model_list[1](xt_l[j])for j in range(CFG.M)]\n        return xt_l,f,l\n\n    def forward(self,t,yt,w_t_increments,par,model_list):\n        xt = model_list[2](par)\n        xt_l = []\n        for i in range(CFG.M):\n            if i == 0 :\n                xt_l.append(xt)\n                xt1 =xt\n            else:\n                xt1 =xt1+ model_list[0](xt)*CFG.h + (model_list[1](xt) @ w_t_increments[:,i-1,:].unsqueeze(-1)).view(CFG.N,CFG.d)\n                xt_l.append(xt1)\n        \n        #xt_l[-1] = \n        wr = self.get_1d_wasserstein_sum(torch.sigmoid(xt_l[-1]),yt)\n        return wr #self.get_wasserstein(xt_l[-1],yt)# + torch.mean(loss_sum)\n    \nclass loss_pde(nn.Module):\n    def __init__(self, **kwargs):\n        super(loss_pde, self).__init__(**kwargs)\n    def forward(self,t,xt_l,f,ll,model_list,flag):\n        T = torch.cat([t[-1].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1)\n        XT = xt_l[-1]\n\n        uTx =torch.cat([T,XT],dim=-1)\n        uT = model_list[3](uTx)\n\n        f1 = torch.cat([get_Hamiltonian(torch.round(torch.sigmoid(XT)[i])) for i in range(CFG.N)],dim=0)\n        #print(f1)\n        #print(uT.view(-1))\n        if flag== 'w':\n            loss1 = (uT.view(-1) - torch.exp(-CFG.beta/2*f1) )**2\n        if flag== 'v':\n            loss1 = (uT.view(-1) - torch.exp(CFG.beta/2*f1) )**2\n        #np.exp(-gap/2*chain.get_Hamiltonian(x))\n        loss_sum =0\n        for s in range(1,CFG.M-1):#range(CFG.M):\n            xi= xt_l[s]\n            ti = torch.cat([t[s].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1)\n            x =  torch.cat([ti,xi],dim=-1)\n            u = model_list[3](x)\n            d1 = gradients(u,x)\n            ut = d1[:,0]\n            a = torch.sum(f[s] * d1[:,1:],dim=1)\n            d3=torch.sum(torch.cat([torch.autograd.grad(d1[:,i], x, torch.ones_like(d1[:,i]), create_graph=True)[0][:,i].view(CFG.N,1) for i in range(1,CFG.d+1)],dim = 1),dim=1)\n            b= 1/2*d3\n\n            loss_sum = (ut + a+ b )**2\n        return torch.mean(loss_sum)+1*torch.mean(loss1)\n        \ndef get_optimizer(model):\n    if CFG.optim == 'SGD':\n        optimizer = torch.optim.SGD(model.parameters(), lr=CFG.lr)\n    if CFG.optim == 'Adam':\n        optimizer = torch.optim.Adam(model.parameters(), lr=CFG.lr, amsgrad = False)\n    return optimizer\n\ndef get_wt_nn(CFG,seed= 1):\n    n,h,N = CFG.M,CFG.h,CFG.N\n    ts = np.array([i*h for i in range(n)])\n    w_t_increments = np.array([deltaW(N=n-1, m=1, h=h, generator=None,seed=int(i+seed)) for i in range(N)])\n    w_t = np.array([np.insert(np.cumsum(i.T),0,np.zeros(1)) for i in w_t_increments])\n    return w_t,ts,w_t_increments.reshape(CFG.N,CFG.M-1)\n    \n    \ndef get_predict_sample(CFG,model_list,flag):\n    par = np.array([1 for i in range(CFG.N*CFG.d)])\n    par = torch.tensor(par.astype(np.float32)).reshape(CFG.N,CFG.d).requires_grad_(True).cuda()\n    w_t,ts,w_t_increments = get_wt(CFG,seed=100000)\n    w_t_increments = torch.tensor(w_t_increments.astype(np.float32)).requires_grad_(False).cuda()\n    t = torch.tensor(ts.astype(np.float32)).reshape(CFG.M,1).requires_grad_(True).cuda()\n    t0 = torch.cat([t[0].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1).cuda()\n    \n    xt = model_list[2](par)\n    xt_l = []\n    for i in range(CFG.M):\n        if i == 0 :\n            xt_l.append(xt)\n            xt1 =xt\n        else:\n            xt1 =xt1+ model_list[0](xt)*CFG.h + (model_list[1](xt) @ w_t_increments[:,i-1,:].unsqueeze(-1)).view(CFG.N,CFG.d)\n            xt_l.append(xt1)\n    if flag =='w':\n        out = torch.mean(torch.exp(-CFG.beta/2*torch.round(torch.sigmoid(xt_l[-1]))))\n    if flag =='v':\n        out = torch.mean(torch.exp(CFG.beta/2*torch.round(torch.sigmoid(xt_l[-1]))))\n    return out\n\n\ndef get_nn_solution(CFG,yt,flag):\n    model_list =[F_model().cuda() ,G_model().cuda(), X_0_model().cuda(),Pde_model().cuda()]\n    par = np.array([1 for i in range(CFG.N*CFG.d)])\n    par = torch.tensor(par.astype(np.float32)).reshape(CFG.N,CFG.d).requires_grad_(True).cuda()\n    yt = torch.tensor(yt.astype(np.float32)).requires_grad_(False).cuda()\n    loss_ito = loss_function()\n    loss_pdes = loss_pde()\n    optimizer_list = [get_optimizer(model_list[i]) for i in range(3)]+[torch.optim.Adam(model_list[3].parameters(), lr=CFG.lr*10, amsgrad = False)]\n    result= []\n\n    loss_ito_log = []\n\n    w_t,ts,w_t_increments = get_wt(CFG,seed=1)\n    w_t_increments = torch.tensor(w_t_increments.astype(np.float32)).requires_grad_(False).cuda()\n    t = torch.tensor(ts.astype(np.float32)).reshape(CFG.M,1).requires_grad_(True).cuda()\n    t0 = torch.cat([t[0].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1).cuda()\n    print('stage 1 begin')\n    b1 = time.time()\n    for epoch in range(CFG.epoch_stage_1):\n        for optimizer in optimizer_list[0:3]:\n            optimizer.zero_grad()\n\n        loss_1 = loss_ito(t,yt,w_t_increments,par,model_list)\n        loss_1.backward()\n        for optimizer in optimizer_list[0:3]:\n            optimizer.step()\n        if epoch % CFG.print_step== 0: \n            print('Epoch:{}/{}\\t Ito_loss={:.4f}\\t '.format(CFG.epoch_stage_1,epoch ,loss_1,))\n\n    e1 = time.time()\n    time1 =e1 - b1\n        \n    xt_l,f,l = loss_ito.get_out(t,yt,w_t_increments,par,model_list)\n    \n    xt_l = [torch.tensor(i.detach().cpu().numpy().astype(np.float32)).requires_grad_(True).cuda() for i in xt_l]\n    f = [torch.tensor(i.detach().cpu().numpy().astype(np.float32)).requires_grad_(False).cuda() for i in f]\n    l = [torch.tensor(i.detach().cpu().numpy().astype(np.float32)).requires_grad_(False).cuda() for i in l]\n    \n\n    ll = [l[s] @ torch.transpose(l[s], 2, 1) for s in range(CFG.M)]\n    \n    print('stage 2 begin')\n    b2 = time.time()\n    EX_LSIT=[]\n    for epoch in range(CFG.epoch_stage_2):\n        optimizer_list[-1].zero_grad()\n        loss_2 = loss_pdes(t,xt_l,f,ll,model_list,flag)\n        loss_2.backward()\n        optimizer_list[-1].step()\n        if epoch % 1== 0:\n            x =  torch.cat([t0,model_list[2](par)],dim=-1)\n            EX= model_list[3](x)\n            if epoch in [i for i in range(CFG.epoch_stage_2 - 10, CFG.epoch_stage_2)]:\n                EX_LSIT.append(EX[0].item())\n            print('Epoch:{}/{}\\t PDE_loss={:.4f}\\t EX={:.4f}\\t'.format(CFG.epoch_stage_2,epoch ,loss_2,EX[0].item()))\n    e2 = time.time()\n    time2 =e2 - b2\n    \n    return result,model_list,np.mean(EX_LSIT),time1,time2 #,[,loss_ito_log,loss_sum_log]\n  ","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:28:11.379412Z","iopub.execute_input":"2023-08-07T06:28:11.380236Z","iopub.status.idle":"2023-08-07T06:30:25.076821Z","shell.execute_reply.started":"2023-08-07T06:28:11.380195Z","shell.execute_reply":"2023-08-07T06:30:25.075726Z"},"trusted":true},"execution_count":35,"outputs":[{"name":"stdout","text":"w_true 0.8599499\nv_true 1.1563472\nz_true 1.344668\nwc1 0.8638932555787735\nvc1 1.1580353849876324\nzc1 1.3404843451541888\n","output_type":"stream"}]},{"cell_type":"code","source":"w_true = 0.8641533\nv_true = 1.1563625\nz_true = 1.338233","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:27:40.326898Z","iopub.status.idle":"2023-08-07T06:27:40.327246Z","shell.execute_reply.started":"2023-08-07T06:27:40.327078Z","shell.execute_reply":"2023-08-07T06:27:40.327095Z"},"trusted":true},"execution_count":null,"outputs":[]},{"cell_type":"code","source":"result,model_list,EX1,time1a,time2a=get_nn_solution(CFG,cs1,'w')\npredict1 = get_predict_sample(CFG,model_list,'w')\n\n\nresult,model_list,EX2,time1b,time2b=get_nn_solution(CFG,cs2,'v')\npredict2 = get_predict_sample(CFG,model_list,'v')\n","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:30:50.216964Z","iopub.execute_input":"2023-08-07T06:30:50.217334Z","iopub.status.idle":"2023-08-07T06:33:09.426475Z","shell.execute_reply.started":"2023-08-07T06:30:50.217303Z","shell.execute_reply":"2023-08-07T06:33:09.424645Z"},"trusted":true},"execution_count":36,"outputs":[{"name":"stdout","text":"stage 1 begin\nEpoch:700/0\t Ito_loss=7.9668\t \nEpoch:700/100\t Ito_loss=3.4792\t \nEpoch:700/200\t Ito_loss=2.4887\t \nEpoch:700/300\t Ito_loss=2.0346\t \nEpoch:700/400\t Ito_loss=1.7593\t \nEpoch:700/500\t Ito_loss=1.5694\t \nEpoch:700/600\t Ito_loss=1.4280\t \nstage 2 begin\nEpoch:50/0\t PDE_loss=0.7508\t EX=0.0401\t\nEpoch:50/1\t PDE_loss=0.6985\t EX=0.2079\t\nEpoch:50/2\t PDE_loss=0.7923\t EX=0.2101\t\nEpoch:50/3\t PDE_loss=0.7153\t EX=0.1007\t\nEpoch:50/4\t PDE_loss=0.6115\t EX=0.0700\t\nEpoch:50/5\t PDE_loss=0.6353\t EX=0.0821\t\nEpoch:50/6\t PDE_loss=0.6197\t EX=0.1110\t\nEpoch:50/7\t PDE_loss=0.6064\t EX=0.1365\t\nEpoch:50/8\t PDE_loss=0.5663\t EX=0.1584\t\nEpoch:50/9\t PDE_loss=0.5189\t EX=0.2138\t\nEpoch:50/10\t PDE_loss=0.4688\t EX=0.3369\t\nEpoch:50/11\t PDE_loss=0.4195\t EX=0.4031\t\nEpoch:50/12\t PDE_loss=0.3369\t EX=0.4984\t\nEpoch:50/13\t PDE_loss=0.2703\t EX=0.6502\t\nEpoch:50/14\t PDE_loss=0.2685\t EX=0.5969\t\nEpoch:50/15\t PDE_loss=0.3820\t EX=0.7014\t\nEpoch:50/16\t PDE_loss=0.0787\t EX=0.7788\t\nEpoch:50/17\t PDE_loss=0.2262\t EX=0.7314\t\nEpoch:50/18\t PDE_loss=0.0339\t EX=0.7338\t\nEpoch:50/19\t PDE_loss=0.1114\t EX=0.7674\t\nEpoch:50/20\t PDE_loss=0.0807\t EX=0.7960\t\nEpoch:50/21\t PDE_loss=0.0149\t EX=0.8438\t\nEpoch:50/22\t PDE_loss=0.0304\t EX=0.9152\t\nEpoch:50/23\t PDE_loss=0.0340\t EX=0.9790\t\nEpoch:50/24\t PDE_loss=0.0183\t EX=0.9978\t\nEpoch:50/25\t PDE_loss=0.0208\t EX=0.9554\t\nEpoch:50/26\t PDE_loss=0.0255\t EX=0.8741\t\nEpoch:50/27\t PDE_loss=0.0135\t EX=0.8015\t\nEpoch:50/28\t PDE_loss=0.0100\t EX=0.7758\t\nEpoch:50/29\t PDE_loss=0.0214\t EX=0.8003\t\nEpoch:50/30\t PDE_loss=0.0205\t EX=0.8506\t\nEpoch:50/31\t PDE_loss=0.0061\t EX=0.8985\t\nEpoch:50/32\t PDE_loss=0.0033\t EX=0.9296\t\nEpoch:50/33\t PDE_loss=0.0118\t EX=0.9422\t\nEpoch:50/34\t PDE_loss=0.0134\t EX=0.9310\t\nEpoch:50/35\t PDE_loss=0.0070\t EX=0.8891\t\nEpoch:50/36\t PDE_loss=0.0025\t EX=0.8321\t\nEpoch:50/37\t PDE_loss=0.0035\t EX=0.7992\t\nEpoch:50/38\t PDE_loss=0.0067\t EX=0.8104\t\nEpoch:50/39\t PDE_loss=0.0063\t EX=0.8393\t\nEpoch:50/40\t PDE_loss=0.0044\t EX=0.8529\t\nEpoch:50/41\t PDE_loss=0.0022\t EX=0.8613\t\nEpoch:50/42\t PDE_loss=0.0024\t EX=0.8886\t\nEpoch:50/43\t PDE_loss=0.0033\t EX=0.9094\t\nEpoch:50/44\t PDE_loss=0.0044\t EX=0.8918\t\nEpoch:50/45\t PDE_loss=0.0036\t EX=0.8679\t\nEpoch:50/46\t PDE_loss=0.0029\t EX=0.8664\t\nEpoch:50/47\t PDE_loss=0.0020\t EX=0.8570\t\nEpoch:50/48\t PDE_loss=0.0019\t EX=0.8338\t\nEpoch:50/49\t PDE_loss=0.0020\t EX=0.8349\t\nstage 1 begin\nEpoch:700/0\t Ito_loss=7.9682\t \nEpoch:700/100\t Ito_loss=3.5142\t \nEpoch:700/200\t Ito_loss=2.5001\t \nEpoch:700/300\t Ito_loss=2.0402\t \nEpoch:700/400\t Ito_loss=1.7620\t \nEpoch:700/500\t Ito_loss=1.5704\t \nEpoch:700/600\t Ito_loss=1.4279\t \nstage 2 begin\nEpoch:50/0\t PDE_loss=1.3321\t EX=0.0577\t\nEpoch:50/1\t PDE_loss=1.2478\t EX=0.3710\t\nEpoch:50/2\t PDE_loss=1.3484\t EX=0.1727\t\nEpoch:50/3\t PDE_loss=1.2001\t EX=0.1401\t\nEpoch:50/4\t PDE_loss=1.0926\t EX=0.1518\t\nEpoch:50/5\t PDE_loss=1.0750\t EX=0.1908\t\nEpoch:50/6\t PDE_loss=1.0440\t EX=0.2608\t\nEpoch:50/7\t PDE_loss=0.9633\t EX=0.3517\t\nEpoch:50/8\t PDE_loss=0.8582\t EX=0.4477\t\nEpoch:50/9\t PDE_loss=0.7384\t EX=0.5463\t\nEpoch:50/10\t PDE_loss=0.5884\t EX=0.6560\t\nEpoch:50/11\t PDE_loss=0.4093\t EX=0.7810\t\nEpoch:50/12\t PDE_loss=0.2190\t EX=0.9306\t\nEpoch:50/13\t PDE_loss=0.1239\t EX=1.2766\t\nEpoch:50/14\t PDE_loss=0.0796\t EX=1.5617\t\nEpoch:50/15\t PDE_loss=0.1914\t EX=1.6922\t\nEpoch:50/16\t PDE_loss=0.2845\t EX=1.4345\t\nEpoch:50/17\t PDE_loss=0.1508\t EX=1.2144\t\nEpoch:50/18\t PDE_loss=0.0435\t EX=1.0350\t\nEpoch:50/19\t PDE_loss=0.0518\t EX=0.9110\t\nEpoch:50/20\t PDE_loss=0.1033\t EX=0.8693\t\nEpoch:50/21\t PDE_loss=0.1244\t EX=0.9160\t\nEpoch:50/22\t PDE_loss=0.0937\t EX=1.0277\t\nEpoch:50/23\t PDE_loss=0.0635\t EX=1.1593\t\nEpoch:50/24\t PDE_loss=0.0445\t EX=1.2629\t\nEpoch:50/25\t PDE_loss=0.0375\t EX=1.3047\t\nEpoch:50/26\t PDE_loss=0.0268\t EX=1.2791\t\nEpoch:50/27\t PDE_loss=0.0243\t EX=1.2129\t\nEpoch:50/28\t PDE_loss=0.0260\t EX=1.1597\t\nEpoch:50/29\t PDE_loss=0.0301\t EX=1.1487\t\nEpoch:50/30\t PDE_loss=0.0187\t EX=1.1601\t\nEpoch:50/31\t PDE_loss=0.0156\t EX=1.1602\t\nEpoch:50/32\t PDE_loss=0.0128\t EX=1.1366\t\nEpoch:50/33\t PDE_loss=0.0099\t EX=1.1068\t\nEpoch:50/34\t PDE_loss=0.0105\t EX=1.1014\t\nEpoch:50/35\t PDE_loss=0.0159\t EX=1.1311\t\nEpoch:50/36\t PDE_loss=0.0115\t EX=1.1722\t\nEpoch:50/37\t PDE_loss=0.0098\t EX=1.1916\t\nEpoch:50/38\t PDE_loss=0.0073\t EX=1.1827\t\nEpoch:50/39\t PDE_loss=0.0045\t EX=1.1659\t\nEpoch:50/40\t PDE_loss=0.0049\t EX=1.1608\t\nEpoch:50/41\t PDE_loss=0.0046\t EX=1.1678\t\nEpoch:50/42\t PDE_loss=0.0046\t EX=1.1717\t\nEpoch:50/43\t PDE_loss=0.0059\t EX=1.1611\t\nEpoch:50/44\t PDE_loss=0.0048\t EX=1.1443\t\nEpoch:50/45\t PDE_loss=0.0039\t EX=1.1406\t\nEpoch:50/46\t PDE_loss=0.0041\t EX=1.1532\t\nEpoch:50/47\t PDE_loss=0.0022\t EX=1.1642\t\nEpoch:50/48\t PDE_loss=0.0024\t EX=1.1596\t\nEpoch:50/49\t PDE_loss=0.0020\t EX=1.1474\t\n","output_type":"stream"}]},{"cell_type":"code","source":"df = pd.DataFrame(columns=['Method','n','wi','vi','q','true_wi','true_vi','true_q'\n                          ,'error_wi','error_vi','error_q','wi sample ponints','vi sample ponints','wi time','vi time']\n                 )","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:33:15.192158Z","iopub.execute_input":"2023-08-07T06:33:15.192551Z","iopub.status.idle":"2023-08-07T06:33:15.199904Z","shell.execute_reply.started":"2023-08-07T06:33:15.192518Z","shell.execute_reply":"2023-08-07T06:33:15.198818Z"},"trusted":true},"execution_count":37,"outputs":[]},{"cell_type":"code","source":"m1 = ['MCMC-R',CFG.n,np.round(predict1.item(),7),np.round(predict2.item(),7),\n      np.round(predict2.item()/predict1.item(),7)\n       ,w_true,v_true,z_true,0,0,0,CFG.N,CFG.N,np.round(time1a,3),np.round(time1b,3)\n      ]\n\nm2 = ['MCMC-T',CFG.n,np.round(EX1,7),np.round(EX2,7),np.round(EX2/EX1,7)\n       ,w_true,v_true,z_true,0,0,0,CFG.N*CFG.M,CFG.N,np.round(time2a,3),np.round(time2b,3)\n     ]","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:33:15.388898Z","iopub.execute_input":"2023-08-07T06:33:15.389229Z","iopub.status.idle":"2023-08-07T06:33:15.397797Z","shell.execute_reply.started":"2023-08-07T06:33:15.389200Z","shell.execute_reply":"2023-08-07T06:33:15.396817Z"},"trusted":true},"execution_count":38,"outputs":[]},{"cell_type":"code","source":"df.loc[0] = m1\ndf.loc[1] = m2","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:33:15.869651Z","iopub.execute_input":"2023-08-07T06:33:15.870629Z","iopub.status.idle":"2023-08-07T06:33:15.881786Z","shell.execute_reply.started":"2023-08-07T06:33:15.870590Z","shell.execute_reply":"2023-08-07T06:33:15.880649Z"},"trusted":true},"execution_count":39,"outputs":[]},{"cell_type":"code","source":"df['error_wi'] = (df['true_wi'] - df['wi'])**2\ndf['error_vi'] = (df['true_vi'] - df['vi'])**2\ndf['error_q'] = (df['true_q'] - df['q'])**2","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:33:16.330680Z","iopub.execute_input":"2023-08-07T06:33:16.331794Z","iopub.status.idle":"2023-08-07T06:33:16.339186Z","shell.execute_reply.started":"2023-08-07T06:33:16.331732Z","shell.execute_reply":"2023-08-07T06:33:16.338072Z"},"trusted":true},"execution_count":40,"outputs":[]},{"cell_type":"code","source":"df","metadata":{"execution":{"iopub.status.busy":"2023-08-07T06:33:18.911895Z","iopub.execute_input":"2023-08-07T06:33:18.912263Z","iopub.status.idle":"2023-08-07T06:33:18.930805Z","shell.execute_reply.started":"2023-08-07T06:33:18.912232Z","shell.execute_reply":"2023-08-07T06:33:18.929551Z"},"trusted":true},"execution_count":41,"outputs":[{"execution_count":41,"output_type":"execute_result","data":{"text/plain":"   Method  n        wi        vi         q  true_wi   true_vi    true_q  \\\n0  MCMC-R  4  0.995174  1.005068  1.009942  0.85995  1.156347  1.344668   \n1  MCMC-T  4  0.866409  1.157078  1.335487  0.85995  1.156347  1.344668   \n\n   error_wi      error_vi   error_q  wi sample ponints  vi sample ponints  \\\n0  0.018286  2.288543e-02  0.112042                500                500   \n1  0.000042  5.345072e-07  0.000084               2000                500   \n\n   wi time  vi time  \n0   10.762   10.573  \n1   59.597   58.064  ","text/html":"<div>\n<style scoped>\n    .dataframe tbody tr th:only-of-type {\n        vertical-align: middle;\n    }\n\n    .dataframe tbody tr th {\n        vertical-align: top;\n    }\n\n    .dataframe thead th {\n        text-align: right;\n    }\n</style>\n<table border=\"1\" class=\"dataframe\">\n  <thead>\n    <tr style=\"text-align: right;\">\n      <th></th>\n      <th>Method</th>\n      <th>n</th>\n      <th>wi</th>\n      <th>vi</th>\n      <th>q</th>\n      <th>true_wi</th>\n      <th>true_vi</th>\n      <th>true_q</th>\n      <th>error_wi</th>\n      <th>error_vi</th>\n      <th>error_q</th>\n      <th>wi sample ponints</th>\n      <th>vi sample ponints</th>\n      <th>wi time</th>\n      <th>vi time</th>\n    </tr>\n  </thead>\n  <tbody>\n    <tr>\n      <th>0</th>\n      <td>MCMC-R</td>\n      <td>4</td>\n      <td>0.995174</td>\n      <td>1.005068</td>\n      <td>1.009942</td>\n      <td>0.85995</td>\n      <td>1.156347</td>\n      <td>1.344668</td>\n      <td>0.018286</td>\n      <td>2.288543e-02</td>\n      <td>0.112042</td>\n      <td>500</td>\n      <td>500</td>\n      <td>10.762</td>\n      <td>10.573</td>\n    </tr>\n    <tr>\n      <th>1</th>\n      <td>MCMC-T</td>\n      <td>4</td>\n      <td>0.866409</td>\n      <td>1.157078</td>\n      <td>1.335487</td>\n      <td>0.85995</td>\n      <td>1.156347</td>\n      <td>1.344668</td>\n      <td>0.000042</td>\n      <td>5.345072e-07</td>\n      <td>0.000084</td>\n      <td>2000</td>\n      <td>500</td>\n      <td>59.597</td>\n      <td>58.064</td>\n    </tr>\n  </tbody>\n</table>\n</div>"},"metadata":{}}]},{"cell_type":"code","source":"","metadata":{},"execution_count":null,"outputs":[]}]}