{"metadata":{"kernelspec":{"language":"python","display_name":"Python 3","name":"python3"},"language_info":{"name":"python","version":"3.7.12","mimetype":"text/x-python","codemirror_mode":{"name":"ipython","version":3},"pygments_lexer":"ipython3","nbconvert_exporter":"python","file_extension":".py"}},"nbformat_minor":4,"nbformat":4,"cells":[{"cell_type":"code","source":"import numpy as np \n#import sdeint\nfrom sklearn.metrics import mean_squared_error\nimport time\n\nimport statsmodels.api as sm\nfrom torch.autograd import Variable\nimport seaborn as sns\nimport torch\n\nimport matplotlib.pyplot as plt\n\n\nimport torch\nfrom torch import nn","metadata":{"_uuid":"8f2839f25d086af736a60e9eeb907d3b93b6e0e5","_cell_guid":"b1076dfc-b9ad-4769-8c92-a6c4dae69d19","execution":{"iopub.status.busy":"2023-05-21T07:37:40.843899Z","iopub.execute_input":"2023-05-21T07:37:40.844317Z","iopub.status.idle":"2023-05-21T07:37:40.850404Z","shell.execute_reply.started":"2023-05-21T07:37:40.844280Z","shell.execute_reply":"2023-05-21T07:37:40.849391Z"},"trusted":true},"execution_count":66,"outputs":[]},{"cell_type":"code","source":"# GPU version ","metadata":{},"execution_count":null,"outputs":[]},{"cell_type":"code","source":"class CFG:\n   \n    d = 20\n\n    a = 0.2\n    #b= 0.2\n    \n    x0 = 0\n    \n    M= 101\n    h = 0.1\n    \n    \n    N = 100\n    \n    \n    epoch=401\n    optim = ['SGD','Adam'][1]\n    lr = 0.001\n    seed = 44\n    hidden_size =526#108\n    \n    \n    \n    lambda1 =1\n    lambda2 =1\n    print_step = 100\n    gap = 20\n","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:37:41.298534Z","iopub.execute_input":"2023-05-21T07:37:41.299594Z","iopub.status.idle":"2023-05-21T07:37:41.306590Z","shell.execute_reply.started":"2023-05-21T07:37:41.299536Z","shell.execute_reply":"2023-05-21T07:37:41.305585Z"},"trusted":true},"execution_count":67,"outputs":[]},{"cell_type":"code","source":"def seed_torch(seed):\n    torch.manual_seed(seed)\n    torch.cuda.manual_seed(seed)\n    torch.backends.cudnn.deterministic = True\nseed_torch(seed = CFG.seed)\n\ndef deltaW(N, m, h, seed,generator=None):\n    if generator is None:\n        generator = np.random.default_rng(seed=seed)\n    return generator.normal(0.0, np.sqrt(h), (N, m))\n\ndef get_wt(CFG,seed=1):\n    n,h,N,d = CFG.M,CFG.h,CFG.N,CFG.d\n    ts = np.array([i*h for i in range(n)])\n    w_t_increments = np.array([deltaW(N=n-1, m=d, h=h, generator=None,seed=int(i+seed*100)) for i in range(N)])\n    w_t = np.array([np.insert(np.cumsum(i.T),0,np.zeros(1)) for i in w_t_increments])\n    return w_t,ts,w_t_increments","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:37:41.755261Z","iopub.execute_input":"2023-05-21T07:37:41.755640Z","iopub.status.idle":"2023-05-21T07:37:41.765757Z","shell.execute_reply.started":"2023-05-21T07:37:41.755606Z","shell.execute_reply":"2023-05-21T07:37:41.764578Z"},"trusted":true},"execution_count":68,"outputs":[]},{"cell_type":"code","source":"def p(x):\n    cov_matrix = torch.eye(CFG.d).expand(x.size(0), -1, -1) # Expand cov_matrix to match the shape of x\n    mean_vector = torch.ones(CFG.d)* 0.2# *torch.linspace(-5, 5, 10)#* 0.2 \n    exponent = -0.5 * torch.bmm(torch.bmm((x - mean_vector).unsqueeze(1), torch.inverse(cov_matrix)), (x - mean_vector).unsqueeze(-1))\n    # Compute normalization factor for each input in x\n    #normalization = (2 * torch.tensor([[3.14159265358979323846]])) ** (-0.5) * (torch.det(cov_matrix).unsqueeze(-1)) ** (-0.5)\n   \n    result = torch.exp(exponent.squeeze(-1).squeeze(-1))#normalization * torch.exp(exponent.squeeze(-1).squeeze(-1))\n    return result\n\ndef gradients(u, x, order=1):  \n    if order == 1:  \n        return torch.autograd.grad(u, x,grad_outputs=torch.ones_like(u),  create_graph=True,only_inputs=True,)[0]  \n    else:  \n        return gradients(gradients(u, x), x,order=order-1)\n\n    \ndef f(x):\n    x=x.requires_grad_(True)\n    y = (1/2)*gradients(torch.log(p(x)),x)\n    return y.detach()\n\n\ndef getFL(see):\n    w_t,ts,w_t_increments = get_wt(CFG,seed=see)\n    w_t_increments = torch.from_numpy(w_t_increments.astype(np.float32))\n    F=[]\n    L=[]\n    xt = np.zeros((CFG.M,CFG.N, CFG.d))\n    xt[0] = CFG.x0   \n    xt = torch.from_numpy(xt.astype(np.float32))\n    for i in range(CFG.M-1):\n        xt[i+1] = xt[i] + f(xt[i])*CFG.h + (torch.eye(CFG.d)@ w_t_increments[:,i,:].unsqueeze(-1)).view(CFG.N,CFG.d)\n        F.append(f(xt[i]))\n        L.append(torch.eye(CFG.d))\n    F.append(f(xt[-1]))\n    L.append(torch.eye(CFG.d))\n    \n    \n    F = np.array(F)\n    L = np.array(L)\n    return xt,F,L\n\n","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:37:42.127843Z","iopub.execute_input":"2023-05-21T07:37:42.128666Z","iopub.status.idle":"2023-05-21T07:37:42.143544Z","shell.execute_reply.started":"2023-05-21T07:37:42.128623Z","shell.execute_reply":"2023-05-21T07:37:42.142601Z"},"trusted":true},"execution_count":69,"outputs":[]},{"cell_type":"code","source":"class Pde_model(nn.Module):\n    def __init__(self):\n        super(Pde_model, self).__init__()\n        self.hidden_layer1 = torch.nn.Linear(CFG.d+1, CFG.hidden_size)\n        self.hidden_layer2 = torch.nn.Linear(CFG.hidden_size, CFG.hidden_size)\n        self.output_layer = torch.nn.Linear(CFG.hidden_size, 1)\n        self.tanh = nn.Tanh()\n    def forward(self, x):\n\n        x = self.hidden_layer1(x)\n        x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.hidden_layer2(x)\n        x = self.hidden_layer2(x)\n        x =  self.tanh(x)\n        x = self.output_layer(x)\n        return x\n\nclass loss_pde(nn.Module):\n    def __init__(self, **kwargs):\n        super(loss_pde, self).__init__(**kwargs)\n    def forward(self,t,xt_l,f,ll,model,epoch):\n        T = torch.cat([t[-1].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1).cuda()\n        loss1 = 0\n        for k in [-1]:\n            XT = xt_l[k]\n            uTx =torch.cat([T,XT],dim=-1)\n            uT = model(uTx).view(-1)\n            loss1 = loss1+(uT - torch.sum(XT,dim=-1))**2\n            if epoch %10 == 0:\n                pass\n        loss_sum =0\n        for s in range(1,len(xt_l)-1):\n            xi= xt_l[s]\n            ti = torch.cat([t[s].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1)\n            x =  torch.cat([ti,xi],dim=-1)\n            \n            u = model(x)\n            d1 = gradients(u,x)\n            ut = d1[:,0]\n            a = torch.sum(f[s] * d1[:,1:],dim=1)\n\n            d3=torch.sum(torch.cat([torch.autograd.grad(d1[:,i], x, torch.ones_like(d1[:,i]), create_graph=True)[0][:,i].view(CFG.N,1) for i in range(1,CFG.d+1)],dim = 1),dim=1)\n            b= 1/2*d3\n\n            loss_sum = loss_sum + (ut + a+ b)**2\n        \n        if epoch %CFG.print_step == 0:\n\n            print('loss bonund 1:',torch.mean(loss1).item())\n\n            print('loss pde :',torch.mean(loss_sum).item())\n        \n        #torch.mean(loss_sum)+\n        return torch.mean(loss_sum)+1*torch.mean(loss1)#torch.mean(loss_sum)+1*torch.mean(loss1)#+ (torch.mean(loss1)+torch.mean(loss2))*0.0001\ndef get_optimizer(model):\n    if CFG.optim == 'SGD':\n        optimizer = torch.optim.SGD(model.parameters(), lr=CFG.lr)\n    if CFG.optim == 'Adam':\n        optimizer = torch.optim.AdamW(model.parameters(), lr=CFG.lr, amsgrad = False)\n    return optimizer\n\n","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:37:42.585542Z","iopub.execute_input":"2023-05-21T07:37:42.586250Z","iopub.status.idle":"2023-05-21T07:37:42.605417Z","shell.execute_reply.started":"2023-05-21T07:37:42.586213Z","shell.execute_reply":"2023-05-21T07:37:42.604286Z"},"trusted":true},"execution_count":70,"outputs":[]},{"cell_type":"code","source":"def get_nn_solution(CFG,xt,F,L):\n    w_t,ts,w_t_increments = get_wt(CFG,seed=1)\n\n    model = Pde_model().cuda()\n    \n    loss_pdes = loss_pde().cuda()\n    optimizer_list = [get_optimizer(model)]\n    result= []\n\n    ts = ts[::CFG.gap]\n    t = torch.tensor(ts.astype(np.float32)).reshape(len(ts),1).requires_grad_(True).cuda()\n    \n    t0 = torch.cat([t[0].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1).cuda()\n    \n    X0 = torch.zeros(CFG.N, CFG.d)\n    X0 = torch.fill(X0,CFG.x0).cuda()\n\n    \n    xt_l = [torch.tensor(i.detach().cpu().numpy()).requires_grad_(True).cuda() for i in xt][::CFG.gap]\n    f = [torch.tensor(i.detach().cpu().numpy()).requires_grad_(False).cuda() for i in F][::CFG.gap]\n    l = [torch.tensor(i.detach().cpu().numpy()).requires_grad_(False) for i in L][::CFG.gap]\n\n\n    current = 0 \n\n    print('Ex',torch.mean(torch.sum(xt_l[-1],dim=-1)))\n    begin = time.time()\n    for epoch in range(CFG.epoch*1-100):\n        optimizer_list[0].zero_grad()\n        loss_2 = loss_pdes(t,xt_l,f,l,model,epoch)\n        loss_2.backward()\n        optimizer_list[0].step()\n\n        if epoch % CFG.print_step== 0:\n            x =  torch.cat([t0,X0],dim=-1)\n            EX= model(x)\n            print('Epoch:{}/{}\\t PDE_loss={:.4f}\\t EX={:.4f}\\t'.format(CFG.epoch,epoch ,loss_2,EX[0].item()))\n\n    end = time.time()\n    tiems =end - begin\n    print(tiems)\n    \n    ut = [model(torch.cat([torch.cat([t[i].view(-1) for K in range(CFG.N)],dim = 0).view(CFG.N,1),xt_l[i]],dim=-1)).detach().cpu().numpy() for i in range(len(xt_l))]\n    \n    \n    return EX[0].item(),ut,t.detach().cpu().numpy().reshape(-1),xt,model ","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:37:42.970654Z","iopub.execute_input":"2023-05-21T07:37:42.971015Z","iopub.status.idle":"2023-05-21T07:37:42.987593Z","shell.execute_reply.started":"2023-05-21T07:37:42.970985Z","shell.execute_reply":"2023-05-21T07:37:42.986608Z"},"trusted":true},"execution_count":71,"outputs":[]},{"cell_type":"code","source":"mcmc = []\ngets = []\nfor i in range(30):\n    print(i)\n    see =i\n    xt,F,L = getFL(see)\n    EX,ut,t,xt_l,model =get_nn_solution(CFG,xt,F,L)\n    mcmc.append(torch.mean(torch.sum(xt[-1],dim=-1)).item())\n    gets.append(EX)\n    print(torch.mean(torch.sum(xt[-1],dim=-1)).item())\n    print(EX)\n    if np.abs(torch.mean(torch.sum(xt[-1],dim=-1)).item()- 4) > np.abs(EX-4):\n        print('A')\n    else:\n        print('B')","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:37:44.325177Z","iopub.execute_input":"2023-05-21T07:37:44.325543Z","iopub.status.idle":"2023-05-21T07:38:35.482062Z","shell.execute_reply.started":"2023-05-21T07:37:44.325510Z","shell.execute_reply":"2023-05-21T07:38:35.479543Z"},"trusted":true},"execution_count":72,"outputs":[{"name":"stdout","text":"0\n","output_type":"stream"},{"name":"stderr","text":"/tmp/ipykernel_31/3115571622.py:40: FutureWarning: The input object of type 'Tensor' is an array-like implementing one of the corresponding protocols (`__array__`, `__array_interface__` or `__array_struct__`); but not a sequence (or 0-D). In the future, this object will be coerced as if it was first converted using `np.array(obj)`. To retain the old behaviour, you have to either modify the type 'Tensor', or assign to an empty array created with `np.empty(correct_shape, dtype=object)`.\n  F = np.array(F)\n/tmp/ipykernel_31/3115571622.py:40: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n  F = np.array(F)\n/tmp/ipykernel_31/3115571622.py:41: FutureWarning: The input object of type 'Tensor' is an array-like implementing one of the corresponding protocols (`__array__`, `__array_interface__` or `__array_struct__`); but not a sequence (or 0-D). In the future, this object will be coerced as if it was first converted using `np.array(obj)`. To retain the old behaviour, you have to either modify the type 'Tensor', or assign to an empty array created with `np.empty(correct_shape, dtype=object)`.\n  L = np.array(L)\n/tmp/ipykernel_31/3115571622.py:41: VisibleDeprecationWarning: Creating an ndarray from ragged nested sequences (which is a list-or-tuple of lists-or-tuples-or ndarrays with different lengths or shapes) is deprecated. If you meant to do this, you must specify 'dtype=object' when creating the ndarray.\n  L = np.array(L)\n","output_type":"stream"},{"name":"stdout","text":"Ex tensor(3.8624, device='cuda:0', grad_fn=<MeanBackward0>)\nloss bonund 1: 35.76057052612305\nloss pde : 0.0033531971275806427\nEpoch:401/0\t PDE_loss=35.7639\t EX=0.1158\t\nloss bonund 1: 0.1518387347459793\nloss pde : 0.18162287771701813\nEpoch:401/100\t PDE_loss=0.3335\t EX=4.5168\t\nloss bonund 1: 0.0033773600589483976\nloss pde : 0.0003956859582103789\nEpoch:401/200\t PDE_loss=0.0038\t EX=4.3730\t\nloss bonund 1: 0.017411252483725548\nloss pde : 0.004392100032418966\nEpoch:401/300\t PDE_loss=0.0218\t EX=4.0800\t\n47.16729283332825\n3.862374782562256\n4.080016613006592\nA\n1\nEx tensor(4.6626, device='cuda:0', grad_fn=<MeanBackward0>)\nloss bonund 1: 40.93491744995117\nloss pde : 0.002171402098610997\nEpoch:401/0\t PDE_loss=40.9371\t EX=0.0821\t\n","output_type":"stream"},{"traceback":["\u001b[0;31m---------------------------------------------------------------------------\u001b[0m","\u001b[0;31mKeyboardInterrupt\u001b[0m                         Traceback (most recent call last)","Cell \u001b[0;32mIn[72], line 7\u001b[0m\n\u001b[1;32m      5\u001b[0m see \u001b[38;5;241m=\u001b[39mi\n\u001b[1;32m      6\u001b[0m xt,F,L \u001b[38;5;241m=\u001b[39m getFL(see)\n\u001b[0;32m----> 7\u001b[0m EX,ut,t,xt_l,model \u001b[38;5;241m=\u001b[39m\u001b[43mget_nn_solution\u001b[49m\u001b[43m(\u001b[49m\u001b[43mCFG\u001b[49m\u001b[43m,\u001b[49m\u001b[43mxt\u001b[49m\u001b[43m,\u001b[49m\u001b[43mF\u001b[49m\u001b[43m,\u001b[49m\u001b[43mL\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m      8\u001b[0m mcmc\u001b[38;5;241m.\u001b[39mappend(torch\u001b[38;5;241m.\u001b[39mmean(torch\u001b[38;5;241m.\u001b[39msum(xt[\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m],dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m1\u001b[39m))\u001b[38;5;241m.\u001b[39mitem())\n\u001b[1;32m      9\u001b[0m gets\u001b[38;5;241m.\u001b[39mappend(EX)\n","Cell \u001b[0;32mIn[71], line 30\u001b[0m, in \u001b[0;36mget_nn_solution\u001b[0;34m(CFG, xt, F, L)\u001b[0m\n\u001b[1;32m     28\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m epoch \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(CFG\u001b[38;5;241m.\u001b[39mepoch\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m1\u001b[39m\u001b[38;5;241m-\u001b[39m\u001b[38;5;241m100\u001b[39m):\n\u001b[1;32m     29\u001b[0m     optimizer_list[\u001b[38;5;241m0\u001b[39m]\u001b[38;5;241m.\u001b[39mzero_grad()\n\u001b[0;32m---> 30\u001b[0m     loss_2 \u001b[38;5;241m=\u001b[39m \u001b[43mloss_pdes\u001b[49m\u001b[43m(\u001b[49m\u001b[43mt\u001b[49m\u001b[43m,\u001b[49m\u001b[43mxt_l\u001b[49m\u001b[43m,\u001b[49m\u001b[43mf\u001b[49m\u001b[43m,\u001b[49m\u001b[43ml\u001b[49m\u001b[43m,\u001b[49m\u001b[43mmodel\u001b[49m\u001b[43m,\u001b[49m\u001b[43mepoch\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m     31\u001b[0m     loss_2\u001b[38;5;241m.\u001b[39mbackward()\n\u001b[1;32m     32\u001b[0m     optimizer_list[\u001b[38;5;241m0\u001b[39m]\u001b[38;5;241m.\u001b[39mstep()\n","File \u001b[0;32m/opt/conda/lib/python3.10/site-packages/torch/nn/modules/module.py:1501\u001b[0m, in \u001b[0;36mModule._call_impl\u001b[0;34m(self, *args, **kwargs)\u001b[0m\n\u001b[1;32m   1496\u001b[0m \u001b[38;5;66;03m# If we don't have any hooks, we want to skip the rest of the logic in\u001b[39;00m\n\u001b[1;32m   1497\u001b[0m \u001b[38;5;66;03m# this function, and just call forward.\u001b[39;00m\n\u001b[1;32m   1498\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m (\u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_backward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_forward_pre_hooks\n\u001b[1;32m   1499\u001b[0m         \u001b[38;5;129;01mor\u001b[39;00m _global_backward_pre_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_backward_hooks\n\u001b[1;32m   1500\u001b[0m         \u001b[38;5;129;01mor\u001b[39;00m _global_forward_hooks \u001b[38;5;129;01mor\u001b[39;00m _global_forward_pre_hooks):\n\u001b[0;32m-> 1501\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mforward_call\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43margs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m   1502\u001b[0m \u001b[38;5;66;03m# Do not call functions when jit is used\u001b[39;00m\n\u001b[1;32m   1503\u001b[0m full_backward_hooks, non_full_backward_hooks \u001b[38;5;241m=\u001b[39m [], []\n","Cell \u001b[0;32mIn[70], line 43\u001b[0m, in \u001b[0;36mloss_pde.forward\u001b[0;34m(self, t, xt_l, f, ll, model, epoch)\u001b[0m\n\u001b[1;32m     40\u001b[0m ut \u001b[38;5;241m=\u001b[39m d1[:,\u001b[38;5;241m0\u001b[39m]\n\u001b[1;32m     41\u001b[0m a \u001b[38;5;241m=\u001b[39m torch\u001b[38;5;241m.\u001b[39msum(f[s] \u001b[38;5;241m*\u001b[39m d1[:,\u001b[38;5;241m1\u001b[39m:],dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m1\u001b[39m)\n\u001b[0;32m---> 43\u001b[0m d3\u001b[38;5;241m=\u001b[39mtorch\u001b[38;5;241m.\u001b[39msum(torch\u001b[38;5;241m.\u001b[39mcat([torch\u001b[38;5;241m.\u001b[39mautograd\u001b[38;5;241m.\u001b[39mgrad(d1[:,i], x, torch\u001b[38;5;241m.\u001b[39mones_like(d1[:,i]), create_graph\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)[\u001b[38;5;241m0\u001b[39m][:,i]\u001b[38;5;241m.\u001b[39mview(CFG\u001b[38;5;241m.\u001b[39mN,\u001b[38;5;241m1\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m i \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(\u001b[38;5;241m1\u001b[39m,CFG\u001b[38;5;241m.\u001b[39md\u001b[38;5;241m+\u001b[39m\u001b[38;5;241m1\u001b[39m)],dim \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m),dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m1\u001b[39m)\n\u001b[1;32m     44\u001b[0m b\u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m\u001b[38;5;241m/\u001b[39m\u001b[38;5;241m2\u001b[39m\u001b[38;5;241m*\u001b[39md3\n\u001b[1;32m     46\u001b[0m loss_sum \u001b[38;5;241m=\u001b[39m loss_sum \u001b[38;5;241m+\u001b[39m (ut \u001b[38;5;241m+\u001b[39m a\u001b[38;5;241m+\u001b[39m b)\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m2\u001b[39m\n","Cell \u001b[0;32mIn[70], line 43\u001b[0m, in \u001b[0;36m<listcomp>\u001b[0;34m(.0)\u001b[0m\n\u001b[1;32m     40\u001b[0m ut \u001b[38;5;241m=\u001b[39m d1[:,\u001b[38;5;241m0\u001b[39m]\n\u001b[1;32m     41\u001b[0m a \u001b[38;5;241m=\u001b[39m torch\u001b[38;5;241m.\u001b[39msum(f[s] \u001b[38;5;241m*\u001b[39m d1[:,\u001b[38;5;241m1\u001b[39m:],dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m1\u001b[39m)\n\u001b[0;32m---> 43\u001b[0m d3\u001b[38;5;241m=\u001b[39mtorch\u001b[38;5;241m.\u001b[39msum(torch\u001b[38;5;241m.\u001b[39mcat([\u001b[43mtorch\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mautograd\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mgrad\u001b[49m\u001b[43m(\u001b[49m\u001b[43md1\u001b[49m\u001b[43m[\u001b[49m\u001b[43m:\u001b[49m\u001b[43m,\u001b[49m\u001b[43mi\u001b[49m\u001b[43m]\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mx\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtorch\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mones_like\u001b[49m\u001b[43m(\u001b[49m\u001b[43md1\u001b[49m\u001b[43m[\u001b[49m\u001b[43m:\u001b[49m\u001b[43m,\u001b[49m\u001b[43mi\u001b[49m\u001b[43m]\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mcreate_graph\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\u001b[43m)\u001b[49m[\u001b[38;5;241m0\u001b[39m][:,i]\u001b[38;5;241m.\u001b[39mview(CFG\u001b[38;5;241m.\u001b[39mN,\u001b[38;5;241m1\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m i \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(\u001b[38;5;241m1\u001b[39m,CFG\u001b[38;5;241m.\u001b[39md\u001b[38;5;241m+\u001b[39m\u001b[38;5;241m1\u001b[39m)],dim \u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m),dim\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m1\u001b[39m)\n\u001b[1;32m     44\u001b[0m b\u001b[38;5;241m=\u001b[39m \u001b[38;5;241m1\u001b[39m\u001b[38;5;241m/\u001b[39m\u001b[38;5;241m2\u001b[39m\u001b[38;5;241m*\u001b[39md3\n\u001b[1;32m     46\u001b[0m loss_sum \u001b[38;5;241m=\u001b[39m loss_sum \u001b[38;5;241m+\u001b[39m (ut \u001b[38;5;241m+\u001b[39m a\u001b[38;5;241m+\u001b[39m b)\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39m\u001b[38;5;241m2\u001b[39m\n","File \u001b[0;32m/opt/conda/lib/python3.10/site-packages/torch/autograd/__init__.py:303\u001b[0m, in \u001b[0;36mgrad\u001b[0;34m(outputs, inputs, grad_outputs, retain_graph, create_graph, only_inputs, allow_unused, is_grads_batched)\u001b[0m\n\u001b[1;32m    301\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m _vmap_internals\u001b[38;5;241m.\u001b[39m_vmap(vjp, \u001b[38;5;241m0\u001b[39m, \u001b[38;5;241m0\u001b[39m, allow_none_pass_through\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)(grad_outputs_)\n\u001b[1;32m    302\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m--> 303\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[43mVariable\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_execution_engine\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mrun_backward\u001b[49m\u001b[43m(\u001b[49m\u001b[43m  \u001b[49m\u001b[38;5;66;43;03m# Calls into the C++ engine to run the backward pass\u001b[39;49;00m\n\u001b[1;32m    304\u001b[0m \u001b[43m        \u001b[49m\u001b[43mt_outputs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mgrad_outputs_\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mretain_graph\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mcreate_graph\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mt_inputs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    305\u001b[0m \u001b[43m        \u001b[49m\u001b[43mallow_unused\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43maccumulate_grad\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mFalse\u001b[39;49;00m\u001b[43m)\u001b[49m\n","\u001b[0;31mKeyboardInterrupt\u001b[0m: "],"ename":"KeyboardInterrupt","evalue":"","output_type":"error"}]},{"cell_type":"markdown","source":"\ngets=[4.109823226928711,\n 4.301965236663818,\n 3.963670492172241,\n 3.9696247577667236,\n 4.336550712585449,\n 4.3990797996521,\n 4.380660533905029,\n 5.110309600830078,\n 4.416534900665283,\n 4.487505912780762,\n 4.422759056091309,\n 4.470123767852783,\n 4.792152404785156,\n 3.8689281940460205,\n 3.8457119464874268,\n 3.8150579929351807,\n 4.228338241577148,\n 4.068879127502441,\n 3.97515869140625,\n 4.672130107879639,\n 4.416819095611572,\n 3.811925172805786,\n 4.0060343742370605,\n 3.89664363861084,\n 4.642745494842529,\n 3.8429617881774902,\n 4.0620832443237305,\n 3.8862268924713135,\n 4.06233024597168,\n 4.366152763366699]\n","metadata":{"execution":{"iopub.status.busy":"2023-05-07T07:56:57.548056Z","iopub.execute_input":"2023-05-07T07:56:57.548760Z","iopub.status.idle":"2023-05-07T07:56:57.556864Z","shell.execute_reply.started":"2023-05-07T07:56:57.548720Z","shell.execute_reply":"2023-05-07T07:56:57.555578Z"}}},{"cell_type":"markdown","source":"mcmc = [3.862374782562256,\n 4.662585258483887,\n 4.712591648101807,\n 4.465975761413574,\n 3.098313331604004,\n 3.728494167327881,\n 3.9587998390197754,\n 4.81437873840332,\n 4.5207414627075195,\n 3.7769787311553955,\n 3.771496534347534,\n 3.9164388179779053,\n 4.355262279510498,\n 3.673222064971924,\n 3.224835157394409,\n 3.9142062664031982,\n 4.503851890563965,\n 4.026615142822266,\n 3.4772963523864746,\n 3.823160171508789,\n 3.6742522716522217,\n 4.16671085357666,\n 3.63584041595459,\n 4.160348892211914,\n 3.877098798751831,\n 3.8082165718078613,\n 4.380477428436279,\n 4.521143913269043,\n 4.545581817626953,\n 4.275864124298096]\n","metadata":{"execution":{"iopub.status.busy":"2023-05-07T07:56:58.023033Z","iopub.execute_input":"2023-05-07T07:56:58.023759Z","iopub.status.idle":"2023-05-07T07:56:58.031453Z","shell.execute_reply.started":"2023-05-07T07:56:58.023708Z","shell.execute_reply":"2023-05-07T07:56:58.030155Z"}}},{"cell_type":"code","source":"d1 = np.array(gets)\nd2 = np.array(mcmc)\n\n\nprint('%e'%(np.mean(np.abs(d1-4))))\nprint('%e'%(np.mean(np.abs(d2-4))))\nprint('%e'%(np.mean((d1 - np.mean(d1))**2)))\nprint('%e'%(np.mean((d2 - np.mean(d2))**2)))\n\n","metadata":{"execution":{"iopub.status.busy":"2023-05-21T07:38:47.933587Z","iopub.execute_input":"2023-05-21T07:38:47.934161Z","iopub.status.idle":"2023-05-21T07:38:47.946309Z","shell.execute_reply.started":"2023-05-21T07:38:47.934125Z","shell.execute_reply":"2023-05-21T07:38:47.945232Z"},"trusted":true},"execution_count":73,"outputs":[{"name":"stdout","text":"8.001661e-02\n1.376252e-01\n0.000000e+00\n0.000000e+00\n","output_type":"stream"}]}]}