{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Non-A100 GPU detected, using math or mem efficient attention if input tensor is on cuda\n",
      "35719555\n"
     ]
    },
    {
     "data": {
      "application/vnd.jupyter.widget-view+json": {
       "model_id": "de55072daeb84f32bc4a4a61cf4d2626",
       "version_major": 2,
       "version_minor": 0
      },
      "text/plain": [
       "  0%|          | 0/700000 [00:00<?, ?it/s]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "from denoising_diffusion_pytorch import Unet, GaussianDiffusion, Trainer\n",
    "import torch\n",
    "model = Unet(\n",
    "    dim = 64,\n",
    "    dim_mults = (1,2, 4, 8),\n",
    "    flash_attn = True\n",
    ")\n",
    "#model.load_state_dict(torch.load(\"./results/model-26.pt\")['model'])\n",
    "print(sum([p.numel() for p in model.parameters()]))\n",
    "diffusion = GaussianDiffusion(\n",
    "    model,\n",
    "    image_size = 96,\n",
    "    timesteps = 1000,           # number of steps\n",
    "    sampling_timesteps = 250    # number of sampling timesteps (using ddim for faster inference [see citation for ddim paper])\n",
    ")\n",
    "\n",
    "trainer = Trainer(\n",
    "    diffusion,\n",
    "    './data/stl10',\n",
    "    train_batch_size = 56,\n",
    "    train_lr = 8e-5,\n",
    "    train_num_steps = 700000,         # total training steps\n",
    "    gradient_accumulate_every = 2,    # gradient accumulation steps\n",
    "    ema_decay = 0.995,                # exponential moving average decay\n",
    "    amp = True,                       # turn on mixed precision\n",
    "    calculate_fid = True,\n",
    "    save_best_and_latest_only=True, # whether to calculate fid during training\n",
    "    results_folder = './ddpm-stl-96/denoising_lib',\n",
    "    num_fid_samples=56,# number of samples for calculating fid\n",
    ")\n",
    "trainer.load(45)\n",
    "trainer.train()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "ename": "RuntimeError",
     "evalue": "Error(s) in loading state_dict for Unet:\n\tMissing key(s) in state_dict: \"init_conv.weight\", \"init_conv.bias\", \"time_mlp.1.weight\", \"time_mlp.1.bias\", \"time_mlp.3.weight\", \"time_mlp.3.bias\", \"downs.0.0.mlp.1.weight\", \"downs.0.0.mlp.1.bias\", \"downs.0.0.block1.proj.weight\", \"downs.0.0.block1.proj.bias\", \"downs.0.0.block1.norm.weight\", \"downs.0.0.block1.norm.bias\", \"downs.0.0.block2.proj.weight\", \"downs.0.0.block2.proj.bias\", \"downs.0.0.block2.norm.weight\", \"downs.0.0.block2.norm.bias\", \"downs.0.1.mlp.1.weight\", \"downs.0.1.mlp.1.bias\", \"downs.0.1.block1.proj.weight\", \"downs.0.1.block1.proj.bias\", \"downs.0.1.block1.norm.weight\", \"downs.0.1.block1.norm.bias\", \"downs.0.1.block2.proj.weight\", \"downs.0.1.block2.proj.bias\", \"downs.0.1.block2.norm.weight\", \"downs.0.1.block2.norm.bias\", \"downs.0.2.mem_kv\", \"downs.0.2.norm.g\", \"downs.0.2.to_qkv.weight\", \"downs.0.2.to_out.0.weight\", \"downs.0.2.to_out.0.bias\", \"downs.0.2.to_out.1.g\", \"downs.0.3.1.weight\", \"downs.0.3.1.bias\", \"downs.1.0.mlp.1.weight\", \"downs.1.0.mlp.1.bias\", \"downs.1.0.block1.proj.weight\", \"downs.1.0.block1.proj.bias\", \"downs.1.0.block1.norm.weight\", \"downs.1.0.block1.norm.bias\", \"downs.1.0.block2.proj.weight\", \"downs.1.0.block2.proj.bias\", \"downs.1.0.block2.norm.weight\", \"downs.1.0.block2.norm.bias\", \"downs.1.1.mlp.1.weight\", \"downs.1.1.mlp.1.bias\", \"downs.1.1.block1.proj.weight\", \"downs.1.1.block1.proj.bias\", \"downs.1.1.block1.norm.weight\", \"downs.1.1.block1.norm.bias\", \"downs.1.1.block2.proj.weight\", \"downs.1.1.block2.proj.bias\", \"downs.1.1.block2.norm.weight\", \"downs.1.1.block2.norm.bias\", \"downs.1.2.mem_kv\", \"downs.1.2.norm.g\", \"downs.1.2.to_qkv.weight\", \"downs.1.2.to_out.0.weight\", \"downs.1.2.to_out.0.bias\", \"downs.1.2.to_out.1.g\", \"downs.1.3.1.weight\", \"downs.1.3.1.bias\", \"downs.2.0.mlp.1.weight\", \"downs.2.0.mlp.1.bias\", \"downs.2.0.block1.proj.weight\", \"downs.2.0.block1.proj.bias\", \"downs.2.0.block1.norm.weight\", \"downs.2.0.block1.norm.bias\", \"downs.2.0.block2.proj.weight\", \"downs.2.0.block2.proj.bias\", \"downs.2.0.block2.norm.weight\", \"downs.2.0.block2.norm.bias\", \"downs.2.1.mlp.1.weight\", \"downs.2.1.mlp.1.bias\", \"downs.2.1.block1.proj.weight\", \"downs.2.1.block1.proj.bias\", \"downs.2.1.block1.norm.weight\", \"downs.2.1.block1.norm.bias\", \"downs.2.1.block2.proj.weight\", \"downs.2.1.block2.proj.bias\", \"downs.2.1.block2.norm.weight\", \"downs.2.1.block2.norm.bias\", \"downs.2.2.mem_kv\", \"downs.2.2.norm.g\", \"downs.2.2.to_qkv.weight\", \"downs.2.2.to_out.0.weight\", \"downs.2.2.to_out.0.bias\", \"downs.2.2.to_out.1.g\", \"downs.2.3.1.weight\", \"downs.2.3.1.bias\", \"downs.3.0.mlp.1.weight\", \"downs.3.0.mlp.1.bias\", \"downs.3.0.block1.proj.weight\", \"downs.3.0.block1.proj.bias\", \"downs.3.0.block1.norm.weight\", \"downs.3.0.block1.norm.bias\", \"downs.3.0.block2.proj.weight\", \"downs.3.0.block2.proj.bias\", \"downs.3.0.block2.norm.weight\", \"downs.3.0.block2.norm.bias\", \"downs.3.1.mlp.1.weight\", \"downs.3.1.mlp.1.bias\", \"downs.3.1.block1.proj.weight\", \"downs.3.1.block1.proj.bias\", \"downs.3.1.block1.norm.weight\", \"downs.3.1.block1.norm.bias\", \"downs.3.1.block2.proj.weight\", \"downs.3.1.block2.proj.bias\", \"downs.3.1.block2.norm.weight\", \"downs.3.1.block2.norm.bias\", \"downs.3.2.mem_kv\", \"downs.3.2.norm.g\", \"downs.3.2.to_qkv.weight\", \"downs.3.2.to_out.weight\", \"downs.3.2.to_out.bias\", \"downs.3.3.weight\", \"downs.3.3.bias\", \"ups.0.0.mlp.1.weight\", \"ups.0.0.mlp.1.bias\", \"ups.0.0.block1.proj.weight\", \"ups.0.0.block1.proj.bias\", \"ups.0.0.block1.norm.weight\", \"ups.0.0.block1.norm.bias\", \"ups.0.0.block2.proj.weight\", \"ups.0.0.block2.proj.bias\", \"ups.0.0.block2.norm.weight\", \"ups.0.0.block2.norm.bias\", \"ups.0.0.res_conv.weight\", \"ups.0.0.res_conv.bias\", \"ups.0.1.mlp.1.weight\", \"ups.0.1.mlp.1.bias\", \"ups.0.1.block1.proj.weight\", \"ups.0.1.block1.proj.bias\", \"ups.0.1.block1.norm.weight\", \"ups.0.1.block1.norm.bias\", \"ups.0.1.block2.proj.weight\", \"ups.0.1.block2.proj.bias\", \"ups.0.1.block2.norm.weight\", \"ups.0.1.block2.norm.bias\", \"ups.0.1.res_conv.weight\", \"ups.0.1.res_conv.bias\", \"ups.0.2.mem_kv\", \"ups.0.2.norm.g\", \"ups.0.2.to_qkv.weight\", \"ups.0.2.to_out.weight\", \"ups.0.2.to_out.bias\", \"ups.0.3.1.weight\", \"ups.0.3.1.bias\", \"ups.1.0.mlp.1.weight\", \"ups.1.0.mlp.1.bias\", \"ups.1.0.block1.proj.weight\", \"ups.1.0.block1.proj.bias\", \"ups.1.0.block1.norm.weight\", \"ups.1.0.block1.norm.bias\", \"ups.1.0.block2.proj.weight\", \"ups.1.0.block2.proj.bias\", \"ups.1.0.block2.norm.weight\", \"ups.1.0.block2.norm.bias\", \"ups.1.0.res_conv.weight\", \"ups.1.0.res_conv.bias\", \"ups.1.1.mlp.1.weight\", \"ups.1.1.mlp.1.bias\", \"ups.1.1.block1.proj.weight\", \"ups.1.1.block1.proj.bias\", \"ups.1.1.block1.norm.weight\", \"ups.1.1.block1.norm.bias\", \"ups.1.1.block2.proj.weight\", \"ups.1.1.block2.proj.bias\", \"ups.1.1.block2.norm.weight\", \"ups.1.1.block2.norm.bias\", \"ups.1.1.res_conv.weight\", \"ups.1.1.res_conv.bias\", \"ups.1.2.mem_kv\", \"ups.1.2.norm.g\", \"ups.1.2.to_qkv.weight\", \"ups.1.2.to_out.0.weight\", \"ups.1.2.to_out.0.bias\", \"ups.1.2.to_out.1.g\", \"ups.1.3.1.weight\", \"ups.1.3.1.bias\", \"ups.2.0.mlp.1.weight\", \"ups.2.0.mlp.1.bias\", \"ups.2.0.block1.proj.weight\", \"ups.2.0.block1.proj.bias\", \"ups.2.0.block1.norm.weight\", \"ups.2.0.block1.norm.bias\", \"ups.2.0.block2.proj.weight\", \"ups.2.0.block2.proj.bias\", \"ups.2.0.block2.norm.weight\", \"ups.2.0.block2.norm.bias\", \"ups.2.0.res_conv.weight\", \"ups.2.0.res_conv.bias\", \"ups.2.1.mlp.1.weight\", \"ups.2.1.mlp.1.bias\", \"ups.2.1.block1.proj.weight\", \"ups.2.1.block1.proj.bias\", \"ups.2.1.block1.norm.weight\", \"ups.2.1.block1.norm.bias\", \"ups.2.1.block2.proj.weight\", \"ups.2.1.block2.proj.bias\", \"ups.2.1.block2.norm.weight\", \"ups.2.1.block2.norm.bias\", \"ups.2.1.res_conv.weight\", \"ups.2.1.res_conv.bias\", \"ups.2.2.mem_kv\", \"ups.2.2.norm.g\", \"ups.2.2.to_qkv.weight\", \"ups.2.2.to_out.0.weight\", \"ups.2.2.to_out.0.bias\", \"ups.2.2.to_out.1.g\", \"ups.2.3.1.weight\", \"ups.2.3.1.bias\", \"ups.3.0.mlp.1.weight\", \"ups.3.0.mlp.1.bias\", \"ups.3.0.block1.proj.weight\", \"ups.3.0.block1.proj.bias\", \"ups.3.0.block1.norm.weight\", \"ups.3.0.block1.norm.bias\", \"ups.3.0.block2.proj.weight\", \"ups.3.0.block2.proj.bias\", \"ups.3.0.block2.norm.weight\", \"ups.3.0.block2.norm.bias\", \"ups.3.0.res_conv.weight\", \"ups.3.0.res_conv.bias\", \"ups.3.1.mlp.1.weight\", \"ups.3.1.mlp.1.bias\", \"ups.3.1.block1.proj.weight\", \"ups.3.1.block1.proj.bias\", \"ups.3.1.block1.norm.weight\", \"ups.3.1.block1.norm.bias\", \"ups.3.1.block2.proj.weight\", \"ups.3.1.block2.proj.bias\", \"ups.3.1.block2.norm.weight\", \"ups.3.1.block2.norm.bias\", \"ups.3.1.res_conv.weight\", \"ups.3.1.res_conv.bias\", \"ups.3.2.mem_kv\", \"ups.3.2.norm.g\", \"ups.3.2.to_qkv.weight\", \"ups.3.2.to_out.0.weight\", \"ups.3.2.to_out.0.bias\", \"ups.3.2.to_out.1.g\", \"ups.3.3.weight\", \"ups.3.3.bias\", \"mid_block1.mlp.1.weight\", \"mid_block1.mlp.1.bias\", \"mid_block1.block1.proj.weight\", \"mid_block1.block1.proj.bias\", \"mid_block1.block1.norm.weight\", \"mid_block1.block1.norm.bias\", \"mid_block1.block2.proj.weight\", \"mid_block1.block2.proj.bias\", \"mid_block1.block2.norm.weight\", \"mid_block1.block2.norm.bias\", \"mid_attn.mem_kv\", \"mid_attn.norm.g\", \"mid_attn.to_qkv.weight\", \"mid_attn.to_out.weight\", \"mid_attn.to_out.bias\", \"mid_block2.mlp.1.weight\", \"mid_block2.mlp.1.bias\", \"mid_block2.block1.proj.weight\", \"mid_block2.block1.proj.bias\", \"mid_block2.block1.norm.weight\", \"mid_block2.block1.norm.bias\", \"mid_block2.block2.proj.weight\", \"mid_block2.block2.proj.bias\", \"mid_block2.block2.norm.weight\", \"mid_block2.block2.norm.bias\", \"final_res_block.mlp.1.weight\", \"final_res_block.mlp.1.bias\", \"final_res_block.block1.proj.weight\", \"final_res_block.block1.proj.bias\", \"final_res_block.block1.norm.weight\", \"final_res_block.block1.norm.bias\", \"final_res_block.block2.proj.weight\", \"final_res_block.block2.proj.bias\", \"final_res_block.block2.norm.weight\", \"final_res_block.block2.norm.bias\", \"final_res_block.res_conv.weight\", \"final_res_block.res_conv.bias\", \"final_conv.weight\", \"final_conv.bias\". \n\tUnexpected key(s) in state_dict: \"betas\", \"alphas_cumprod\", \"alphas_cumprod_prev\", \"sqrt_alphas_cumprod\", \"sqrt_one_minus_alphas_cumprod\", \"log_one_minus_alphas_cumprod\", \"sqrt_recip_alphas_cumprod\", \"sqrt_recipm1_alphas_cumprod\", \"posterior_variance\", \"posterior_log_variance_clipped\", \"posterior_mean_coef1\", \"posterior_mean_coef2\", \"loss_weight\", \"model.init_conv.weight\", \"model.init_conv.bias\", \"model.time_mlp.1.weight\", \"model.time_mlp.1.bias\", \"model.time_mlp.3.weight\", \"model.time_mlp.3.bias\", \"model.downs.0.0.mlp.1.weight\", \"model.downs.0.0.mlp.1.bias\", \"model.downs.0.0.block1.proj.weight\", \"model.downs.0.0.block1.proj.bias\", \"model.downs.0.0.block1.norm.weight\", \"model.downs.0.0.block1.norm.bias\", \"model.downs.0.0.block2.proj.weight\", \"model.downs.0.0.block2.proj.bias\", \"model.downs.0.0.block2.norm.weight\", \"model.downs.0.0.block2.norm.bias\", \"model.downs.0.1.mlp.1.weight\", \"model.downs.0.1.mlp.1.bias\", \"model.downs.0.1.block1.proj.weight\", \"model.downs.0.1.block1.proj.bias\", \"model.downs.0.1.block1.norm.weight\", \"model.downs.0.1.block1.norm.bias\", \"model.downs.0.1.block2.proj.weight\", \"model.downs.0.1.block2.proj.bias\", \"model.downs.0.1.block2.norm.weight\", \"model.downs.0.1.block2.norm.bias\", \"model.downs.0.2.mem_kv\", \"model.downs.0.2.norm.g\", \"model.downs.0.2.to_qkv.weight\", \"model.downs.0.2.to_out.0.weight\", \"model.downs.0.2.to_out.0.bias\", \"model.downs.0.2.to_out.1.g\", \"model.downs.0.3.1.weight\", \"model.downs.0.3.1.bias\", \"model.downs.1.0.mlp.1.weight\", \"model.downs.1.0.mlp.1.bias\", \"model.downs.1.0.block1.proj.weight\", \"model.downs.1.0.block1.proj.bias\", \"model.downs.1.0.block1.norm.weight\", \"model.downs.1.0.block1.norm.bias\", \"model.downs.1.0.block2.proj.weight\", \"model.downs.1.0.block2.proj.bias\", \"model.downs.1.0.block2.norm.weight\", \"model.downs.1.0.block2.norm.bias\", \"model.downs.1.1.mlp.1.weight\", \"model.downs.1.1.mlp.1.bias\", \"model.downs.1.1.block1.proj.weight\", \"model.downs.1.1.block1.proj.bias\", \"model.downs.1.1.block1.norm.weight\", \"model.downs.1.1.block1.norm.bias\", \"model.downs.1.1.block2.proj.weight\", \"model.downs.1.1.block2.proj.bias\", \"model.downs.1.1.block2.norm.weight\", \"model.downs.1.1.block2.norm.bias\", \"model.downs.1.2.mem_kv\", \"model.downs.1.2.norm.g\", \"model.downs.1.2.to_qkv.weight\", \"model.downs.1.2.to_out.0.weight\", \"model.downs.1.2.to_out.0.bias\", \"model.downs.1.2.to_out.1.g\", \"model.downs.1.3.1.weight\", \"model.downs.1.3.1.bias\", \"model.downs.2.0.mlp.1.weight\", \"model.downs.2.0.mlp.1.bias\", \"model.downs.2.0.block1.proj.weight\", \"model.downs.2.0.block1.proj.bias\", \"model.downs.2.0.block1.norm.weight\", \"model.downs.2.0.block1.norm.bias\", \"model.downs.2.0.block2.proj.weight\", \"model.downs.2.0.block2.proj.bias\", \"model.downs.2.0.block2.norm.weight\", \"model.downs.2.0.block2.norm.bias\", \"model.downs.2.1.mlp.1.weight\", \"model.downs.2.1.mlp.1.bias\", \"model.downs.2.1.block1.proj.weight\", \"model.downs.2.1.block1.proj.bias\", \"model.downs.2.1.block1.norm.weight\", \"model.downs.2.1.block1.norm.bias\", \"model.downs.2.1.block2.proj.weight\", \"model.downs.2.1.block2.proj.bias\", \"model.downs.2.1.block2.norm.weight\", \"model.downs.2.1.block2.norm.bias\", \"model.downs.2.2.mem_kv\", \"model.downs.2.2.norm.g\", \"model.downs.2.2.to_qkv.weight\", \"model.downs.2.2.to_out.0.weight\", \"model.downs.2.2.to_out.0.bias\", \"model.downs.2.2.to_out.1.g\", \"model.downs.2.3.1.weight\", \"model.downs.2.3.1.bias\", \"model.downs.3.0.mlp.1.weight\", \"model.downs.3.0.mlp.1.bias\", \"model.downs.3.0.block1.proj.weight\", \"model.downs.3.0.block1.proj.bias\", \"model.downs.3.0.block1.norm.weight\", \"model.downs.3.0.block1.norm.bias\", \"model.downs.3.0.block2.proj.weight\", \"model.downs.3.0.block2.proj.bias\", \"model.downs.3.0.block2.norm.weight\", \"model.downs.3.0.block2.norm.bias\", \"model.downs.3.1.mlp.1.weight\", \"model.downs.3.1.mlp.1.bias\", \"model.downs.3.1.block1.proj.weight\", \"model.downs.3.1.block1.proj.bias\", \"model.downs.3.1.block1.norm.weight\", \"model.downs.3.1.block1.norm.bias\", \"model.downs.3.1.block2.proj.weight\", \"model.downs.3.1.block2.proj.bias\", \"model.downs.3.1.block2.norm.weight\", \"model.downs.3.1.block2.norm.bias\", \"model.downs.3.2.mem_kv\", \"model.downs.3.2.norm.g\", \"model.downs.3.2.to_qkv.weight\", \"model.downs.3.2.to_out.weight\", \"model.downs.3.2.to_out.bias\", \"model.downs.3.3.weight\", \"model.downs.3.3.bias\", \"model.ups.0.0.mlp.1.weight\", \"model.ups.0.0.mlp.1.bias\", \"model.ups.0.0.block1.proj.weight\", \"model.ups.0.0.block1.proj.bias\", \"model.ups.0.0.block1.norm.weight\", \"model.ups.0.0.block1.norm.bias\", \"model.ups.0.0.block2.proj.weight\", \"model.ups.0.0.block2.proj.bias\", \"model.ups.0.0.block2.norm.weight\", \"model.ups.0.0.block2.norm.bias\", \"model.ups.0.0.res_conv.weight\", \"model.ups.0.0.res_conv.bias\", \"model.ups.0.1.mlp.1.weight\", \"model.ups.0.1.mlp.1.bias\", \"model.ups.0.1.block1.proj.weight\", \"model.ups.0.1.block1.proj.bias\", \"model.ups.0.1.block1.norm.weight\", \"model.ups.0.1.block1.norm.bias\", \"model.ups.0.1.block2.proj.weight\", \"model.ups.0.1.block2.proj.bias\", \"model.ups.0.1.block2.norm.weight\", \"model.ups.0.1.block2.norm.bias\", \"model.ups.0.1.res_conv.weight\", \"model.ups.0.1.res_conv.bias\", \"model.ups.0.2.mem_kv\", \"model.ups.0.2.norm.g\", \"model.ups.0.2.to_qkv.weight\", \"model.ups.0.2.to_out.weight\", \"model.ups.0.2.to_out.bias\", \"model.ups.0.3.1.weight\", \"model.ups.0.3.1.bias\", \"model.ups.1.0.mlp.1.weight\", \"model.ups.1.0.mlp.1.bias\", \"model.ups.1.0.block1.proj.weight\", \"model.ups.1.0.block1.proj.bias\", \"model.ups.1.0.block1.norm.weight\", \"model.ups.1.0.block1.norm.bias\", \"model.ups.1.0.block2.proj.weight\", \"model.ups.1.0.block2.proj.bias\", \"model.ups.1.0.block2.norm.weight\", \"model.ups.1.0.block2.norm.bias\", \"model.ups.1.0.res_conv.weight\", \"model.ups.1.0.res_conv.bias\", \"model.ups.1.1.mlp.1.weight\", \"model.ups.1.1.mlp.1.bias\", \"model.ups.1.1.block1.proj.weight\", \"model.ups.1.1.block1.proj.bias\", \"model.ups.1.1.block1.norm.weight\", \"model.ups.1.1.block1.norm.bias\", \"model.ups.1.1.block2.proj.weight\", \"model.ups.1.1.block2.proj.bias\", \"model.ups.1.1.block2.norm.weight\", \"model.ups.1.1.block2.norm.bias\", \"model.ups.1.1.res_conv.weight\", \"model.ups.1.1.res_conv.bias\", \"model.ups.1.2.mem_kv\", \"model.ups.1.2.norm.g\", \"model.ups.1.2.to_qkv.weight\", \"model.ups.1.2.to_out.0.weight\", \"model.ups.1.2.to_out.0.bias\", \"model.ups.1.2.to_out.1.g\", \"model.ups.1.3.1.weight\", \"model.ups.1.3.1.bias\", \"model.ups.2.0.mlp.1.weight\", \"model.ups.2.0.mlp.1.bias\", \"model.ups.2.0.block1.proj.weight\", \"model.ups.2.0.block1.proj.bias\", \"model.ups.2.0.block1.norm.weight\", \"model.ups.2.0.block1.norm.bias\", \"model.ups.2.0.block2.proj.weight\", \"model.ups.2.0.block2.proj.bias\", \"model.ups.2.0.block2.norm.weight\", \"model.ups.2.0.block2.norm.bias\", \"model.ups.2.0.res_conv.weight\", \"model.ups.2.0.res_conv.bias\", \"model.ups.2.1.mlp.1.weight\", \"model.ups.2.1.mlp.1.bias\", \"model.ups.2.1.block1.proj.weight\", \"model.ups.2.1.block1.proj.bias\", \"model.ups.2.1.block1.norm.weight\", \"model.ups.2.1.block1.norm.bias\", \"model.ups.2.1.block2.proj.weight\", \"model.ups.2.1.block2.proj.bias\", \"model.ups.2.1.block2.norm.weight\", \"model.ups.2.1.block2.norm.bias\", \"model.ups.2.1.res_conv.weight\", \"model.ups.2.1.res_conv.bias\", \"model.ups.2.2.mem_kv\", \"model.ups.2.2.norm.g\", \"model.ups.2.2.to_qkv.weight\", \"model.ups.2.2.to_out.0.weight\", \"model.ups.2.2.to_out.0.bias\", \"model.ups.2.2.to_out.1.g\", \"model.ups.2.3.1.weight\", \"model.ups.2.3.1.bias\", \"model.ups.3.0.mlp.1.weight\", \"model.ups.3.0.mlp.1.bias\", \"model.ups.3.0.block1.proj.weight\", \"model.ups.3.0.block1.proj.bias\", \"model.ups.3.0.block1.norm.weight\", \"model.ups.3.0.block1.norm.bias\", \"model.ups.3.0.block2.proj.weight\", \"model.ups.3.0.block2.proj.bias\", \"model.ups.3.0.block2.norm.weight\", \"model.ups.3.0.block2.norm.bias\", \"model.ups.3.0.res_conv.weight\", \"model.ups.3.0.res_conv.bias\", \"model.ups.3.1.mlp.1.weight\", \"model.ups.3.1.mlp.1.bias\", \"model.ups.3.1.block1.proj.weight\", \"model.ups.3.1.block1.proj.bias\", \"model.ups.3.1.block1.norm.weight\", \"model.ups.3.1.block1.norm.bias\", \"model.ups.3.1.block2.proj.weight\", \"model.ups.3.1.block2.proj.bias\", \"model.ups.3.1.block2.norm.weight\", \"model.ups.3.1.block2.norm.bias\", \"model.ups.3.1.res_conv.weight\", \"model.ups.3.1.res_conv.bias\", \"model.ups.3.2.mem_kv\", \"model.ups.3.2.norm.g\", \"model.ups.3.2.to_qkv.weight\", \"model.ups.3.2.to_out.0.weight\", \"model.ups.3.2.to_out.0.bias\", \"model.ups.3.2.to_out.1.g\", \"model.ups.3.3.weight\", \"model.ups.3.3.bias\", \"model.mid_block1.mlp.1.weight\", \"model.mid_block1.mlp.1.bias\", \"model.mid_block1.block1.proj.weight\", \"model.mid_block1.block1.proj.bias\", \"model.mid_block1.block1.norm.weight\", \"model.mid_block1.block1.norm.bias\", \"model.mid_block1.block2.proj.weight\", \"model.mid_block1.block2.proj.bias\", \"model.mid_block1.block2.norm.weight\", \"model.mid_block1.block2.norm.bias\", \"model.mid_attn.mem_kv\", \"model.mid_attn.norm.g\", \"model.mid_attn.to_qkv.weight\", \"model.mid_attn.to_out.weight\", \"model.mid_attn.to_out.bias\", \"model.mid_block2.mlp.1.weight\", \"model.mid_block2.mlp.1.bias\", \"model.mid_block2.block1.proj.weight\", \"model.mid_block2.block1.proj.bias\", \"model.mid_block2.block1.norm.weight\", \"model.mid_block2.block1.norm.bias\", \"model.mid_block2.block2.proj.weight\", \"model.mid_block2.block2.proj.bias\", \"model.mid_block2.block2.norm.weight\", \"model.mid_block2.block2.norm.bias\", \"model.final_res_block.mlp.1.weight\", \"model.final_res_block.mlp.1.bias\", \"model.final_res_block.block1.proj.weight\", \"model.final_res_block.block1.proj.bias\", \"model.final_res_block.block1.norm.weight\", \"model.final_res_block.block1.norm.bias\", \"model.final_res_block.block2.proj.weight\", \"model.final_res_block.block2.proj.bias\", \"model.final_res_block.block2.norm.weight\", \"model.final_res_block.block2.norm.bias\", \"model.final_res_block.res_conv.weight\", \"model.final_res_block.res_conv.bias\", \"model.final_conv.weight\", \"model.final_conv.bias\". ",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
      "Input \u001b[1;32mIn [3]\u001b[0m, in \u001b[0;36m<cell line: 1>\u001b[1;34m()\u001b[0m\n\u001b[1;32m----> 1\u001b[0m \u001b[43mmodel\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload_state_dict\u001b[49m\u001b[43m(\u001b[49m\u001b[43mtorch\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mload\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43m./ddpm-stl-96/denoising_lib/model-45.pt\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m)\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[38;5;124;43mmodel\u001b[39;49m\u001b[38;5;124;43m'\u001b[39;49m\u001b[43m]\u001b[49m\u001b[43m)\u001b[49m\n",
      "File \u001b[1;32md:\\Anaconda\\lib\\site-packages\\torch\\nn\\modules\\module.py:2152\u001b[0m, in \u001b[0;36mModule.load_state_dict\u001b[1;34m(self, state_dict, strict, assign)\u001b[0m\n\u001b[0;32m   2147\u001b[0m         error_msgs\u001b[38;5;241m.\u001b[39minsert(\n\u001b[0;32m   2148\u001b[0m             \u001b[38;5;241m0\u001b[39m, \u001b[38;5;124m'\u001b[39m\u001b[38;5;124mMissing key(s) in state_dict: \u001b[39m\u001b[38;5;132;01m{}\u001b[39;00m\u001b[38;5;124m. \u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;241m.\u001b[39mformat(\n\u001b[0;32m   2149\u001b[0m                 \u001b[38;5;124m'\u001b[39m\u001b[38;5;124m, \u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;241m.\u001b[39mjoin(\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m'\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mk\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m'\u001b[39m \u001b[38;5;28;01mfor\u001b[39;00m k \u001b[38;5;129;01min\u001b[39;00m missing_keys)))\n\u001b[0;32m   2151\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(error_msgs) \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[1;32m-> 2152\u001b[0m     \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mRuntimeError\u001b[39;00m(\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mError(s) in loading state_dict for \u001b[39m\u001b[38;5;132;01m{}\u001b[39;00m\u001b[38;5;124m:\u001b[39m\u001b[38;5;130;01m\\n\u001b[39;00m\u001b[38;5;130;01m\\t\u001b[39;00m\u001b[38;5;132;01m{}\u001b[39;00m\u001b[38;5;124m'\u001b[39m\u001b[38;5;241m.\u001b[39mformat(\n\u001b[0;32m   2153\u001b[0m                        \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__class__\u001b[39m\u001b[38;5;241m.\u001b[39m\u001b[38;5;18m__name__\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;130;01m\\n\u001b[39;00m\u001b[38;5;130;01m\\t\u001b[39;00m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;241m.\u001b[39mjoin(error_msgs)))\n\u001b[0;32m   2154\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m _IncompatibleKeys(missing_keys, unexpected_keys)\n",
      "\u001b[1;31mRuntimeError\u001b[0m: Error(s) in loading state_dict for Unet:\n\tMissing key(s) in state_dict: \"init_conv.weight\", \"init_conv.bias\", \"time_mlp.1.weight\", \"time_mlp.1.bias\", \"time_mlp.3.weight\", \"time_mlp.3.bias\", \"downs.0.0.mlp.1.weight\", \"downs.0.0.mlp.1.bias\", \"downs.0.0.block1.proj.weight\", \"downs.0.0.block1.proj.bias\", \"downs.0.0.block1.norm.weight\", \"downs.0.0.block1.norm.bias\", \"downs.0.0.block2.proj.weight\", \"downs.0.0.block2.proj.bias\", \"downs.0.0.block2.norm.weight\", \"downs.0.0.block2.norm.bias\", \"downs.0.1.mlp.1.weight\", \"downs.0.1.mlp.1.bias\", \"downs.0.1.block1.proj.weight\", \"downs.0.1.block1.proj.bias\", \"downs.0.1.block1.norm.weight\", \"downs.0.1.block1.norm.bias\", \"downs.0.1.block2.proj.weight\", \"downs.0.1.block2.proj.bias\", \"downs.0.1.block2.norm.weight\", \"downs.0.1.block2.norm.bias\", \"downs.0.2.mem_kv\", \"downs.0.2.norm.g\", \"downs.0.2.to_qkv.weight\", \"downs.0.2.to_out.0.weight\", \"downs.0.2.to_out.0.bias\", \"downs.0.2.to_out.1.g\", \"downs.0.3.1.weight\", \"downs.0.3.1.bias\", \"downs.1.0.mlp.1.weight\", \"downs.1.0.mlp.1.bias\", \"downs.1.0.block1.proj.weight\", \"downs.1.0.block1.proj.bias\", \"downs.1.0.block1.norm.weight\", \"downs.1.0.block1.norm.bias\", \"downs.1.0.block2.proj.weight\", \"downs.1.0.block2.proj.bias\", \"downs.1.0.block2.norm.weight\", \"downs.1.0.block2.norm.bias\", \"downs.1.1.mlp.1.weight\", \"downs.1.1.mlp.1.bias\", \"downs.1.1.block1.proj.weight\", \"downs.1.1.block1.proj.bias\", \"downs.1.1.block1.norm.weight\", \"downs.1.1.block1.norm.bias\", \"downs.1.1.block2.proj.weight\", \"downs.1.1.block2.proj.bias\", \"downs.1.1.block2.norm.weight\", \"downs.1.1.block2.norm.bias\", \"downs.1.2.mem_kv\", \"downs.1.2.norm.g\", \"downs.1.2.to_qkv.weight\", \"downs.1.2.to_out.0.weight\", \"downs.1.2.to_out.0.bias\", \"downs.1.2.to_out.1.g\", \"downs.1.3.1.weight\", \"downs.1.3.1.bias\", \"downs.2.0.mlp.1.weight\", \"downs.2.0.mlp.1.bias\", \"downs.2.0.block1.proj.weight\", \"downs.2.0.block1.proj.bias\", \"downs.2.0.block1.norm.weight\", \"downs.2.0.block1.norm.bias\", \"downs.2.0.block2.proj.weight\", \"downs.2.0.block2.proj.bias\", \"downs.2.0.block2.norm.weight\", \"downs.2.0.block2.norm.bias\", \"downs.2.1.mlp.1.weight\", \"downs.2.1.mlp.1.bias\", \"downs.2.1.block1.proj.weight\", \"downs.2.1.block1.proj.bias\", \"downs.2.1.block1.norm.weight\", \"downs.2.1.block1.norm.bias\", \"downs.2.1.block2.proj.weight\", \"downs.2.1.block2.proj.bias\", \"downs.2.1.block2.norm.weight\", \"downs.2.1.block2.norm.bias\", \"downs.2.2.mem_kv\", \"downs.2.2.norm.g\", \"downs.2.2.to_qkv.weight\", \"downs.2.2.to_out.0.weight\", \"downs.2.2.to_out.0.bias\", \"downs.2.2.to_out.1.g\", \"downs.2.3.1.weight\", \"downs.2.3.1.bias\", \"downs.3.0.mlp.1.weight\", \"downs.3.0.mlp.1.bias\", \"downs.3.0.block1.proj.weight\", \"downs.3.0.block1.proj.bias\", \"downs.3.0.block1.norm.weight\", \"downs.3.0.block1.norm.bias\", \"downs.3.0.block2.proj.weight\", \"downs.3.0.block2.proj.bias\", \"downs.3.0.block2.norm.weight\", \"downs.3.0.block2.norm.bias\", \"downs.3.1.mlp.1.weight\", \"downs.3.1.mlp.1.bias\", \"downs.3.1.block1.proj.weight\", \"downs.3.1.block1.proj.bias\", \"downs.3.1.block1.norm.weight\", \"downs.3.1.block1.norm.bias\", \"downs.3.1.block2.proj.weight\", \"downs.3.1.block2.proj.bias\", \"downs.3.1.block2.norm.weight\", \"downs.3.1.block2.norm.bias\", \"downs.3.2.mem_kv\", \"downs.3.2.norm.g\", \"downs.3.2.to_qkv.weight\", \"downs.3.2.to_out.weight\", \"downs.3.2.to_out.bias\", \"downs.3.3.weight\", \"downs.3.3.bias\", \"ups.0.0.mlp.1.weight\", \"ups.0.0.mlp.1.bias\", \"ups.0.0.block1.proj.weight\", \"ups.0.0.block1.proj.bias\", \"ups.0.0.block1.norm.weight\", \"ups.0.0.block1.norm.bias\", \"ups.0.0.block2.proj.weight\", \"ups.0.0.block2.proj.bias\", \"ups.0.0.block2.norm.weight\", \"ups.0.0.block2.norm.bias\", \"ups.0.0.res_conv.weight\", \"ups.0.0.res_conv.bias\", \"ups.0.1.mlp.1.weight\", \"ups.0.1.mlp.1.bias\", \"ups.0.1.block1.proj.weight\", \"ups.0.1.block1.proj.bias\", \"ups.0.1.block1.norm.weight\", \"ups.0.1.block1.norm.bias\", \"ups.0.1.block2.proj.weight\", \"ups.0.1.block2.proj.bias\", \"ups.0.1.block2.norm.weight\", \"ups.0.1.block2.norm.bias\", \"ups.0.1.res_conv.weight\", \"ups.0.1.res_conv.bias\", \"ups.0.2.mem_kv\", \"ups.0.2.norm.g\", \"ups.0.2.to_qkv.weight\", \"ups.0.2.to_out.weight\", \"ups.0.2.to_out.bias\", \"ups.0.3.1.weight\", \"ups.0.3.1.bias\", \"ups.1.0.mlp.1.weight\", \"ups.1.0.mlp.1.bias\", \"ups.1.0.block1.proj.weight\", \"ups.1.0.block1.proj.bias\", \"ups.1.0.block1.norm.weight\", \"ups.1.0.block1.norm.bias\", \"ups.1.0.block2.proj.weight\", \"ups.1.0.block2.proj.bias\", \"ups.1.0.block2.norm.weight\", \"ups.1.0.block2.norm.bias\", \"ups.1.0.res_conv.weight\", \"ups.1.0.res_conv.bias\", \"ups.1.1.mlp.1.weight\", \"ups.1.1.mlp.1.bias\", \"ups.1.1.block1.proj.weight\", \"ups.1.1.block1.proj.bias\", \"ups.1.1.block1.norm.weight\", \"ups.1.1.block1.norm.bias\", \"ups.1.1.block2.proj.weight\", \"ups.1.1.block2.proj.bias\", \"ups.1.1.block2.norm.weight\", \"ups.1.1.block2.norm.bias\", \"ups.1.1.res_conv.weight\", \"ups.1.1.res_conv.bias\", \"ups.1.2.mem_kv\", \"ups.1.2.norm.g\", \"ups.1.2.to_qkv.weight\", \"ups.1.2.to_out.0.weight\", \"ups.1.2.to_out.0.bias\", \"ups.1.2.to_out.1.g\", \"ups.1.3.1.weight\", \"ups.1.3.1.bias\", \"ups.2.0.mlp.1.weight\", \"ups.2.0.mlp.1.bias\", \"ups.2.0.block1.proj.weight\", \"ups.2.0.block1.proj.bias\", \"ups.2.0.block1.norm.weight\", \"ups.2.0.block1.norm.bias\", \"ups.2.0.block2.proj.weight\", \"ups.2.0.block2.proj.bias\", \"ups.2.0.block2.norm.weight\", \"ups.2.0.block2.norm.bias\", \"ups.2.0.res_conv.weight\", \"ups.2.0.res_conv.bias\", \"ups.2.1.mlp.1.weight\", \"ups.2.1.mlp.1.bias\", \"ups.2.1.block1.proj.weight\", \"ups.2.1.block1.proj.bias\", \"ups.2.1.block1.norm.weight\", \"ups.2.1.block1.norm.bias\", \"ups.2.1.block2.proj.weight\", \"ups.2.1.block2.proj.bias\", \"ups.2.1.block2.norm.weight\", \"ups.2.1.block2.norm.bias\", \"ups.2.1.res_conv.weight\", \"ups.2.1.res_conv.bias\", \"ups.2.2.mem_kv\", \"ups.2.2.norm.g\", \"ups.2.2.to_qkv.weight\", \"ups.2.2.to_out.0.weight\", \"ups.2.2.to_out.0.bias\", \"ups.2.2.to_out.1.g\", \"ups.2.3.1.weight\", \"ups.2.3.1.bias\", \"ups.3.0.mlp.1.weight\", \"ups.3.0.mlp.1.bias\", \"ups.3.0.block1.proj.weight\", \"ups.3.0.block1.proj.bias\", \"ups.3.0.block1.norm.weight\", \"ups.3.0.block1.norm.bias\", \"ups.3.0.block2.proj.weight\", \"ups.3.0.block2.proj.bias\", \"ups.3.0.block2.norm.weight\", \"ups.3.0.block2.norm.bias\", \"ups.3.0.res_conv.weight\", \"ups.3.0.res_conv.bias\", \"ups.3.1.mlp.1.weight\", \"ups.3.1.mlp.1.bias\", \"ups.3.1.block1.proj.weight\", \"ups.3.1.block1.proj.bias\", \"ups.3.1.block1.norm.weight\", \"ups.3.1.block1.norm.bias\", \"ups.3.1.block2.proj.weight\", \"ups.3.1.block2.proj.bias\", \"ups.3.1.block2.norm.weight\", \"ups.3.1.block2.norm.bias\", \"ups.3.1.res_conv.weight\", \"ups.3.1.res_conv.bias\", \"ups.3.2.mem_kv\", \"ups.3.2.norm.g\", \"ups.3.2.to_qkv.weight\", \"ups.3.2.to_out.0.weight\", \"ups.3.2.to_out.0.bias\", \"ups.3.2.to_out.1.g\", \"ups.3.3.weight\", \"ups.3.3.bias\", \"mid_block1.mlp.1.weight\", \"mid_block1.mlp.1.bias\", \"mid_block1.block1.proj.weight\", \"mid_block1.block1.proj.bias\", \"mid_block1.block1.norm.weight\", \"mid_block1.block1.norm.bias\", \"mid_block1.block2.proj.weight\", \"mid_block1.block2.proj.bias\", \"mid_block1.block2.norm.weight\", \"mid_block1.block2.norm.bias\", \"mid_attn.mem_kv\", \"mid_attn.norm.g\", \"mid_attn.to_qkv.weight\", \"mid_attn.to_out.weight\", \"mid_attn.to_out.bias\", \"mid_block2.mlp.1.weight\", \"mid_block2.mlp.1.bias\", \"mid_block2.block1.proj.weight\", \"mid_block2.block1.proj.bias\", \"mid_block2.block1.norm.weight\", \"mid_block2.block1.norm.bias\", \"mid_block2.block2.proj.weight\", \"mid_block2.block2.proj.bias\", \"mid_block2.block2.norm.weight\", \"mid_block2.block2.norm.bias\", \"final_res_block.mlp.1.weight\", \"final_res_block.mlp.1.bias\", \"final_res_block.block1.proj.weight\", \"final_res_block.block1.proj.bias\", \"final_res_block.block1.norm.weight\", \"final_res_block.block1.norm.bias\", \"final_res_block.block2.proj.weight\", \"final_res_block.block2.proj.bias\", \"final_res_block.block2.norm.weight\", \"final_res_block.block2.norm.bias\", \"final_res_block.res_conv.weight\", \"final_res_block.res_conv.bias\", \"final_conv.weight\", \"final_conv.bias\". \n\tUnexpected key(s) in state_dict: \"betas\", \"alphas_cumprod\", \"alphas_cumprod_prev\", \"sqrt_alphas_cumprod\", \"sqrt_one_minus_alphas_cumprod\", \"log_one_minus_alphas_cumprod\", \"sqrt_recip_alphas_cumprod\", \"sqrt_recipm1_alphas_cumprod\", \"posterior_variance\", \"posterior_log_variance_clipped\", \"posterior_mean_coef1\", \"posterior_mean_coef2\", \"loss_weight\", \"model.init_conv.weight\", \"model.init_conv.bias\", \"model.time_mlp.1.weight\", \"model.time_mlp.1.bias\", \"model.time_mlp.3.weight\", \"model.time_mlp.3.bias\", \"model.downs.0.0.mlp.1.weight\", \"model.downs.0.0.mlp.1.bias\", \"model.downs.0.0.block1.proj.weight\", \"model.downs.0.0.block1.proj.bias\", \"model.downs.0.0.block1.norm.weight\", \"model.downs.0.0.block1.norm.bias\", \"model.downs.0.0.block2.proj.weight\", \"model.downs.0.0.block2.proj.bias\", \"model.downs.0.0.block2.norm.weight\", \"model.downs.0.0.block2.norm.bias\", \"model.downs.0.1.mlp.1.weight\", \"model.downs.0.1.mlp.1.bias\", \"model.downs.0.1.block1.proj.weight\", \"model.downs.0.1.block1.proj.bias\", \"model.downs.0.1.block1.norm.weight\", \"model.downs.0.1.block1.norm.bias\", \"model.downs.0.1.block2.proj.weight\", \"model.downs.0.1.block2.proj.bias\", \"model.downs.0.1.block2.norm.weight\", \"model.downs.0.1.block2.norm.bias\", \"model.downs.0.2.mem_kv\", \"model.downs.0.2.norm.g\", \"model.downs.0.2.to_qkv.weight\", \"model.downs.0.2.to_out.0.weight\", \"model.downs.0.2.to_out.0.bias\", \"model.downs.0.2.to_out.1.g\", \"model.downs.0.3.1.weight\", \"model.downs.0.3.1.bias\", \"model.downs.1.0.mlp.1.weight\", \"model.downs.1.0.mlp.1.bias\", \"model.downs.1.0.block1.proj.weight\", \"model.downs.1.0.block1.proj.bias\", \"model.downs.1.0.block1.norm.weight\", \"model.downs.1.0.block1.norm.bias\", \"model.downs.1.0.block2.proj.weight\", \"model.downs.1.0.block2.proj.bias\", \"model.downs.1.0.block2.norm.weight\", \"model.downs.1.0.block2.norm.bias\", \"model.downs.1.1.mlp.1.weight\", \"model.downs.1.1.mlp.1.bias\", \"model.downs.1.1.block1.proj.weight\", \"model.downs.1.1.block1.proj.bias\", \"model.downs.1.1.block1.norm.weight\", \"model.downs.1.1.block1.norm.bias\", \"model.downs.1.1.block2.proj.weight\", \"model.downs.1.1.block2.proj.bias\", \"model.downs.1.1.block2.norm.weight\", \"model.downs.1.1.block2.norm.bias\", \"model.downs.1.2.mem_kv\", \"model.downs.1.2.norm.g\", \"model.downs.1.2.to_qkv.weight\", \"model.downs.1.2.to_out.0.weight\", \"model.downs.1.2.to_out.0.bias\", \"model.downs.1.2.to_out.1.g\", \"model.downs.1.3.1.weight\", \"model.downs.1.3.1.bias\", \"model.downs.2.0.mlp.1.weight\", \"model.downs.2.0.mlp.1.bias\", \"model.downs.2.0.block1.proj.weight\", \"model.downs.2.0.block1.proj.bias\", \"model.downs.2.0.block1.norm.weight\", \"model.downs.2.0.block1.norm.bias\", \"model.downs.2.0.block2.proj.weight\", \"model.downs.2.0.block2.proj.bias\", \"model.downs.2.0.block2.norm.weight\", \"model.downs.2.0.block2.norm.bias\", \"model.downs.2.1.mlp.1.weight\", \"model.downs.2.1.mlp.1.bias\", \"model.downs.2.1.block1.proj.weight\", \"model.downs.2.1.block1.proj.bias\", \"model.downs.2.1.block1.norm.weight\", \"model.downs.2.1.block1.norm.bias\", \"model.downs.2.1.block2.proj.weight\", \"model.downs.2.1.block2.proj.bias\", \"model.downs.2.1.block2.norm.weight\", \"model.downs.2.1.block2.norm.bias\", \"model.downs.2.2.mem_kv\", \"model.downs.2.2.norm.g\", \"model.downs.2.2.to_qkv.weight\", \"model.downs.2.2.to_out.0.weight\", \"model.downs.2.2.to_out.0.bias\", \"model.downs.2.2.to_out.1.g\", \"model.downs.2.3.1.weight\", \"model.downs.2.3.1.bias\", \"model.downs.3.0.mlp.1.weight\", \"model.downs.3.0.mlp.1.bias\", \"model.downs.3.0.block1.proj.weight\", \"model.downs.3.0.block1.proj.bias\", \"model.downs.3.0.block1.norm.weight\", \"model.downs.3.0.block1.norm.bias\", \"model.downs.3.0.block2.proj.weight\", \"model.downs.3.0.block2.proj.bias\", \"model.downs.3.0.block2.norm.weight\", \"model.downs.3.0.block2.norm.bias\", \"model.downs.3.1.mlp.1.weight\", \"model.downs.3.1.mlp.1.bias\", \"model.downs.3.1.block1.proj.weight\", \"model.downs.3.1.block1.proj.bias\", \"model.downs.3.1.block1.norm.weight\", \"model.downs.3.1.block1.norm.bias\", \"model.downs.3.1.block2.proj.weight\", \"model.downs.3.1.block2.proj.bias\", \"model.downs.3.1.block2.norm.weight\", \"model.downs.3.1.block2.norm.bias\", \"model.downs.3.2.mem_kv\", \"model.downs.3.2.norm.g\", \"model.downs.3.2.to_qkv.weight\", \"model.downs.3.2.to_out.weight\", \"model.downs.3.2.to_out.bias\", \"model.downs.3.3.weight\", \"model.downs.3.3.bias\", \"model.ups.0.0.mlp.1.weight\", \"model.ups.0.0.mlp.1.bias\", \"model.ups.0.0.block1.proj.weight\", \"model.ups.0.0.block1.proj.bias\", \"model.ups.0.0.block1.norm.weight\", \"model.ups.0.0.block1.norm.bias\", \"model.ups.0.0.block2.proj.weight\", \"model.ups.0.0.block2.proj.bias\", \"model.ups.0.0.block2.norm.weight\", \"model.ups.0.0.block2.norm.bias\", \"model.ups.0.0.res_conv.weight\", \"model.ups.0.0.res_conv.bias\", \"model.ups.0.1.mlp.1.weight\", \"model.ups.0.1.mlp.1.bias\", \"model.ups.0.1.block1.proj.weight\", \"model.ups.0.1.block1.proj.bias\", \"model.ups.0.1.block1.norm.weight\", \"model.ups.0.1.block1.norm.bias\", \"model.ups.0.1.block2.proj.weight\", \"model.ups.0.1.block2.proj.bias\", \"model.ups.0.1.block2.norm.weight\", \"model.ups.0.1.block2.norm.bias\", \"model.ups.0.1.res_conv.weight\", \"model.ups.0.1.res_conv.bias\", \"model.ups.0.2.mem_kv\", \"model.ups.0.2.norm.g\", \"model.ups.0.2.to_qkv.weight\", \"model.ups.0.2.to_out.weight\", \"model.ups.0.2.to_out.bias\", \"model.ups.0.3.1.weight\", \"model.ups.0.3.1.bias\", \"model.ups.1.0.mlp.1.weight\", \"model.ups.1.0.mlp.1.bias\", \"model.ups.1.0.block1.proj.weight\", \"model.ups.1.0.block1.proj.bias\", \"model.ups.1.0.block1.norm.weight\", \"model.ups.1.0.block1.norm.bias\", \"model.ups.1.0.block2.proj.weight\", \"model.ups.1.0.block2.proj.bias\", \"model.ups.1.0.block2.norm.weight\", \"model.ups.1.0.block2.norm.bias\", \"model.ups.1.0.res_conv.weight\", \"model.ups.1.0.res_conv.bias\", \"model.ups.1.1.mlp.1.weight\", \"model.ups.1.1.mlp.1.bias\", \"model.ups.1.1.block1.proj.weight\", \"model.ups.1.1.block1.proj.bias\", \"model.ups.1.1.block1.norm.weight\", \"model.ups.1.1.block1.norm.bias\", \"model.ups.1.1.block2.proj.weight\", \"model.ups.1.1.block2.proj.bias\", \"model.ups.1.1.block2.norm.weight\", \"model.ups.1.1.block2.norm.bias\", \"model.ups.1.1.res_conv.weight\", \"model.ups.1.1.res_conv.bias\", \"model.ups.1.2.mem_kv\", \"model.ups.1.2.norm.g\", \"model.ups.1.2.to_qkv.weight\", \"model.ups.1.2.to_out.0.weight\", \"model.ups.1.2.to_out.0.bias\", \"model.ups.1.2.to_out.1.g\", \"model.ups.1.3.1.weight\", \"model.ups.1.3.1.bias\", \"model.ups.2.0.mlp.1.weight\", \"model.ups.2.0.mlp.1.bias\", \"model.ups.2.0.block1.proj.weight\", \"model.ups.2.0.block1.proj.bias\", \"model.ups.2.0.block1.norm.weight\", \"model.ups.2.0.block1.norm.bias\", \"model.ups.2.0.block2.proj.weight\", \"model.ups.2.0.block2.proj.bias\", \"model.ups.2.0.block2.norm.weight\", \"model.ups.2.0.block2.norm.bias\", \"model.ups.2.0.res_conv.weight\", \"model.ups.2.0.res_conv.bias\", \"model.ups.2.1.mlp.1.weight\", \"model.ups.2.1.mlp.1.bias\", \"model.ups.2.1.block1.proj.weight\", \"model.ups.2.1.block1.proj.bias\", \"model.ups.2.1.block1.norm.weight\", \"model.ups.2.1.block1.norm.bias\", \"model.ups.2.1.block2.proj.weight\", \"model.ups.2.1.block2.proj.bias\", \"model.ups.2.1.block2.norm.weight\", \"model.ups.2.1.block2.norm.bias\", \"model.ups.2.1.res_conv.weight\", \"model.ups.2.1.res_conv.bias\", \"model.ups.2.2.mem_kv\", \"model.ups.2.2.norm.g\", \"model.ups.2.2.to_qkv.weight\", \"model.ups.2.2.to_out.0.weight\", \"model.ups.2.2.to_out.0.bias\", \"model.ups.2.2.to_out.1.g\", \"model.ups.2.3.1.weight\", \"model.ups.2.3.1.bias\", \"model.ups.3.0.mlp.1.weight\", \"model.ups.3.0.mlp.1.bias\", \"model.ups.3.0.block1.proj.weight\", \"model.ups.3.0.block1.proj.bias\", \"model.ups.3.0.block1.norm.weight\", \"model.ups.3.0.block1.norm.bias\", \"model.ups.3.0.block2.proj.weight\", \"model.ups.3.0.block2.proj.bias\", \"model.ups.3.0.block2.norm.weight\", \"model.ups.3.0.block2.norm.bias\", \"model.ups.3.0.res_conv.weight\", \"model.ups.3.0.res_conv.bias\", \"model.ups.3.1.mlp.1.weight\", \"model.ups.3.1.mlp.1.bias\", \"model.ups.3.1.block1.proj.weight\", \"model.ups.3.1.block1.proj.bias\", \"model.ups.3.1.block1.norm.weight\", \"model.ups.3.1.block1.norm.bias\", \"model.ups.3.1.block2.proj.weight\", \"model.ups.3.1.block2.proj.bias\", \"model.ups.3.1.block2.norm.weight\", \"model.ups.3.1.block2.norm.bias\", \"model.ups.3.1.res_conv.weight\", \"model.ups.3.1.res_conv.bias\", \"model.ups.3.2.mem_kv\", \"model.ups.3.2.norm.g\", \"model.ups.3.2.to_qkv.weight\", \"model.ups.3.2.to_out.0.weight\", \"model.ups.3.2.to_out.0.bias\", \"model.ups.3.2.to_out.1.g\", \"model.ups.3.3.weight\", \"model.ups.3.3.bias\", \"model.mid_block1.mlp.1.weight\", \"model.mid_block1.mlp.1.bias\", \"model.mid_block1.block1.proj.weight\", \"model.mid_block1.block1.proj.bias\", \"model.mid_block1.block1.norm.weight\", \"model.mid_block1.block1.norm.bias\", \"model.mid_block1.block2.proj.weight\", \"model.mid_block1.block2.proj.bias\", \"model.mid_block1.block2.norm.weight\", \"model.mid_block1.block2.norm.bias\", \"model.mid_attn.mem_kv\", \"model.mid_attn.norm.g\", \"model.mid_attn.to_qkv.weight\", \"model.mid_attn.to_out.weight\", \"model.mid_attn.to_out.bias\", \"model.mid_block2.mlp.1.weight\", \"model.mid_block2.mlp.1.bias\", \"model.mid_block2.block1.proj.weight\", \"model.mid_block2.block1.proj.bias\", \"model.mid_block2.block1.norm.weight\", \"model.mid_block2.block1.norm.bias\", \"model.mid_block2.block2.proj.weight\", \"model.mid_block2.block2.proj.bias\", \"model.mid_block2.block2.norm.weight\", \"model.mid_block2.block2.norm.bias\", \"model.final_res_block.mlp.1.weight\", \"model.final_res_block.mlp.1.bias\", \"model.final_res_block.block1.proj.weight\", \"model.final_res_block.block1.proj.bias\", \"model.final_res_block.block1.norm.weight\", \"model.final_res_block.block1.norm.bias\", \"model.final_res_block.block2.proj.weight\", \"model.final_res_block.block2.proj.bias\", \"model.final_res_block.block2.norm.weight\", \"model.final_res_block.block2.norm.bias\", \"model.final_res_block.res_conv.weight\", \"model.final_res_block.res_conv.bias\", \"model.final_conv.weight\", \"model.final_conv.bias\". "
     ]
    }
   ],
   "source": [
    "model.load_state_dict(torch.load(\"./ddpm-stl-96/denoising_lib/model-45.pt\")['model'])"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.9.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
