{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "#!/usr/bin/env python3\n",
    "\n",
    "import accelerate\n",
    "import torch\n",
    "from torch.utils import data\n",
    "from torchvision import transforms\n",
    "\n",
    "import k_diffusion as K\n",
    "from train_openai import OpenAIDenoiser\n",
    "\n",
    "\n",
    "def to_show(x: torch.Tensor, ref=None):\n",
    "    x = x[0].permute(1, 2, 0)\n",
    "    if ref is None:\n",
    "        x_min, x_max = x.min(), x.max()\n",
    "    else:\n",
    "        x_min, x_max = ref.min(), ref.max()\n",
    "    x = (x - x_min) / (x_max - x_min)\n",
    "    return x.detach().cpu().numpy()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "class Args:\n",
    "    config = \"configs/test_ffhq_dwt.json\"\n",
    "    checkpoint = \"../../model_zoo/ffhq_dwt.ckpt\"\n",
    "\n",
    "args = Args()\n",
    "\n",
    "config = K.config.load_config(open(args.config))\n",
    "model_config = config['model']\n",
    "dataset_config = config['dataset']\n",
    "size = model_config['input_size']\n",
    "\n",
    "accelerator = accelerate.Accelerator()\n",
    "device = accelerator.device\n",
    "print(f'Using device: {device}', flush=True)\n",
    "\n",
    "model = OpenAIDenoiser.load_from_checkpoint(args.checkpoint, map_location='cpu')\n",
    "print(model.model_config)\n",
    "model = model.model\n",
    "\n",
    "# test data\n",
    "tf = transforms.Compose([\n",
    "    transforms.ToTensor(),\n",
    "    lambda x: x * 2 - 1\n",
    "])\n",
    "test_set = K.utils.FolderOfImages(dataset_config['location'], transform=tf)\n",
    "test_dl = data.DataLoader(test_set, batch_size=1)\n",
    "\n",
    "test_dl, model = accelerator.prepare(test_dl, model)\n",
    "test_dl = iter(test_dl)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import matplotlib.pyplot as plt\n",
    "\n",
    "x0, = next(test_dl)\n",
    "plt.imshow(to_show(x0))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "sigma_min = model_config['sigma_min']\n",
    "sigma_max = model_config['sigma_max']\n",
    "sigmas = K.sampling.get_sigmas_karras(50, sigma_min, sigma_max, rho=7., device=device)\n",
    "x0 = x0.to(device)\n",
    "\n",
    "sigma = torch.Tensor([1]).to(device)\n",
    "x = x0 + torch.randn_like(x0) * sigma\n",
    "x = x.requires_grad_()\n",
    "\n",
    "model_output, logvar, logvar_ot = model(x, sigma, return_variance=True)\n",
    "c_out, c_in = model.get_scalings(sigma)\n",
    "ot = model.ortho_tf\n",
    "\n",
    "x0_mean = model_output * c_out + x\n",
    "\n",
    "error = (x0_mean - x0).pow(2).mean(dim=1, keepdim=True)\n",
    "error_pred = (logvar.exp() * c_out.pow(2)).mean(dim=1, keepdim=True)\n",
    "\n",
    "error_ot = (ot(x0_mean) - ot(x0)).pow(2).mean(dim=1, keepdim=True)\n",
    "error_ot_pred = (logvar_ot.exp() * c_out.pow(2)).mean(dim=1, keepdim=True)\n",
    "\n",
    "print(error.mean().item(), error.var().item())\n",
    "print(error_pred.mean().item(), error_pred.var().item())\n",
    "\n",
    "print(error_ot.mean().item(), error_ot.var().item())\n",
    "print(error_ot_pred.mean().item(), error_ot_pred.var().item())\n",
    "\n",
    "\n",
    "fig, axes = plt.subplots(2, 4, figsize=(10, 5.5))\n",
    "for ax in axes.flatten():\n",
    "    ax.axis('off')\n",
    "plt.tight_layout()\n",
    "\n",
    "axes[0, 0].imshow(to_show(x), vmin=0, vmax=1)\n",
    "axes[0, 0].set_title(rf\"$x_t$\")\n",
    "\n",
    "axes[0, 1].imshow(to_show(x0))\n",
    "axes[0, 1].set_title(rf\"$x_0$\")\n",
    "\n",
    "axes[1, 1].imshow(to_show(x0_mean))\n",
    "axes[1, 1].set_title(rf\"Posterior Mean\")\n",
    "\n",
    "axes[0, 2].imshow(to_show(error.log(), ref=error_pred.log()), vmin=0, vmax=1)\n",
    "axes[0, 2].set_title(rf\"Spatial Square Error\")\n",
    "\n",
    "axes[1, 2].imshow(to_show(error_pred.log()), vmin=0, vmax=1)\n",
    "axes[1, 2].set_title(rf\"Spatial Variance\")\n",
    "\n",
    "axes[0, 3].imshow(to_show(error_ot.log(), ref=error_ot_pred.log()), vmin=0, vmax=1)\n",
    "axes[0, 3].set_title(rf\"DWT Square Error\")\n",
    "\n",
    "axes[1, 3].imshow(to_show(error_ot_pred.log()), vmin=0, vmax=1)\n",
    "axes[1, 3].set_title(rf\"DWT Variance\")\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "base",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
