{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "ff9630a3",
   "metadata": {},
   "source": [
    "# DFN (modular) \u2014 pluggable solvers + integer-scaling for LEMON\n",
    "\n",
    "This notebook rewrites the **DFN-Gurobi** idea in the **concise, modular style** of `DFN.ipynb`:\n",
    "\n",
    "- **Graph = data** (`DigraphSpec`) so you can add new graph generators later.\n",
    "- **Solver choice**: `solver=\"gurobi\"` or `solver=\"lemon\"`.\n",
    "- **Integer-only solvers** (LEMON) receive **integers** by scaling to a fixed decimal precision `10^-p`.\n",
    "- **Objective/gradients are scaled back** so learning behaves as if everything stayed in the original units.\n",
    "- Uses **softplus** for nonnegative costs/caps.\n",
    "\n",
    "At the bottom there are **minimal smoke tests** (forward + backward) that run for any solvers available in your environment."
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d934e4f7",
   "metadata": {},
   "source": [
    "## Imports"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "01bb42e5",
   "metadata": {},
   "outputs": [],
   "source": [
    "from __future__ import annotations\n",
    "\n",
    "import sys\n",
    "from pathlib import Path\n",
    "from dataclasses import dataclass\n",
    "\n",
    "import numpy as np\n",
    "import cppimport\n",
    "\n",
    "import torch\n",
    "import torch.nn as nn\n",
    "import torch.nn.functional as F\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "c3da0367",
   "metadata": {},
   "source": [
    "## (Optional) LEMON binding\n",
    "\n",
    "If you have the `lemon_mcf` cppimport module in your repo (same as your previous notebooks), this will compile/import it.\n",
    "If not, you can still use `solver=\"gurobi\"`."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ea024152",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Optional LEMON binding. If this fails, you can ignore it and use solver=\"gurobi\".\n",
    "try:\n",
    "    # Put the parent of the working directory on sys.path before importing lemon_mcf.\n",
    "    repo = Path().resolve().parent\n",
    "    if str(repo) not in sys.path:  # re-running this cell must not stack duplicate entries\n",
    "        sys.path.insert(0, str(repo))\n",
    "    lemon_mcf = cppimport.imp(\"lemon_mcf\")\n",
    "    HAVE_LEMON = True\n",
    "except Exception as e:\n",
    "    # Best-effort import: continue without LEMON, but report why it is unavailable.\n",
    "    lemon_mcf = None\n",
    "    HAVE_LEMON = False\n",
    "    print(f\"LEMON binding unavailable ({type(e).__name__}: {e}); use solver='gurobi' instead.\")\n",
    "\n",
    "HAVE_LEMON\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "ff2f4e31",
   "metadata": {},
   "source": [
    "## Fractional precision \u2192 integerization (STE)\n",
    "\n",
    "We only do this to satisfy **integer-only solvers**.\n",
    "For a chosen `precision_digits = p`:\n",
    "\n",
    "- `scale = 10^p`, `step = 1/scale`\n",
    "- we pass solver inputs as integers: `round(x * scale)`\n",
    "- both costs and flow quantities (capacities, balances) are multiplied by `scale`, so the returned objective is multiplied by `1/scale^2` to bring it back to the original units."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "bff71858",
   "metadata": {},
   "outputs": [],
   "source": [
    "class _RoundSTE(torch.autograd.Function):\n",
    "    \"\"\"Round to the nearest integer in forward; pass gradients through unchanged in backward.\"\"\"\n",
    "\n",
    "    @staticmethod\n",
    "    def forward(ctx, x: torch.Tensor) -> torch.Tensor:  # noqa\n",
    "        # Nothing is stored on ctx because backward does not look at the input.\n",
    "        return x.round()\n",
    "\n",
    "    @staticmethod\n",
    "    def backward(ctx, g: torch.Tensor) -> torch.Tensor:  # noqa\n",
    "        # Straight-through estimator: the incoming gradient is returned as-is.\n",
    "        return g\n",
    "\n",
    "\n",
    "def round_ste(x: torch.Tensor) -> torch.Tensor:\n",
    "    \"\"\"Run `x` through `_RoundSTE` and return the resulting tensor.\"\"\"\n",
    "    rounded = _RoundSTE.apply(x)\n",
    "    return rounded\n",
    "\n",
    "\n",
    "def to_int_scaled(x: torch.Tensor, scale: float) -> torch.Tensor:\n",
    "    \"\"\"Compute round(x * scale) via `round_ste`.\n",
    "\n",
    "    The rounding step is delegated to `round_ste`, so the backward pass only sees the\n",
    "    multiplication by `scale` (straight-through rounding).\n",
    "    \"\"\"\n",
    "    scaled = x * scale\n",
    "    return round_ste(scaled)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "e380e9d3",
   "metadata": {},
   "source": [
    "## Graph spec + a multilayer generator\n",
    "\n",
    "To add new graphs later, just write another function that returns a `DigraphSpec`."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d5a903f1",
   "metadata": {},
   "outputs": [],
   "source": [
    "@dataclass(frozen=True)\n",
    "class DigraphSpec:\n",
    "    \"\"\"Frozen record describing a directed graph together with node/arc roles.\n",
    "\n",
    "    Arc k runs from src[k] to dst[k]. The first m_learn arcs are the learnable ones;\n",
    "    the remaining arcs carry the fixed_cost / fixed_cap values, in the same order.\n",
    "    Graph generators return one of these so that consumers do not depend on how the\n",
    "    graph was built.\n",
    "    \"\"\"\n",
    "    n: int                     # number of nodes\n",
    "    src: torch.Tensor          # (m,) int64\n",
    "    dst: torch.Tensor          # (m,) int64\n",
    "    m_learn: int               # first m_learn arcs are learnable\n",
    "    fixed_cost: torch.Tensor   # (m-m_learn,) float\n",
    "    fixed_cap: torch.Tensor    # (m-m_learn,) float\n",
    "    b_nodes: torch.Tensor      # nodes using learnable b entries\n",
    "    A_nodes: torch.Tensor      # nodes using (A @ x) entries\n",
    "    slack: int                 # node index forced to -sum(other balances)\n",
    "\n",
    "\n",
    "def make_multilayer(layer_sizes, big_cost=1e6, big_cap=1e6, var_frac=0.5) -> DigraphSpec:\n",
    "    \"\"\"Layered graph (like DFN-Gurobi), returned as a generic DigraphSpec.\n",
    "\n",
    "    Nodes are numbered layer by layer (first layer first), each layer getting a\n",
    "    contiguous index range.\n",
    "\n",
    "    - Learnable arcs: fully connect Li -> L(i+1); these come first in src/dst\n",
    "    - Fixed feasibility arcs: fully connect L1 <-> LK with big cost/cap; these come last\n",
    "    - Nonzero balances only on boundary layers, with the final node as slack\n",
    "\n",
    "    var_frac controls boundary split into (A@x) vs (learnable b):\n",
    "      A_nodes = first ~var_frac; b_nodes = rest (excluding slack).\n",
    "\n",
    "    Args:\n",
    "        layer_sizes: non-empty iterable of positive layer sizes (each converted with int()).\n",
    "        big_cost: cost given to every fixed arc.\n",
    "        big_cap: capacity given to every fixed arc.\n",
    "        var_frac: fraction of each boundary layer assigned to A_nodes; the split index is\n",
    "            round(len * var_frac) clamped to [0, len].\n",
    "\n",
    "    Returns:\n",
    "        DigraphSpec with int64 index tensors and float32 fixed_cost / fixed_cap.\n",
    "\n",
    "    Raises:\n",
    "        ValueError: if layer_sizes is empty or any size is not positive.\n",
    "    \"\"\"\n",
    "    sizes = [int(s) for s in layer_sizes]\n",
    "    if not sizes:\n",
    "        # Without this guard the boundary-layer lookup below fails with an opaque IndexError.\n",
    "        raise ValueError(\"layer_sizes must contain at least one layer\")\n",
    "    if any(s <= 0 for s in sizes):\n",
    "        raise ValueError(\"all layer sizes must be positive\")\n",
    "\n",
    "    # offs[i] is the index of the first node of layer i\n",
    "    offs = np.cumsum([0] + sizes[:-1]).astype(np.int64)\n",
    "    layers = [np.arange(offs[i], offs[i] + sizes[i], dtype=np.int64) for i in range(len(sizes))]\n",
    "    n = int(sum(sizes))\n",
    "\n",
    "    # learnable arcs: Li -> Li+1 (full bipartite)\n",
    "    srcL, dstL = [], []\n",
    "    for U, V in zip(layers[:-1], layers[1:]):\n",
    "        srcL.append(np.repeat(U, len(V)))\n",
    "        dstL.append(np.tile(V, len(U)))\n",
    "    srcL = np.concatenate(srcL) if srcL else np.zeros((0,), np.int64)\n",
    "    dstL = np.concatenate(dstL) if dstL else np.zeros((0,), np.int64)\n",
    "    m_learn = int(srcL.size)\n",
    "\n",
    "    # fixed arcs: L1 <-> LK (both directions)\n",
    "    L1, LK = layers[0], layers[-1]\n",
    "    srcF = np.concatenate([np.repeat(L1, len(LK)), np.repeat(LK, len(L1))])\n",
    "    dstF = np.concatenate([np.tile(LK, len(L1)),   np.tile(L1, len(LK))])\n",
    "\n",
    "    src = np.concatenate([srcL, srcF]).astype(np.int64, copy=False)\n",
    "    dst = np.concatenate([dstL, dstF]).astype(np.int64, copy=False)\n",
    "\n",
    "    # the last node of the last layer is the slack; it is excluded from A_nodes / b_nodes\n",
    "    slack = int(LK[-1])\n",
    "    LK_wo = LK[LK != slack]\n",
    "\n",
    "    def split(nodes):\n",
    "        # first k nodes -> A_nodes, remainder -> b_nodes\n",
    "        k = int(round(float(len(nodes)) * float(var_frac)))\n",
    "        k = max(0, min(k, len(nodes)))\n",
    "        return nodes[:k], nodes[k:]\n",
    "\n",
    "    A1, B1 = split(L1)\n",
    "    Ak, Bk = split(LK_wo)\n",
    "\n",
    "    A_nodes = np.concatenate([A1, Ak]).astype(np.int64)\n",
    "    b_nodes = np.concatenate([B1, Bk]).astype(np.int64)\n",
    "\n",
    "    fixed_cost = torch.full((int(srcF.size),), float(big_cost), dtype=torch.float32)\n",
    "    fixed_cap  = torch.full((int(srcF.size),), float(big_cap),  dtype=torch.float32)\n",
    "\n",
    "    return DigraphSpec(\n",
    "        n=n,\n",
    "        src=torch.from_numpy(src).long(),\n",
    "        dst=torch.from_numpy(dst).long(),\n",
    "        m_learn=m_learn,\n",
    "        fixed_cost=fixed_cost,\n",
    "        fixed_cap=fixed_cap,\n",
    "        b_nodes=torch.from_numpy(b_nodes).long(),\n",
    "        A_nodes=torch.from_numpy(A_nodes).long(),\n",
    "        slack=slack,\n",
    "    )\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f9aa077a",
   "metadata": {},
   "source": [
    "## Differentiable min-cost-flow value (LEMON + Gurobi)\n",
    "\n",
    "Both backprops use the same rule you were using:\n",
    "- `d/dcost = flow`\n",
    "- `d/dcap = reduced_cost` when the arc is tight, else `0`\n",
    "- `d/db = mean(potential) - potential`"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ddba969f",
   "metadata": {},
   "outputs": [],
   "source": [
    "class _MCFValueLEMON(torch.autograd.Function):\n",
    "    \"\"\"Min-cost-flow objective value obtained from the `lemon_mcf` binding.\n",
    "\n",
    "    forward hands the arc lists, costs, capacities and node balances to\n",
    "    `lemon_mcf.solve_mcf` and returns its `total_cost` as a 0-dim tensor created with\n",
    "    `cost.new_tensor`. A returned status other than 1 is treated as failure.\n",
    "\n",
    "    backward uses:\n",
    "    - d/dcost = flow\n",
    "    - d/dcap  = reduced cost where |flow - cap| <= 1e-9, else 0\n",
    "    - d/db    = mean(potential) - potential\n",
    "    \"\"\"\n",
    "\n",
    "    @staticmethod\n",
    "    def forward(ctx, n_nodes, src, dst, cost, cap, b):\n",
    "        if lemon_mcf is None:\n",
    "            raise RuntimeError(\"LEMON solver requested but lemon_mcf is not available.\")\n",
    "\n",
    "        n = int(n_nodes)\n",
    "        src, dst = src.long(), dst.long()\n",
    "        m = int(src.numel())\n",
    "        sizes_ok = dst.numel() == m and cost.numel() == m and cap.numel() == m and b.numel() == n\n",
    "        if not sizes_ok:\n",
    "            raise ValueError(\"bad shapes\")\n",
    "\n",
    "        def as_numpy(t, dtype):\n",
    "            # detached CPU copy of the tensor as a numpy array of the requested dtype\n",
    "            return t.detach().cpu().contiguous().numpy().astype(dtype, copy=False)\n",
    "\n",
    "        src_np = as_numpy(src, np.int64)\n",
    "        dst_np = as_numpy(dst, np.int64)\n",
    "        cost_np = as_numpy(cost, np.float64)\n",
    "        cap_np = as_numpy(cap, np.float64)\n",
    "        b_np = as_numpy(b, np.float64)\n",
    "\n",
    "        result = lemon_mcf.solve_mcf(n, src_np, dst_np, cost_np, cap_np, b_np)\n",
    "        status = result.get(\"status\", -1)\n",
    "        if int(status) != 1:\n",
    "            raise RuntimeError(f\"LEMON failed (status={status})\")\n",
    "\n",
    "        flow, pot, red = (\n",
    "            result[key].astype(np.float64, copy=False)\n",
    "            for key in (\"flow\", \"potential\", \"reduced_cost\")\n",
    "        )\n",
    "        # arcs whose flow sits at capacity; only these receive a capacity gradient\n",
    "        at = np.abs(flow - cap_np) <= 1e-9\n",
    "\n",
    "        # plain numpy arrays are kept on ctx and turned into tensors in backward\n",
    "        ctx.flow = flow\n",
    "        ctx.pot = pot\n",
    "        ctx.red = red\n",
    "        ctx.at = at\n",
    "        return cost.new_tensor(float(result[\"total_cost\"]))\n",
    "\n",
    "    @staticmethod\n",
    "    def backward(ctx, g):\n",
    "        def lift(arr, dtype):\n",
    "            # move a stored numpy array onto the device of the incoming gradient\n",
    "            return torch.as_tensor(arr, device=g.device, dtype=dtype)\n",
    "\n",
    "        flow = lift(ctx.flow, g.dtype)\n",
    "        pot = lift(ctx.pot, g.dtype)\n",
    "        red = lift(ctx.red, g.dtype)\n",
    "        tight = lift(ctx.at, torch.bool)\n",
    "\n",
    "        grad_cap = torch.where(tight, red, torch.zeros_like(red))\n",
    "        grad_b = pot.mean() - pot\n",
    "        # no gradients for n_nodes, src, dst\n",
    "        return None, None, None, flow * g, grad_cap * g, grad_b * g\n",
    "\n",
    "\n",
    "class _MCFValueGUROBI(torch.autograd.Function):\n",
    "    \"\"\"Min-cost-flow objective value solved as an LP with Gurobi.\n",
    "\n",
    "    forward builds one variable per arc (0 <= x_k <= cap_k, objective coefficient cost_k)\n",
    "    and one balance constraint per node (outflow - inflow == b_i), then returns the\n",
    "    optimal objective as a 0-dim tensor created with `cost.new_tensor`.\n",
    "\n",
    "    backward uses:\n",
    "    - d/dcost = flow\n",
    "    - d/dcap  = reduced cost where |flow - cap| <= 1e-9, else 0\n",
    "    - d/db    = mean(potential) - potential, with potential = -Pi of the balance constraints\n",
    "\n",
    "    Raises (forward):\n",
    "        ImportError: if gurobipy cannot be imported.\n",
    "        ValueError: if the argument sizes do not match the number of arcs / nodes.\n",
    "        RuntimeError: if the model does not reach GRB.OPTIMAL.\n",
    "    \"\"\"\n",
    "\n",
    "    @staticmethod\n",
    "    def forward(ctx, n_nodes, src, dst, cost, cap, b):\n",
    "        # imported lazily so the notebook still works when only LEMON is installed\n",
    "        try:\n",
    "            import gurobipy as gp\n",
    "            from gurobipy import GRB\n",
    "        except Exception as e:\n",
    "            raise ImportError(\"gurobipy is required (with a valid license).\") from e\n",
    "\n",
    "        n = int(n_nodes)\n",
    "        src = src.long(); dst = dst.long()\n",
    "        m = int(src.numel())\n",
    "        if dst.numel() != m or cost.numel() != m or cap.numel() != m or b.numel() != n:\n",
    "            raise ValueError(\"bad shapes\")\n",
    "\n",
    "        src_np  = src.detach().cpu().contiguous().numpy().astype(np.int64, copy=False)\n",
    "        dst_np  = dst.detach().cpu().contiguous().numpy().astype(np.int64, copy=False)\n",
    "        cost_np = cost.detach().cpu().contiguous().numpy().astype(np.float64, copy=False)\n",
    "        cap_np  = cap.detach().cpu().contiguous().numpy().astype(np.float64, copy=False)\n",
    "        b_np    = b.detach().cpu().contiguous().numpy().astype(np.float64, copy=False).copy()\n",
    "\n",
    "        # per-node lists of outgoing / incoming arc indices for the balance constraints\n",
    "        out_idx = [[] for _ in range(n)]\n",
    "        in_idx  = [[] for _ in range(n)]\n",
    "        for k in range(m):\n",
    "            out_idx[int(src_np[k])].append(k)\n",
    "            in_idx[int(dst_np[k])].append(k)\n",
    "\n",
    "        model = gp.Model()\n",
    "        model.Params.OutputFlag = 0\n",
    "\n",
    "        x = model.addVars(m, lb=0.0, ub=cap_np.tolist(), obj=cost_np.tolist(), name=\"x\")\n",
    "        bal = []\n",
    "        for i in range(n):\n",
    "            bal.append(model.addConstr(\n",
    "                gp.quicksum(x[k] for k in out_idx[i]) - gp.quicksum(x[k] for k in in_idx[i]) == float(b_np[i])\n",
    "            ))\n",
    "\n",
    "        model.optimize()\n",
    "        if model.Status != GRB.OPTIMAL:\n",
    "            raise RuntimeError(f\"Gurobi failed (status={model.Status})\")\n",
    "\n",
    "        flow = np.fromiter((x[k].X  for k in range(m)), dtype=np.float64, count=m)\n",
    "        red  = np.fromiter((x[k].RC for k in range(m)), dtype=np.float64, count=m)\n",
    "        # potentials are the negated duals of the balance constraints\n",
    "        pot  = -np.fromiter((bal[i].Pi for i in range(n)), dtype=np.float64, count=n)\n",
    "        # arcs whose flow sits at capacity; only these receive a capacity gradient\n",
    "        at   = np.abs(flow - cap_np) <= 1e-9\n",
    "\n",
    "        # plain numpy arrays are kept on ctx and turned into tensors in backward\n",
    "        ctx.flow, ctx.pot, ctx.red, ctx.at = flow, pot, red, at\n",
    "        return cost.new_tensor(float(model.ObjVal))\n",
    "\n",
    "    @staticmethod\n",
    "    def backward(ctx, g):\n",
    "        dev, dt = g.device, g.dtype\n",
    "        flow = torch.as_tensor(ctx.flow, device=dev, dtype=dt)\n",
    "        pot  = torch.as_tensor(ctx.pot,  device=dev, dtype=dt)\n",
    "        red  = torch.as_tensor(ctx.red,  device=dev, dtype=dt)\n",
    "        at   = torch.as_tensor(ctx.at,   device=dev, dtype=torch.bool)\n",
    "\n",
    "        grad_cost = flow\n",
    "        grad_cap  = torch.where(at, red, torch.zeros_like(red))\n",
    "        grad_b    = pot.mean() - pot\n",
    "        # no gradients for n_nodes, src, dst\n",
    "        return None, None, None, grad_cost * g, grad_cap * g, grad_b * g\n",
    "\n",
    "\n",
    "def min_cost_flow_value(n_nodes, src, dst, cost, cap, b, solver=\"lemon\"):\n",
    "    \"\"\"Dispatch to the autograd function matching `solver` and return its result.\n",
    "\n",
    "    The name is compared case-insensitively: \"lemon\"/\"lemon_mcf\" select the LEMON\n",
    "    backend, \"gurobi\"/\"grb\" select Gurobi. Any other name raises ValueError.\n",
    "    \"\"\"\n",
    "    key = str(solver).lower()\n",
    "    if key in (\"lemon\", \"lemon_mcf\"):\n",
    "        backend = _MCFValueLEMON\n",
    "    elif key in (\"gurobi\", \"grb\"):\n",
    "        backend = _MCFValueGUROBI\n",
    "    else:\n",
    "        raise ValueError(f\"unknown solver: {solver}\")\n",
    "    return backend.apply(n_nodes, src, dst, cost, cap, b)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "39f9493d",
   "metadata": {},
   "source": [
    "## DFN module (modular + solver choice)\n",
    "\n",
    "Key points vs your older `DFN.ipynb`:\n",
    "\n",
    "- We **do not quantize A itself** by default (only the solver inputs if integerization is enabled).\n",
    "- `integerize='auto'` means: use integers for LEMON, floats for Gurobi.\n",
    "- Optional **affine output** (`alpha * obj + beta`) like DFN-Gurobi."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "214a4fb4",
   "metadata": {},
   "outputs": [],
   "source": [
    "class DFN(nn.Module):\n",
    "    \"\"\"Learnable min-cost-flow layer with a selectable solver backend.\n",
    "\n",
    "    For an input vector x, node balances are assembled from `A @ x` (on A_nodes) and the\n",
    "    learnable vector `b` (on b_nodes); the slack node absorbs the negative sum so that the\n",
    "    balances add up to zero. Learnable arc costs/capacities are softplus(raw) + eps_pos,\n",
    "    followed by the graph's fixed arcs. The output is the min-cost-flow objective,\n",
    "    optionally passed through a learnable affine map alpha * obj + beta.\n",
    "\n",
    "    Args:\n",
    "        graph: DigraphSpec providing topology, fixed arc data and node roles.\n",
    "        input_dim: length of each input vector x.\n",
    "        solver: backend name forwarded to `min_cost_flow_value`.\n",
    "        precision_digits: p in scale = 10**p used when integerizing solver inputs.\n",
    "        eps_pos: constant added after softplus to the learnable costs/capacities.\n",
    "        integerize: \"auto\" enables integer inputs only for \"lemon\"/\"lemon_mcf\";\n",
    "            any other value is converted with bool().\n",
    "        affine_obj: if True, learn alpha and beta applied to the objective.\n",
    "    \"\"\"\n",
    "\n",
    "    def __init__(\n",
    "        self,\n",
    "        graph: DigraphSpec,\n",
    "        input_dim: int,\n",
    "        *,\n",
    "        solver: str = \"gurobi\",\n",
    "        precision_digits: int = 3,\n",
    "        eps_pos: float = 0.0,\n",
    "        integerize: str | bool = \"auto\",\n",
    "        affine_obj: bool = True,\n",
    "    ):\n",
    "        super().__init__()\n",
    "\n",
    "        self.n = int(graph.n)\n",
    "        self.m_learn = int(graph.m_learn)\n",
    "        self.slack = int(graph.slack)\n",
    "\n",
    "        self.solver = str(solver)\n",
    "        self.scale = float(10 ** int(precision_digits))\n",
    "        self.step  = 1.0 / self.scale\n",
    "        self.eps_pos = float(eps_pos)\n",
    "\n",
    "        if integerize == \"auto\":\n",
    "            self.integerize = self.solver.lower() in (\"lemon\", \"lemon_mcf\")\n",
    "        else:\n",
    "            self.integerize = bool(integerize)\n",
    "\n",
    "        # graph buffers (non-persistent: they are not written to the state_dict)\n",
    "        self.register_buffer(\"src\", graph.src.long(), persistent=False)\n",
    "        self.register_buffer(\"dst\", graph.dst.long(), persistent=False)\n",
    "        self.register_buffer(\"b_nodes\", graph.b_nodes.long(), persistent=False)\n",
    "        self.register_buffer(\"A_nodes\", graph.A_nodes.long(), persistent=False)\n",
    "        self.register_buffer(\"fixed_cost\", graph.fixed_cost.float(), persistent=False)\n",
    "        self.register_buffer(\"fixed_cap\",  graph.fixed_cap.float(),  persistent=False)\n",
    "\n",
    "        nb = int(self.b_nodes.numel())\n",
    "        na = int(self.A_nodes.numel())\n",
    "\n",
    "        # learnables\n",
    "        self.A = nn.Parameter(0.01 * torch.randn(na, int(input_dim)))\n",
    "        self.b = nn.Parameter(torch.zeros(nb))\n",
    "\n",
    "        # raw (pre-softplus) costs and capacities of the learnable arcs\n",
    "        self.c_raw = nn.Parameter(0.01 * torch.randn(self.m_learn))\n",
    "        self.u_raw = nn.Parameter(0.01 * torch.randn(self.m_learn))\n",
    "\n",
    "        self.affine_obj = bool(affine_obj)\n",
    "        if self.affine_obj:\n",
    "            self.alpha = nn.Parameter(torch.ones(()))\n",
    "            self.beta  = nn.Parameter(torch.zeros(()))\n",
    "\n",
    "    def _solve_one(self, x1: torch.Tensor) -> torch.Tensor:\n",
    "        \"\"\"Solve the flow problem for one input vector; all arithmetic is done in float64.\"\"\"\n",
    "        dev = x1.device\n",
    "        dt = torch.float64\n",
    "\n",
    "        # nonnegative learnable arc params\n",
    "        c = (F.softplus(self.c_raw) + self.eps_pos).to(dev, dtype=dt)\n",
    "        u = (F.softplus(self.u_raw) + self.eps_pos).to(dev, dtype=dt)\n",
    "\n",
    "        fC = self.fixed_cost.to(dev, dtype=dt)\n",
    "        fU = self.fixed_cap.to(dev, dtype=dt)\n",
    "\n",
    "        # balances\n",
    "        bvec = torch.zeros(self.n, device=dev, dtype=dt)\n",
    "        if self.b_nodes.numel():\n",
    "            bvec[self.b_nodes.to(dev)] = self.b.to(dev, dtype=dt)\n",
    "        if self.A_nodes.numel():\n",
    "            bvec[self.A_nodes.to(dev)] = (self.A.to(dev, dtype=dt) @ x1.to(dtype=dt))\n",
    "        # the slack node takes minus the sum of all other balances, so the total is zero\n",
    "        bvec[self.slack] -= bvec.sum()\n",
    "\n",
    "        if self.integerize:\n",
    "            # integer solver inputs (as float tensors holding integers)\n",
    "            # NOTE(review): fixed costs/caps become value * scale here; confirm the integer\n",
    "            # solver's numeric range covers them (and their products) for the chosen precision.\n",
    "            cI = to_int_scaled(c, self.scale)\n",
    "            uI = to_int_scaled(u, self.scale)\n",
    "            fCI = torch.round(fC * self.scale)\n",
    "            fUI = torch.round(fU * self.scale)\n",
    "\n",
    "            costI = torch.cat([cI, fCI]) if fCI.numel() else cI\n",
    "            capI  = torch.cat([uI, fUI]) if fUI.numel() else uI\n",
    "\n",
    "            bI = to_int_scaled(bvec, self.scale)\n",
    "            # rounding can break the zero-sum property; re-balance through the slack node\n",
    "            bI[self.slack] -= bI.sum()\n",
    "\n",
    "            objI = min_cost_flow_value(self.n, self.src.to(dev), self.dst.to(dev), costI, capI, bI, solver=self.solver)\n",
    "            # costs and flow quantities were both multiplied by scale, hence step ** 2\n",
    "            out = objI * (self.step ** 2)\n",
    "        else:\n",
    "            cost = torch.cat([c, fC]) if fC.numel() else c\n",
    "            cap  = torch.cat([u, fU]) if fU.numel() else u\n",
    "            out = min_cost_flow_value(self.n, self.src.to(dev), self.dst.to(dev), cost, cap, bvec, solver=self.solver)\n",
    "\n",
    "        if self.affine_obj:\n",
    "            out = self.alpha.to(out.dtype) * out + self.beta.to(out.dtype)\n",
    "\n",
    "        return out\n",
    "\n",
    "    def forward(self, x: torch.Tensor) -> torch.Tensor:\n",
    "        \"\"\"Evaluate the layer on one vector (1-D x) or on each row of a batch.\n",
    "\n",
    "        Returns a 0-dim tensor for 1-D input, otherwise a 1-D tensor with one value per\n",
    "        row, cast to x.dtype. An empty batch yields an empty 1-D tensor.\n",
    "        \"\"\"\n",
    "        if x.dim() == 1:\n",
    "            return self._solve_one(x).to(x.dtype)\n",
    "\n",
    "        ys = [self._solve_one(xi) for xi in x]\n",
    "        if not ys:\n",
    "            # torch.stack rejects an empty list; map an empty batch to an empty output\n",
    "            return x.new_zeros((0,))\n",
    "        return torch.stack(ys, 0).to(x.dtype)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "d11fa13a",
   "metadata": {},
   "source": [
    "## Minimal smoke tests (forward + backward)\n",
    "\n",
    "These tests are intentionally small and fast:\n",
    "\n",
    "- graph sanity checks\n",
    "- forward produces finite values\n",
    "- backward produces finite gradients\n",
    "\n",
    "They run for whichever solvers are available."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "dd755750",
   "metadata": {},
   "outputs": [],
   "source": [
    "def _have_gurobi():\n",
    "    \"\"\"Return True when `import gurobipy` succeeds, False otherwise.\"\"\"\n",
    "    try:\n",
    "        import gurobipy  # noqa\n",
    "    except Exception:\n",
    "        return False\n",
    "    else:\n",
    "        return True\n",
    "\n",
    "\n",
    "def smoke_test(device=\"cpu\"):\n",
    "    \"\"\"Check a tiny layered graph, then run forward + backward for every available solver.\n",
    "\n",
    "    Prints a notice and returns early when neither Gurobi nor LEMON is available.\n",
    "    \"\"\"\n",
    "    torch.manual_seed(0)\n",
    "\n",
    "    # graph sanity checks\n",
    "    graph = make_multilayer([3, 4, 3], var_frac=0.5)\n",
    "    assert graph.n == 10\n",
    "    assert graph.m_learn > 0\n",
    "    assert graph.slack not in graph.A_nodes.tolist()\n",
    "    assert graph.slack not in graph.b_nodes.tolist()\n",
    "\n",
    "    x = torch.randn(6, 5, device=device)\n",
    "\n",
    "    availability = ((\"gurobi\", _have_gurobi()), (\"lemon\", HAVE_LEMON))\n",
    "    solvers = [name for name, ok in availability if ok]\n",
    "\n",
    "    if len(solvers) == 0:\n",
    "        print(\"No solvers available in this environment.\")\n",
    "        return\n",
    "\n",
    "    for solver_name in solvers:\n",
    "        net = DFN(\n",
    "            g := graph,\n",
    "            input_dim=5,\n",
    "            solver=solver_name,\n",
    "            integerize=\"auto\",\n",
    "            precision_digits=3,\n",
    "            eps_pos=1e-6,\n",
    "            affine_obj=True,\n",
    "        ) if False else DFN(\n",
    "            graph,\n",
    "            input_dim=5,\n",
    "            solver=solver_name,\n",
    "            integerize=\"auto\",\n",
    "            precision_digits=3,\n",
    "            eps_pos=1e-6,\n",
    "            affine_obj=True,\n",
    "        )\n",
    "        net = net.to(device)\n",
    "\n",
    "        # forward must give a finite scalar\n",
    "        loss = net(x).mean()\n",
    "        assert torch.isfinite(loss).all()\n",
    "\n",
    "        loss.backward()\n",
    "\n",
    "        # every parameter must receive a finite gradient\n",
    "        for name, param in net.named_parameters():\n",
    "            assert param.grad is not None, f\"missing grad: {name}\"\n",
    "            assert torch.isfinite(param.grad).all(), f\"bad grad: {name}\"\n",
    "\n",
    "    print(f\"Smoke test passed for solvers: {solvers}\")\n",
    "\n",
    "\n",
    "smoke_test()\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "name": "python3"
  },
  "language_info": {
   "name": "python",
   "version": "3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}