[
    {
        "description": "Combines the max activation values from convolutional layers with the mean of BatchNorm variances, emphasizing peak activations and stable feature scaling.",
        "code": "import torch\n\ndef heuristic_17(model, inputs, targets):\n    model.eval()\n    max_activations = []\n    bn_vars = []\n    hooks = []\n    for name, module in model.named_modules():\n        if isinstance(module, torch.nn.Conv2d):\n            def hook_fn(_, __, output):\n                max_val = torch.max(output).item()\n                max_activations.append(max_val)\n            hooks.append(module.register_forward_hook(hook_fn))\n        if isinstance(module, torch.nn.BatchNorm2d):\n            var = module.running_var.cpu()\n            bn_vars.append(torch.mean(var).item())\n    _ = model(inputs.cuda())\n    for hook in hooks:\n        hook.remove()\n    return (sum(max_activations) / len(max_activations) if max_activations else 0) + (sum(bn_vars) / len(bn_vars) if bn_vars else 0)",
        "score": 0.8856825749167592
    },
    {
        "description": "This metric evaluates the variance of BatchNorm statistics (mean and variance) across all BatchNorm layers. Larger variance indicates more dynamic feature scaling, which can enhance model expressiveness.",
        "code": "import torch\n\ndef heuristic_6(model, inputs, targets):\n    model.eval()\n    variances = []\n    for module in model.modules():\n        if isinstance(module, torch.nn.BatchNorm2d):\n            mean = module.running_mean.cpu()\n            var = module.running_var.cpu()\n            stats = torch.cat([mean, torch.sqrt(var + 1e-5)])\n            variances.append(torch.var(stats).item())\n    return sum(variances) / len(variances) if variances else 0",
        "score": 0.8641012034398905
    },
    {
        "description": "This metric calculates the normalized L1 norm of gradients with respect to weights in convolutional layers, emphasizing sparsity.",
        "code": "import torch\n\ndef heuristic_10(model, inputs, targets):\n    model.eval()\n    l1_norms = []\n    for name, param in model.named_parameters():\n        if 'conv' in name and 'weight' in name:\n            param.requires_grad_(True)\n            outputs = model(inputs.cuda())\n            loss = torch.sum(outputs)\n            grads = torch.autograd.grad(loss, param, retain_graph=True)[0].detach().cpu()\n            l1_norm = torch.norm(grads, p=1).item()\n            l1_norms.append(l1_norm)\n            param.requires_grad_(False)\n    return sum(l1_norms) / len(l1_norms) if l1_norms else 0",
        "score": 0.8375061366659832
    },
    {
        "description": "Combines the normalized L1 norm of gradients with respect to weights in convolutional layers and the variance of BatchNorm statistics, emphasizing both sparsity and dynamic feature scaling.",
        "code": "import torch\n\ndef heuristic_13(model, inputs, targets):\n    model.eval()\n    l1_norms = []\n    variances = []\n    for name, param in model.named_parameters():\n        if 'conv' in name and 'weight' in name:\n            param.requires_grad_(True)\n            outputs = model(inputs.cuda())\n            loss = torch.sum(outputs)\n            grads = torch.autograd.grad(loss, param, retain_graph=True)[0].detach().cpu()\n            l1_norm = torch.norm(grads, p=1).item()\n            l1_norms.append(l1_norm)\n            param.requires_grad_(False)\n    for module in model.modules():\n        if isinstance(module, torch.nn.BatchNorm2d):\n            mean = module.running_mean.cpu()\n            var = module.running_var.cpu()\n            stats = torch.cat([mean, torch.sqrt(var + 1e-5)])\n            variances.append(torch.var(stats).item())\n    return (sum(l1_norms) / len(l1_norms) if l1_norms else 0) + (sum(variances) / len(variances) if variances else 0)",
        "score": 0.8309071512373737
    },
    {
        "description": "This metric merges the smoothness of decision boundaries (gradient norm) with activation entropy to assess generalization and representation diversity.",
        "code": "import torch\nimport numpy as np\n\ndef heuristic_7(model, inputs, targets):\n    model.eval()\n    inputs.requires_grad_(True)\n    outputs = model(inputs.cuda())\n    loss = torch.sum(outputs)\n    grads = torch.autograd.grad(loss, inputs)[0].detach().cpu()\n    grad_norm = torch.norm(grads, p=2, dim=(1, 2, 3)).mean().item()\n    \n    entropies = []\n    hooks = []\n    for name, module in model.named_modules():\n        if isinstance(module, torch.nn.Conv2d):\n            def hook_fn(_, __, output):\n                activations = output.flatten(1).cpu()\n                prob = torch.softmax(activations, dim=1)\n                entropy = -torch.sum(prob * torch.log(prob + 1e-8), dim=1).mean().item()\n                entropies.append(entropy)\n            hooks.append(module.register_forward_hook(hook_fn))\n    _ = model(inputs.cuda())\n    for hook in hooks:\n        hook.remove()\n    \n    entropy_score = np.mean(entropies) if entropies else 0.0\n    return grad_norm * entropy_score",
        "score": 0.7552700771726557
    }
]