[
    {
        "description": "This metric evaluates the \"Mean of Absolute Activations\" of the model's activation layers. It measures the average magnitude of activations across the network, indicating the model's activation patterns.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_2(model, inputs, targets):\n    model.eval()\n    activations = []\n    handles = []\n    \n    def hook_fn(module, input, output):\n        activations.append(output.detach().abs().mean().cpu().item())\n    \n    for name, module in model.named_modules():\n        if isinstance(module, nn.ReLU) or isinstance(module, nn.LeakyReLU):\n            handles.append(module.register_forward_hook(hook_fn))\n    \n    model(inputs)\n    mean_activation = sum(activations) / len(activations) if activations else 0\n    \n    for handle in handles:\n        handle.remove()\n    \n    return mean_activation",
        "score": 0.8411749706093619
    },
    {
        "description": "This metric performs an aggregation crossover between \"Mean of Activation Outputs\" and \"Variance of BatchNorm Means\". It combines these two metrics to provide insights into both activation patterns and normalization statistics.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_4(model, inputs, targets):\n    model.eval()\n    activation_means = []\n    batchnorm_means = []\n    handles = []\n    \n    def activation_hook_fn(module, input, output):\n        activation_means.append(output.detach().mean().cpu().item())\n    \n    for name, module in model.named_modules():\n        if isinstance(module, nn.ReLU) or isinstance(module, nn.LeakyReLU):\n            handles.append(module.register_forward_hook(activation_hook_fn))\n        if isinstance(module, nn.BatchNorm2d):\n            batchnorm_means.append(module.running_mean.mean().cpu().item())\n    \n    model(inputs)\n    \n    for handle in handles:\n        handle.remove()\n    \n    mean_activation = sum(activation_means) / len(activation_means) if activation_means else 0\n    variance_batchnorm_means = torch.var(torch.tensor(batchnorm_means)).item() if batchnorm_means else 0\n    \n    return (mean_activation + variance_batchnorm_means) / 2",
        "score": 0.8071905980532438
    },
    {
        "description": "This metric performs an aggregation crossover between \"Nuclear Norm of Jacobian\" and \"Mean of Absolute Gradients of Convolutional Layer Weights\". It combines the nuclear norm of the Jacobian and the mean absolute gradients using a weighted average, providing insights into the model's sensitivity and learning.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_3(model, inputs, targets):\n    # Nuclear Norm of Jacobian component\n    inputs.requires_grad = True\n    outputs = model(inputs)\n    jacobian = torch.autograd.grad(outputs, inputs, grad_outputs=torch.ones_like(outputs), retain_graph=True, create_graph=False)[0]\n    jacobian = jacobian.view(jacobian.size(0), -1)\n    nuclear_norm = torch.sum(torch.sqrt(torch.sum(jacobian**2, dim=1))).cpu().item()\n    \n    # Mean of Absolute Gradients component\n    model.zero_grad()\n    outputs = model(inputs)\n    loss = nn.CrossEntropyLoss()(outputs, targets)\n    loss.backward()\n    grad_score = 0\n    grad_count = 0\n    for name, module in model.named_modules():\n        if isinstance(module, nn.Conv2d):\n            grad = module.weight.grad.detach().abs().mean().cpu()\n            grad_score += grad.item()\n            grad_count += 1\n    grad_score /= grad_count if grad_count > 0 else 1\n    \n    return 0.7 * nuclear_norm + 0.3 * grad_score",
        "score": 0.6809110133706959
    },
    {
        "description": "This metric evaluates the nuclear norm of the Jacobian matrix of the output with respect to the input for a batch of data. It measures the model's sensitivity and stability.",
        "code": "import torch\n\ndef heuristic_3(model, inputs, targets):\n    inputs.requires_grad = True\n    outputs = model(inputs)\n    jacobian = torch.autograd.grad(outputs, inputs, grad_outputs=torch.ones_like(outputs), retain_graph=True, create_graph=False)[0]\n    jacobian = jacobian.view(jacobian.size(0), -1)\n    score = torch.sum(torch.sqrt(torch.sum(jacobian**2, dim=1)))\n    return score.cpu().item()",
        "score": 0.6597366019204223
    },
    {
        "description": "This metric performs an operation crossover between \"Spectral Norm of Jacobian\" and \"Mean of Absolute Gradients of Convolutional Layer Weights\". It combines the spectral norm of the Jacobian with the mean absolute gradients of convolutional layer weights, providing insights into the model's sensitivity and learning.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_1(model, inputs, targets):\n    # Spectral Norm of Jacobian component\n    inputs.requires_grad = True\n    outputs = model(inputs)\n    jacobian = torch.autograd.grad(outputs[:, 0].sum(), inputs, retain_graph=True, create_graph=False)[0].cpu()\n    _, s, _ = torch.svd(jacobian.view(jacobian.size(0), -1))\n    spectral_norm = s[0].item()\n    \n    # Mean of Absolute Gradients component\n    model.zero_grad()\n    outputs = model(inputs)\n    loss = nn.CrossEntropyLoss()(outputs, targets)\n    loss.backward()\n    grad_score = 0\n    grad_count = 0\n    for name, module in model.named_modules():\n        if isinstance(module, nn.Conv2d):\n            grad = module.weight.grad.detach().abs().mean().cpu()\n            grad_score += grad.item()\n            grad_count += 1\n    grad_score /= grad_count if grad_count > 0 else 1\n    \n    return (spectral_norm + grad_score) / 2",
        "score": 0.6542582716740644
    }
]