[
    {
        "description": "This metric combines the sum of BatchNorm layer output variances from proxy 1 with the variance of the weights in the first convolutional layer from proxy 4, emphasizing normalization variance and initial layer weight variability.",
        "code": "import torch\n\ndef heuristic_4(model, inputs, targets):\n    bn_variances = []\n    first_conv_weight_variance = None\n    \n    def bn_hook(module, input, output):\n        if isinstance(module, torch.nn.BatchNorm2d):\n            variance = torch.var(output).item()\n            bn_variances.append(variance)\n    \n    for layer in model.modules():\n        if isinstance(layer, torch.nn.Conv2d) and first_conv_weight_variance is None:\n            first_conv_weight_variance = torch.var(layer.weight).item()\n    \n    hooks = []\n    for layer in model.modules():\n        if isinstance(layer, torch.nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_hook))\n    \n    outputs = model(inputs)\n    loss = torch.nn.functional.cross_entropy(outputs, targets)\n    loss.backward()\n    \n    for hook in hooks:\n        hook.remove()\n    \n    sum_bn_variance_score = torch.tensor(bn_variances).sum().item()\n    return sum_bn_variance_score + (first_conv_weight_variance if first_conv_weight_variance is not None else 0)",
        "score": 0.8474033614676059
    },
    {
        "description": "This metric combines the sum of the maximum values of BatchNorm layer outputs with the mean gradient magnitude of convolutional layers, emphasizing peak normalization outputs and optimization dynamics.",
        "code": "import torch\n\ndef heuristic_3(model, inputs, targets):\n    bn_max_outputs = []\n    conv_gradient_magnitudes = []\n    \n    def bn_max_hook(module, input, output):\n        if isinstance(module, torch.nn.BatchNorm2d):\n            max_output = output.max().item()\n            bn_max_outputs.append(max_output)\n    \n    def conv_gradient_hook(module, grad_input, grad_output):\n        if isinstance(module, torch.nn.Conv2d):\n            grad_magnitude = grad_output[0].abs().mean().item()\n            conv_gradient_magnitudes.append(grad_magnitude)\n    \n    hooks = []\n    for layer in model.modules():\n        if isinstance(layer, torch.nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_max_hook))\n        if isinstance(layer, torch.nn.Conv2d):\n            hooks.append(layer.register_backward_hook(conv_gradient_hook))\n    \n    outputs = model(inputs)\n    loss = torch.nn.functional.cross_entropy(outputs, targets)\n    loss.backward()\n    \n    for hook in hooks:\n        hook.remove()\n    \n    sum_bn_max_output_score = torch.tensor(bn_max_outputs).sum().item()\n    mean_conv_gradient_score = torch.tensor(conv_gradient_magnitudes).mean().item()\n    return sum_bn_max_output_score + mean_conv_gradient_score",
        "score": 0.8265881177670837
    },
    {
        "description": "This metric combines the sum of the maximum values of BatchNorm layer outputs with the variance of the output of the last residual block, highlighting peak normalization outputs and variability in the final block's output.",
        "code": "import torch\n\ndef heuristic_1(model, inputs, targets):\n    bn_max_outputs = []\n    last_res_block_output_variance = None\n    \n    def bn_hook(module, input, output):\n        if isinstance(module, torch.nn.BatchNorm2d):\n            max_output = output.max().item()\n            bn_max_outputs.append(max_output)\n    \n    def res_block_hook(module, input, output):\n        nonlocal last_res_block_output_variance\n        if isinstance(module, torch.nn.Sequential):\n            last_res_block_output_variance = torch.var(output).item()\n    \n    hooks = []\n    for layer in model.modules():\n        if isinstance(layer, torch.nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_hook))\n        if isinstance(layer, torch.nn.Sequential):\n            hooks.append(layer.register_forward_hook(res_block_hook))\n    \n    outputs = model(inputs)\n    loss = torch.nn.functional.cross_entropy(outputs, targets)\n    loss.backward()\n    \n    for hook in hooks:\n        hook.remove()\n    \n    sum_bn_max_output_score = torch.tensor(bn_max_outputs).sum().item()\n    return sum_bn_max_output_score + (last_res_block_output_variance if last_res_block_output_variance is not None else 0)",
        "score": 0.8130883013954319
    },
    {
        "description": "This metric combines the sum of BatchNorm layer output variances from proxy 4 with the mean gradient magnitude of BatchNorm layers from proxy 5, emphasizing both normalization variance and optimization dynamics.",
        "code": "import torch\n\ndef heuristic_8(model, inputs, targets):\n    bn_variances = []\n    gradient_magnitudes = []\n    \n    def bn_variance_hook(module, input, output):\n        if isinstance(module, torch.nn.BatchNorm2d):\n            variance = torch.var(output).item()\n            bn_variances.append(variance)\n    \n    def bn_gradient_hook(module, grad_input, grad_output):\n        if isinstance(module, torch.nn.BatchNorm2d):\n            grad_magnitude = grad_output[0].abs().mean().item()\n            gradient_magnitudes.append(grad_magnitude)\n    \n    hooks = []\n    for layer in model.modules():\n        if isinstance(layer, torch.nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_variance_hook))\n            hooks.append(layer.register_backward_hook(bn_gradient_hook))\n    \n    outputs = model(inputs)\n    loss = torch.nn.functional.cross_entropy(outputs, targets)\n    loss.backward()\n    \n    for hook in hooks:\n        hook.remove()\n    \n    sum_bn_variance_score = torch.tensor(bn_variances).sum().item()\n    mean_gradient_score = torch.tensor(gradient_magnitudes).mean().item()\n    return sum_bn_variance_score + mean_gradient_score",
        "score": 0.7879784003007089
    },
    {
        "description": "This metric combines the sum of the minimum values of BatchNorm layer outputs with the mean gradient magnitude of the activation outputs from ReLU layers, emphasizing minimal normalization outputs and optimization dynamics.",
        "code": "import torch\n\ndef heuristic_3(model, inputs, targets):\n    bn_min_outputs = []\n    relu_gradient_magnitudes = []\n    \n    def bn_min_hook(module, input, output):\n        if isinstance(module, torch.nn.BatchNorm2d):\n            min_output = output.min().item()\n            bn_min_outputs.append(min_output)\n    \n    def relu_gradient_hook(module, grad_input, grad_output):\n        if isinstance(module, torch.nn.ReLU):\n            grad_magnitude = grad_output[0].abs().mean().item()\n            relu_gradient_magnitudes.append(grad_magnitude)\n    \n    hooks = []\n    for layer in model.modules():\n        if isinstance(layer, torch.nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_min_hook))\n        if isinstance(layer, torch.nn.ReLU):\n            hooks.append(layer.register_backward_hook(relu_gradient_hook))\n    \n    outputs = model(inputs)\n    loss = torch.nn.functional.cross_entropy(outputs, targets)\n    loss.backward()\n    \n    for hook in hooks:\n        hook.remove()\n    \n    sum_bn_min_output_score = torch.tensor(bn_min_outputs).sum().item()\n    mean_relu_gradient_score = torch.tensor(relu_gradient_magnitudes).mean().item()\n    return sum_bn_min_output_score + mean_relu_gradient_score",
        "score": 0.7798932771247215
    }
]