[
    {
        "description": "This metric, named \"Feature-BatchNorm Sensitivity Blend (FBSB)\", is a crossover of proxy 1 (Feature-BatchNorm Diversity Ratio) and proxy 5 (Feature Diversity Score) using Input Crossover and Aggregation Crossover. It combines feature map diversity from proxy 5 and BatchNorm statistics from proxy 1 as inputs, and aggregates the results using a weighted average instead of a simple ratio to balance the contributions of diversity and stability.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_1(model, inputs, targets):\n    model.eval()\n    with torch.no_grad():\n        intermediate_outputs = []\n        bn_stats = []\n        \n        def hook(module, input, output):\n            intermediate_outputs.append(output)\n        \n        conv_layers = [m for m in model.modules() if isinstance(m, nn.Conv2d)]\n        if len(conv_layers) > 0:\n            selected_layer = conv_layers[len(conv_layers)//2]\n            handle = selected_layer.register_forward_hook(hook)\n        \n        _ = model(inputs)\n        if handle is not None:\n            handle.remove()\n        \n        for module in model.modules():\n            if isinstance(module, nn.BatchNorm2d):\n                running_mean = module.running_mean\n                running_var = module.running_var\n                stability = torch.max(torch.abs(running_mean - running_var))\n                bn_stats.append(stability)\n        \n        if len(intermediate_outputs) == 0 or not bn_stats:\n            return torch.tensor(0.0).cpu()\n        \n        feat_map = intermediate_outputs[0]\n        batch_std = torch.std(feat_map, dim=(2, 3), unbiased=False)\n        channel_diversity = torch.mean(batch_std, dim=0)\n        diversity_score = torch.mean(channel_diversity) / (feat_map.shape[1] + 1e-8)\n        bn_score = sum(bn_stats) / len(bn_stats)\n        \n        combined_score = 0.7 * diversity_score + 0.3 * bn_score\n        return combined_score.cpu()",
        "score": 0.8386366923321344
    },
    {
        "description": "This metric, named \"Feature Diversity-Stability Sum (FDSS)\", is a crossover of proxy 2 (Feature-BatchNorm Diversity Ratio) and proxy 5 (Feature-Weight Diversity Blend) using Aggregation Crossover and Operation Crossover. It retains the feature diversity and BatchNorm inputs from proxy 2 and the weighted addition from proxy 5, but replaces the ratio operation in proxy 2 with a sum aggregation to combine diversity and stability scores.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_4(model, inputs, targets):\n    model.eval()\n    with torch.no_grad():\n        intermediate_outputs = []\n        bn_stats = []\n        \n        def hook(module, input, output):\n            intermediate_outputs.append(output)\n        \n        conv_layers = [m for m in model.modules() if isinstance(m, nn.Conv2d)]\n        if len(conv_layers) > 0:\n            selected_layer = conv_layers[len(conv_layers)//2]\n            handle = selected_layer.register_forward_hook(hook)\n        \n        _ = model(inputs)\n        if handle is not None:\n            handle.remove()\n        \n        for module in model.modules():\n            if isinstance(module, nn.BatchNorm2d):\n                running_mean = module.running_mean\n                running_var = module.running_var\n                stability = torch.max(torch.abs(running_mean - running_var))\n                bn_stats.append(stability)\n        \n        if len(intermediate_outputs) == 0 or not bn_stats:\n            return torch.tensor(0.0).cpu()\n        \n        feat_map = intermediate_outputs[0]\n        batch_std = torch.std(feat_map, dim=(2, 3), unbiased=False)\n        channel_diversity = torch.mean(batch_std, dim=0)\n        diversity_score = torch.mean(channel_diversity) / (feat_map.shape[1] + 1e-8)\n        bn_score = sum(bn_stats) / len(bn_stats)\n        \n        combined_score = diversity_score + bn_score\n        return combined_score.cpu()",
        "score": 0.8187914335353933
    },
    {
        "description": "This metric, named \"Feature-BatchNorm Diversity Ratio (FBDR)\", is a crossover of proxy 4 (Feature Diversity Score) and proxy 2 (BatchNorm Stability Index) using Input Crossover and Operation Crossover. It combines feature map diversity from proxy 4 and BatchNorm statistics from proxy 2 as inputs, and replaces the simple mean operation in proxy 4 with a division to measure the ratio of feature diversity to BatchNorm stability.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_5(model, inputs, targets):\n    model.eval()\n    with torch.no_grad():\n        intermediate_outputs = []\n        bn_stats = []\n        \n        def hook(module, input, output):\n            intermediate_outputs.append(output)\n        \n        conv_layers = [m for m in model.modules() if isinstance(m, nn.Conv2d)]\n        if len(conv_layers) > 0:\n            selected_layer = conv_layers[len(conv_layers)//2]\n            handle = selected_layer.register_forward_hook(hook)\n        \n        _ = model(inputs)\n        if handle is not None:\n            handle.remove()\n        \n        for module in model.modules():\n            if isinstance(module, nn.BatchNorm2d):\n                running_mean = module.running_mean\n                running_var = module.running_var\n                stability = torch.max(torch.abs(running_mean - running_var))\n                bn_stats.append(stability)\n        \n        if len(intermediate_outputs) == 0 or not bn_stats:\n            return torch.tensor(0.0).cpu()\n        \n        feat_map = intermediate_outputs[0]\n        batch_std = torch.std(feat_map, dim=(2, 3), unbiased=False)\n        channel_diversity = torch.mean(batch_std, dim=0)\n        diversity_score = torch.mean(channel_diversity) / (feat_map.shape[1] + 1e-8)\n        bn_score = sum(bn_stats) / len(bn_stats)\n        \n        combined_score = diversity_score / (bn_score + 1e-8)\n        return combined_score.cpu()",
        "score": 0.8092147763169828
    },
    {
        "description": "This metric, named \"Feature Diversity-Gradient Balance (FDGB)\", is a crossover of proxy 1 (Feature-Weight Diversity Blend) and proxy 5 (Gradient-Feature Sensitivity) using Operation Crossover and Aggregation Crossover. It retains the feature diversity and gradient inputs from both parents, replaces the weighted addition in proxy 1 with a subtraction operation to capture contrast between diversity and sensitivity, and aggregates results using a mean operation for balance.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_5(model, inputs, targets):\n    model.eval()\n    with torch.no_grad():\n        intermediate_outputs = []\n        grad_mags = []\n        \n        def hook(module, input, output):\n            intermediate_outputs.append(output)\n            if output.requires_grad:\n                grad = torch.autograd.grad(output.mean(), input[0], create_graph=False)[0]\n                if grad is not None:\n                    grad_mags.append(grad.abs().mean())\n        \n        conv_layers = [m for m in model.modules() if isinstance(m, nn.Conv2d)]\n        if len(conv_layers) > 0:\n            selected_layer = conv_layers[len(conv_layers)//2]\n            handle = selected_layer.register_forward_hook(hook)\n        \n        _ = model(inputs)\n        if handle is not None:\n            handle.remove()\n        \n        if len(intermediate_outputs) == 0:\n            return torch.tensor(0.0).cpu()\n        \n        feat_map = intermediate_outputs[0]\n        batch_std = torch.std(feat_map, dim=(2, 3), unbiased=False)\n        channel_diversity = torch.mean(batch_std, dim=0)\n        diversity_score = torch.mean(channel_diversity) / (feat_map.shape[1] + 1e-8)\n        grad_score = sum(grad_mags) / len(grad_mags) if grad_mags else torch.tensor(0.0)\n        \n        combined_score = (diversity_score - grad_score).abs()\n        return combined_score.cpu()",
        "score": 0.7786174807489948
    },
    {
        "description": "This metric, named \"BatchNorm Stability Index (BNSI)\", applies an Input Mutation by replacing feature map outputs with BatchNorm statistics (running mean and variance) as inputs to evaluate the stability of feature distributions across layers. It also uses an Operation Mutation by computing the maximum of the absolute differences between running mean and variance instead of standard deviation or mean. Finally, an Aggregation Mutation is applied by using a sum operation across layers to aggregate the stability scores into a single scalar.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_1(model, inputs, targets):\n    model.eval()\n    with torch.no_grad():\n        bn_stats = []\n        \n        for module in model.modules():\n            if isinstance(module, nn.BatchNorm2d):\n                running_mean = module.running_mean\n                running_var = module.running_var\n                stability = torch.max(torch.abs(running_mean - running_var))\n                bn_stats.append(stability)\n        \n        if not bn_stats:\n            return torch.tensor(0.0).cpu()\n        \n        final_score = sum(bn_stats)\n        return final_score.cpu()",
        "score": 0.7208874668814673
    }
]