[
    {
        "description": "This metric computes the average channel-wise correlation of feature maps across different spatial positions. Lower correlation indicates more diverse local features. We average the off-diagonal elements of the spatial correlation matrix for each channel.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_4(model, inputs, targets):\n    model.eval()\n    total_corr = 0.0\n    count = 0\n    \n    def hook_fn(module, input, output):\n        nonlocal total_corr, count\n        if isinstance(module, nn.Conv2d):\n            b, c, h, w = output.shape\n            if h * w < 2:\n                return\n            flattened = output.flatten(2)  # [b, c, h*w]\n            corr = torch.bmm(flattened, flattened.transpose(1, 2)) / (h * w)\n            mask = ~torch.eye(c, device=corr.device).bool()\n            avg_corr = corr[:, mask].abs().mean()\n            total_corr += avg_corr\n            count += 1\n    \n    hooks = []\n    for layer in model.modules():\n        if isinstance(layer, nn.Conv2d):\n            hooks.append(layer.register_forward_hook(hook_fn))\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    avg_corr = total_corr / count if count > 0 else 0.0\n    return (1 - avg_corr).cpu().item()",
        "score": 0.8119244975063108
    },
    {
        "description": "This metric evaluates the ratio of positive to negative activations in feature maps across all layers. A balanced ratio may indicate better representation capability as it suggests the network is learning both inhibitory and excitatory features.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_5(model, inputs, targets):\n    pos_neg_ratios = []\n    hooks = []\n    \n    def hook_fn(module, input, output):\n        if isinstance(output, torch.Tensor):\n            pos = (output > 0).float().mean()\n            neg = (output < 0).float().mean()\n            ratio = (pos + 1e-6) / (neg + 1e-6)\n            pos_neg_ratios.append(ratio.log())\n    \n    for layer in model.modules():\n        if isinstance(layer, (nn.Conv2d, nn.ReLU)):\n            hooks.append(layer.register_forward_hook(hook_fn))\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    if not pos_neg_ratios:\n        return 0.0\n    \n    avg_ratio = torch.stack(pos_neg_ratios).mean().exp()\n    return (1.0 / (1.0 + (avg_ratio - 1.0).abs())).cpu().item()",
        "score": 0.810646973849288
    },
    {
        "description": "This metric merges the rank estimation from proxy 3 with the sparsity measurement from proxy 4. It computes the average rank of feature maps weighted by their sparsity, favoring layers with both high rank and low sparsity.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_2(model, inputs, targets):\n    ranks = []\n    sparsities = []\n    hooks = []\n    \n    def hook_fn(module, input, output):\n        if isinstance(module, nn.Conv2d):\n            # Rank estimation part\n            B, C, H, W = output.shape\n            features = output.permute(0, 2, 3, 1).reshape(-1, C)\n            U, S, V = torch.svd(features)\n            threshold = S.max() * 1e-3\n            rank = (S > threshold).sum().float()\n            min_rank = min(features.shape)\n            ranks.append(rank / min_rank)\n            \n            # Sparsity part\n            abs_output = output.abs()\n            sparsity = (abs_output < 1e-3).float().mean()\n            sparsities.append(sparsity)\n    \n    for module in model.modules():\n        if isinstance(module, nn.Conv2d):\n            hooks.append(module.register_forward_hook(hook_fn))\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    if not ranks:\n        return 0.0\n    \n    avg_rank = torch.stack(ranks).mean()\n    avg_sparsity = torch.stack(sparsities).mean()\n    return (avg_rank * (1 - avg_sparsity)).cpu().item()",
        "score": 0.7804149235891743
    },
    {
        "description": "This metric combines the rank estimation from proxy 4 with the positive-negative ratio from proxy 2. It computes the normalized rank of feature maps weighted by their balance between positive and negative activations, favoring layers with both high rank and balanced activations.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_8(model, inputs, targets):\n    ranks = []\n    pos_neg_ratios = []\n    hooks = []\n    \n    def hook_fn(module, input, output):\n        if isinstance(module, nn.Conv2d):\n            # Rank estimation part\n            B, C, H, W = output.shape\n            features = output.permute(0, 2, 3, 1).reshape(-1, C)\n            U, S, V = torch.svd(features)\n            threshold = S.max() * 1e-3\n            rank = (S > threshold).sum().float()\n            min_rank = min(features.shape)\n            ranks.append(rank / min_rank)\n            \n            # Positive-negative ratio part\n            pos = (output > 0).float().mean()\n            neg = (output < 0).float().mean()\n            ratio = (pos + 1e-6) / (neg + 1e-6)\n            pos_neg_ratios.append(ratio.log())\n    \n    for module in model.modules():\n        if isinstance(module, nn.Conv2d):\n            hooks.append(module.register_forward_hook(hook_fn))\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    if not ranks or not pos_neg_ratios:\n        return 0.0\n    \n    avg_rank = torch.stack(ranks).mean()\n    avg_ratio = torch.stack(pos_neg_ratios).mean().exp()\n    balance_score = 1.0 / (1.0 + (avg_ratio - 1.0).abs())\n    return (avg_rank * balance_score).cpu().item()",
        "score": 0.751531450940651
    },
    {
        "description": "This metric computes the average rank of feature maps across different convolutional layers using singular value decomposition. The rank is estimated as the number of singular values above a threshold (1e-3 of the maximum singular value), normalized by the minimum possible rank.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_4(model, inputs, targets):\n    ranks = []\n    hooks = []\n    \n    def hook_fn(module, input, output):\n        if isinstance(output, tuple):\n            output = output[0]\n        # Reshape to (batch*H*W, channels)\n        B, C, H, W = output.shape\n        features = output.permute(0, 2, 3, 1).reshape(-1, C)\n        \n        # Compute SVD\n        U, S, V = torch.svd(features)\n        \n        # Estimate rank\n        threshold = S.max() * 1e-3\n        rank = (S > threshold).sum().float()\n        min_rank = min(features.shape)\n        ranks.append((rank / min_rank).item())\n    \n    # Register hooks on all Conv2d layers\n    for module in model.modules():\n        if isinstance(module, nn.Conv2d):\n            hooks.append(module.register_forward_hook(hook_fn))\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    # Remove hooks\n    for hook in hooks:\n        hook.remove()\n    \n    if not ranks:\n        return 0.0\n    \n    return sum(ranks) / len(ranks)",
        "score": 0.7453509183504514
    }
]