[
    {
        "description": "Combines the BatchNorm stable rank from proxy 4 with the weight norm ratio from proxy 1 using structure crossover. Computes the sum of the BatchNorm stable ranks multiplied by the sum of the weight norm ratios.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_4(model, inputs, targets):\n    bn_ranks = []\n    ratios = []\n    hooks = []\n    \n    def bn_hook(module, inp, out):\n        if isinstance(out, torch.Tensor):\n            B, C, H, W = out.shape\n            mat = out.view(B, C, -1).permute(0, 2, 1).reshape(-1, C)\n            frob_norm = torch.linalg.matrix_norm(mat, ord='fro')**2\n            spec_norm = torch.linalg.matrix_norm(mat, ord=2)**2\n            stable_rank = frob_norm / (spec_norm + 1e-6)\n            bn_ranks.append(stable_rank.mean())\n    \n    for layer in model.modules():\n        if isinstance(layer, nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_hook))\n        elif isinstance(layer, nn.Conv2d):\n            weights = layer.weight\n            l1_norm = weights.abs().sum(dim=(1,2,3)).mean()\n            l2_norm = weights.norm(p=2, dim=(1,2,3)).mean()\n            ratios.append((l1_norm / l2_norm).item())\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    bn_sum = torch.stack(bn_ranks).sum().item() if bn_ranks else 0.0\n    ratio_sum = sum(ratios) if ratios else 0.0\n    \n    return bn_sum * ratio_sum",
        "score": 0.8619524622217951
    },
    {
        "description": "Combines the BatchNorm stable rank from proxy 4 with the convolutional stable rank from proxy 3 using structure crossover. Computes the maximum of the sum of BatchNorm stable ranks and the sum of convolutional stable ranks.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_3(model, inputs, targets):\n    bn_ranks = []\n    conv_ranks = []\n    hooks = []\n    \n    def bn_hook(module, inp, out):\n        if isinstance(out, torch.Tensor):\n            B, C, H, W = out.shape\n            mat = out.view(B, C, -1).permute(0, 2, 1).reshape(-1, C)\n            frob_norm = torch.linalg.matrix_norm(mat, ord='fro')**2\n            spec_norm = torch.linalg.matrix_norm(mat, ord=2)**2\n            stable_rank = frob_norm / (spec_norm + 1e-6)\n            bn_ranks.append(stable_rank.mean())\n    \n    def conv_hook(module, inp, out):\n        if isinstance(out, torch.Tensor):\n            B, C, H, W = out.shape\n            mat = out.view(B, C, -1).permute(0, 2, 1).reshape(-1, C)\n            frob_norm = torch.linalg.matrix_norm(mat, ord='fro')**2\n            spec_norm = torch.linalg.matrix_norm(mat, ord=2)**2\n            stable_rank = frob_norm / (spec_norm + 1e-6)\n            conv_ranks.append(stable_rank.mean())\n    \n    for layer in model.modules():\n        if isinstance(layer, nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_hook))\n        elif isinstance(layer, nn.Conv2d):\n            hooks.append(layer.register_forward_hook(conv_hook))\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    bn_sum = torch.stack(bn_ranks).sum().item() if bn_ranks else 0.0\n    conv_sum = torch.stack(conv_ranks).sum().item() if conv_ranks else 0.0\n    \n    return max(bn_sum, conv_sum)",
        "score": 0.8551750657160976
    },
    {
        "description": "Combines the weight norm ratio from proxy 1 with the convolutional stable rank from proxy 2 using operation crossover. Computes the product of the sum of weight norm ratios and the sum of convolutional stable ranks.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_5(model, inputs, targets):\n    conv_ranks = []\n    ratios = []\n    hooks = []\n    \n    def conv_hook(module, inp, out):\n        if isinstance(out, torch.Tensor):\n            B, C, H, W = out.shape\n            mat = out.view(B, C, -1).permute(0, 2, 1).reshape(-1, C)\n            frob_norm = torch.linalg.matrix_norm(mat, ord='fro')**2\n            spec_norm = torch.linalg.matrix_norm(mat, ord=2)**2\n            stable_rank = frob_norm / (spec_norm + 1e-6)\n            conv_ranks.append(stable_rank.mean())\n    \n    for layer in model.modules():\n        if isinstance(layer, nn.Conv2d):\n            hooks.append(layer.register_forward_hook(conv_hook))\n            weights = layer.weight\n            l1_norm = weights.abs().sum(dim=(1,2,3)).mean()\n            l2_norm = weights.norm(p=2, dim=(1,2,3)).mean()\n            ratios.append((l1_norm / l2_norm).item())\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    conv_sum = torch.stack(conv_ranks).sum().item() if conv_ranks else 1.0\n    ratio_sum = sum(ratios) if ratios else 1.0\n    \n    return conv_sum * ratio_sum",
        "score": 0.8404788293980506
    },
    {
        "description": "Combines the BatchNorm stable rank from proxy 1 with the weight norm ratio from proxy 2. Computes the sum of stable ranks from BatchNorm outputs multiplied by the sum of weight norm ratios from 3x3 convolutional layers.",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_5(model, inputs, targets):\n    ranks = []\n    ratios = []\n    hooks = []\n    \n    def bn_hook(module, inp, out):\n        if isinstance(out, torch.Tensor):\n            B, C, H, W = out.shape\n            mat = out.view(B, C, -1).permute(0, 2, 1).reshape(-1, C)\n            frob_norm = torch.linalg.matrix_norm(mat, ord='fro')**2\n            spec_norm = torch.linalg.matrix_norm(mat, ord=2)**2\n            stable_rank = frob_norm / (spec_norm + 1e-6)\n            ranks.append(stable_rank.mean())\n    \n    for layer in model.modules():\n        if isinstance(layer, nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_hook))\n        elif isinstance(layer, nn.Conv2d) and layer.kernel_size == (3, 3):\n            weights = layer.weight\n            l1_norm = weights.abs().sum(dim=(1,2,3)).mean()\n            l2_norm = weights.norm(p=2, dim=(1,2,3)).mean()\n            ratios.append((l1_norm / l2_norm).item())\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    rank_sum = torch.stack(ranks).sum().item() if ranks else 0.0\n    ratio_sum = sum(ratios) if ratios else 0.0\n    \n    return rank_sum * ratio_sum",
        "score": 0.8357808074088738
    },
    {
        "description": "Combines the BatchNorm stable rank from proxy 4 with the weight norm ratio from proxy 1 using aggregation crossover. Computes the weighted sum of BatchNorm stable ranks (0.6) and weight norm ratios (0.4).",
        "code": "import torch\nimport torch.nn as nn\n\ndef heuristic_4(model, inputs, targets):\n    bn_ranks = []\n    ratios = []\n    hooks = []\n    \n    def bn_hook(module, inp, out):\n        if isinstance(out, torch.Tensor):\n            B, C, H, W = out.shape\n            mat = out.view(B, C, -1).permute(0, 2, 1).reshape(-1, C)\n            frob_norm = torch.linalg.matrix_norm(mat, ord='fro')**2\n            spec_norm = torch.linalg.matrix_norm(mat, ord=2)**2\n            stable_rank = frob_norm / (spec_norm + 1e-6)\n            bn_ranks.append(stable_rank.mean())\n    \n    for layer in model.modules():\n        if isinstance(layer, nn.BatchNorm2d):\n            hooks.append(layer.register_forward_hook(bn_hook))\n        elif isinstance(layer, nn.Conv2d):\n            weights = layer.weight\n            l1_norm = weights.abs().sum(dim=(1,2,3)).mean()\n            l2_norm = weights.norm(p=2, dim=(1,2,3)).mean()\n            ratios.append((l1_norm / l2_norm).item())\n    \n    with torch.no_grad():\n        model(inputs)\n    \n    for hook in hooks:\n        hook.remove()\n    \n    bn_sum = torch.stack(bn_ranks).sum().item() if bn_ranks else 0.0\n    ratio_sum = sum(ratios) if ratios else 0.0\n    \n    return 0.6 * bn_sum + 0.4 * ratio_sum",
        "score": 0.8354877014552566
    }
]