{
  "aggregate_metrics": {
    "train_r": 0.3318268083032877,
    "train_p": 1.1434878501278425e-83,
    "val_r": 0.26481052279597517,
    "val_p": 3.696237311518426e-07
  },
  "per_fold_stats": {
    "train_r_mean": 0.5145121386564082,
    "train_r_std": 0.08159380308796446,
    "val_r_mean": 0.3935141877602133,
    "val_r_std": 0.1800244871190147
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 14.119417190551758,
    "right_subspace_overlap_bottom_k": -5.767834663391113,
    "interaction_matrix_overlap_top_k": 12.556540489196777,
    "interaction_matrix_overlap_bottom_k": 11.321340560913086,
    "effective_rank": 4.034346580505371,
    "effective_rank_mergeability_score": 4.600121974945068,
    "stable_rank": -2.1511895656585693,
    "spectral_gap": 5.348729133605957,
    "singular_value_ratio": -2.1478819847106934,
    "layerwise_effective_rank": -5.67301082611084,
    "layerwise_effective_rank_mergeability_score": 0.07685728371143341,
    "singular_value_overlap": -20.46152114868164,
    "subspace_overlap": 17.619558334350586,
    "right_subspace_overlap": 12.905008316040039,
    "activation_l2_distance": -7.2193284034729,
    "activation_cosine_similarity": 15.962809562683105,
    "activation_magnitude_ratio": -5.314408302307129,
    "activation_dot_product": 7.48459005355835,
    "encoder_gradient_cosine_similarity": 8.19008731842041,
    "encoder_gradient_l2_distance": -29.133434295654297,
    "encoder_gradient_dot_product": 6.477674961090088,
    "input_gradient_cosine_similarity": 9.75427532196045,
    "input_gradient_l2_distance": -29.107894897460938,
    "input_gradient_dot_product": -22.47701072692871
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 12.30291748046875,
    "right_subspace_overlap_bottom_k": 15.38562297821045,
    "interaction_matrix_overlap_top_k": 17.342649459838867,
    "interaction_matrix_overlap_bottom_k": 15.661320686340332,
    "effective_rank": 11.577472686767578,
    "effective_rank_mergeability_score": 12.088871002197266,
    "stable_rank": 10.299169540405273,
    "spectral_gap": 9.567400932312012,
    "singular_value_ratio": 11.56169605255127,
    "layerwise_effective_rank": 21.21300506591797,
    "layerwise_effective_rank_mergeability_score": 17.80553436279297,
    "singular_value_overlap": 14.74803352355957,
    "subspace_overlap": 20.141372680664062,
    "right_subspace_overlap": 14.255441665649414,
    "activation_l2_distance": 10.894170761108398,
    "activation_cosine_similarity": 10.45805549621582,
    "activation_magnitude_ratio": 9.391753196716309,
    "activation_dot_product": 13.484771728515625,
    "encoder_gradient_cosine_similarity": 8.023262023925781,
    "encoder_gradient_l2_distance": 18.099227905273438,
    "encoder_gradient_dot_product": 6.375010013580322,
    "input_gradient_cosine_similarity": 7.414261817932129,
    "input_gradient_l2_distance": 11.51064682006836,
    "input_gradient_dot_product": 23.355955123901367
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.482610333252911,
      "val_r": 0.3822349686679651,
      "n_iterations": 616,
      "coefficients": {
        "right_subspace_overlap_top_k": 28.34377670288086,
        "right_subspace_overlap_bottom_k": -6.758167743682861,
        "interaction_matrix_overlap_top_k": 2.1974804401397705,
        "interaction_matrix_overlap_bottom_k": 26.167280197143555,
        "effective_rank": -25.3055419921875,
        "effective_rank_mergeability_score": -0.06970669329166412,
        "stable_rank": 2.0768160820007324,
        "spectral_gap": 10.609889030456543,
        "singular_value_ratio": -15.570098876953125,
        "layerwise_effective_rank": 19.285282135009766,
        "layerwise_effective_rank_mergeability_score": -14.283636093139648,
        "singular_value_overlap": -40.228179931640625,
        "subspace_overlap": 19.201799392700195,
        "right_subspace_overlap": 23.516876220703125,
        "activation_l2_distance": 4.390182971954346,
        "activation_cosine_similarity": 25.535503387451172,
        "activation_magnitude_ratio": -12.857666015625,
        "activation_dot_product": 22.97817611694336,
        "encoder_gradient_cosine_similarity": -3.4038660526275635,
        "encoder_gradient_l2_distance": -54.63661193847656,
        "encoder_gradient_dot_product": -9.435650825500488,
        "input_gradient_cosine_similarity": 19.667007446289062,
        "input_gradient_l2_distance": -15.899869918823242,
        "input_gradient_dot_product": -4.523545742034912
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5285297628054565,
      "val_r": 0.3652038125920084,
      "n_iterations": 934,
      "coefficients": {
        "right_subspace_overlap_top_k": -8.858386993408203,
        "right_subspace_overlap_bottom_k": 11.86046028137207,
        "interaction_matrix_overlap_top_k": 0.03186450153589249,
        "interaction_matrix_overlap_bottom_k": -8.442291259765625,
        "effective_rank": 17.81745719909668,
        "effective_rank_mergeability_score": -6.170420169830322,
        "stable_rank": -5.609588146209717,
        "spectral_gap": 12.92708969116211,
        "singular_value_ratio": -1.8408864736557007,
        "layerwise_effective_rank": 5.404196739196777,
        "layerwise_effective_rank_mergeability_score": 16.846141815185547,
        "singular_value_overlap": -9.980436325073242,
        "subspace_overlap": 2.3371832370758057,
        "right_subspace_overlap": 26.350269317626953,
        "activation_l2_distance": -5.13045597076416,
        "activation_cosine_similarity": 13.943649291992188,
        "activation_magnitude_ratio": -4.350587368011475,
        "activation_dot_product": -6.09344482421875,
        "encoder_gradient_cosine_similarity": -0.059561219066381454,
        "encoder_gradient_l2_distance": -21.988927841186523,
        "encoder_gradient_dot_product": 7.90430212020874,
        "input_gradient_cosine_similarity": 1.4288681745529175,
        "input_gradient_l2_distance": -23.848438262939453,
        "input_gradient_dot_product": -13.479629516601562
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.49898530233874716,
      "val_r": 0.41813261194714546,
      "n_iterations": 605,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.524658203125,
        "right_subspace_overlap_bottom_k": -14.113786697387695,
        "interaction_matrix_overlap_top_k": 21.242164611816406,
        "interaction_matrix_overlap_bottom_k": 20.982080459594727,
        "effective_rank": 7.344912528991699,
        "effective_rank_mergeability_score": 6.645753383636475,
        "stable_rank": 5.196351528167725,
        "spectral_gap": -6.92702579498291,
        "singular_value_ratio": -10.779349327087402,
        "layerwise_effective_rank": -16.43260955810547,
        "layerwise_effective_rank_mergeability_score": 8.427144050598145,
        "singular_value_overlap": -31.681917190551758,
        "subspace_overlap": 15.04929256439209,
        "right_subspace_overlap": 17.055652618408203,
        "activation_l2_distance": -9.144969940185547,
        "activation_cosine_similarity": 12.484496116638184,
        "activation_magnitude_ratio": -10.983078002929688,
        "activation_dot_product": 13.177202224731445,
        "encoder_gradient_cosine_similarity": 6.781496524810791,
        "encoder_gradient_l2_distance": -24.65355110168457,
        "encoder_gradient_dot_product": 9.719962120056152,
        "input_gradient_cosine_similarity": 15.923280715942383,
        "input_gradient_l2_distance": -31.223512649536133,
        "input_gradient_dot_product": -28.617162704467773
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5196210575704936,
      "val_r": 0.2750394992299855,
      "n_iterations": 735,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.340874195098877,
        "right_subspace_overlap_bottom_k": 2.994988441467285,
        "interaction_matrix_overlap_top_k": 14.656915664672852,
        "interaction_matrix_overlap_bottom_k": 4.70757532119751,
        "effective_rank": 3.534442901611328,
        "effective_rank_mergeability_score": 11.049209594726562,
        "stable_rank": -0.5490593314170837,
        "spectral_gap": 5.831988334655762,
        "singular_value_ratio": -4.155269145965576,
        "layerwise_effective_rank": 6.531237602233887,
        "layerwise_effective_rank_mergeability_score": 2.484354257583618,
        "singular_value_overlap": -22.05815315246582,
        "subspace_overlap": 16.20134925842285,
        "right_subspace_overlap": 10.62297248840332,
        "activation_l2_distance": -3.6043739318847656,
        "activation_cosine_similarity": 14.773627281188965,
        "activation_magnitude_ratio": -6.1379876136779785,
        "activation_dot_product": -0.7032983303070068,
        "encoder_gradient_cosine_similarity": 5.747458457946777,
        "encoder_gradient_l2_distance": -29.81177520751953,
        "encoder_gradient_dot_product": 3.2874717712402344,
        "input_gradient_cosine_similarity": 9.025246620178223,
        "input_gradient_l2_distance": -19.40557289123535,
        "input_gradient_dot_product": -27.366289138793945
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4396848478732758,
      "val_r": 0.4737826451449773,
      "n_iterations": 456,
      "coefficients": {
        "right_subspace_overlap_top_k": 18.220327377319336,
        "right_subspace_overlap_bottom_k": 20.856287002563477,
        "interaction_matrix_overlap_top_k": 38.07107925415039,
        "interaction_matrix_overlap_bottom_k": -13.365461349487305,
        "effective_rank": 28.445430755615234,
        "effective_rank_mergeability_score": 40.02216720581055,
        "stable_rank": -20.184350967407227,
        "spectral_gap": -7.051898002624512,
        "singular_value_ratio": 6.042202472686768,
        "layerwise_effective_rank": -40.888912200927734,
        "layerwise_effective_rank_mergeability_score": -31.90715980529785,
        "singular_value_overlap": -39.59371566772461,
        "subspace_overlap": 83.71076965332031,
        "right_subspace_overlap": 32.01662063598633,
        "activation_l2_distance": -36.72880554199219,
        "activation_cosine_similarity": 15.9818754196167,
        "activation_magnitude_ratio": -16.849868774414062,
        "activation_dot_product": 38.59208679199219,
        "encoder_gradient_cosine_similarity": 17.595367431640625,
        "encoder_gradient_l2_distance": -38.2269172668457,
        "encoder_gradient_dot_product": 6.2207932472229,
        "input_gradient_cosine_similarity": 30.94353485107422,
        "input_gradient_l2_distance": -47.711647033691406,
        "input_gradient_dot_product": -83.21305847167969
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.4981021774068783,
      "val_r": 0.6956005543086647,
      "n_iterations": 569,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.1641974449157715,
        "right_subspace_overlap_bottom_k": 1.679530143737793,
        "interaction_matrix_overlap_top_k": 16.596498489379883,
        "interaction_matrix_overlap_bottom_k": 15.221346855163574,
        "effective_rank": -2.5924952030181885,
        "effective_rank_mergeability_score": 4.120330810546875,
        "stable_rank": -3.154924154281616,
        "spectral_gap": -3.739504814147949,
        "singular_value_ratio": -2.0339760780334473,
        "layerwise_effective_rank": -2.9591028690338135,
        "layerwise_effective_rank_mergeability_score": 13.21554946899414,
        "singular_value_overlap": -27.692180633544922,
        "subspace_overlap": 14.29337215423584,
        "right_subspace_overlap": 17.899545669555664,
        "activation_l2_distance": -6.349045753479004,
        "activation_cosine_similarity": 11.502598762512207,
        "activation_magnitude_ratio": -6.000173568725586,
        "activation_dot_product": 17.22829818725586,
        "encoder_gradient_cosine_similarity": 11.314677238464355,
        "encoder_gradient_l2_distance": -30.582876205444336,
        "encoder_gradient_dot_product": 0.11348126828670502,
        "input_gradient_cosine_similarity": 12.212714195251465,
        "input_gradient_l2_distance": -22.432661056518555,
        "input_gradient_dot_product": -31.027801513671875
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.4648804040623954,
      "val_r": 0.23663304192174547,
      "n_iterations": 544,
      "coefficients": {
        "right_subspace_overlap_top_k": 34.36361312866211,
        "right_subspace_overlap_bottom_k": -23.328218460083008,
        "interaction_matrix_overlap_top_k": -25.751977920532227,
        "interaction_matrix_overlap_bottom_k": -3.939565658569336,
        "effective_rank": 10.442103385925293,
        "effective_rank_mergeability_score": -12.383810043334961,
        "stable_rank": -16.137964248657227,
        "spectral_gap": 3.465789794921875,
        "singular_value_ratio": 14.223567008972168,
        "layerwise_effective_rank": -47.29713439941406,
        "layerwise_effective_rank_mergeability_score": 0.6019549369812012,
        "singular_value_overlap": -45.6707649230957,
        "subspace_overlap": 50.73278045654297,
        "right_subspace_overlap": 39.72226333618164,
        "activation_l2_distance": -12.341073989868164,
        "activation_cosine_similarity": 52.859649658203125,
        "activation_magnitude_ratio": 26.619535446166992,
        "activation_dot_product": -1.1250113248825073,
        "encoder_gradient_cosine_similarity": 34.339195251464844,
        "encoder_gradient_l2_distance": -92.52062225341797,
        "encoder_gradient_dot_product": 11.629029273986816,
        "input_gradient_cosine_similarity": 10.070840835571289,
        "input_gradient_l2_distance": -43.461814880371094,
        "input_gradient_dot_product": 35.884849548339844
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.38390612253702466,
      "val_r": -0.018793645977256274,
      "n_iterations": 629,
      "coefficients": {
        "right_subspace_overlap_top_k": 30.16448402404785,
        "right_subspace_overlap_bottom_k": 11.402137756347656,
        "interaction_matrix_overlap_top_k": 6.709160327911377,
        "interaction_matrix_overlap_bottom_k": -2.312346935272217,
        "effective_rank": -7.781772613525391,
        "effective_rank_mergeability_score": -12.785612106323242,
        "stable_rank": -5.2906718254089355,
        "spectral_gap": 18.713550567626953,
        "singular_value_ratio": -16.37509536743164,
        "layerwise_effective_rank": -10.00205135345459,
        "layerwise_effective_rank_mergeability_score": -19.932491302490234,
        "singular_value_overlap": 13.144667625427246,
        "subspace_overlap": 18.183813095092773,
        "right_subspace_overlap": 24.552318572998047,
        "activation_l2_distance": -30.806888580322266,
        "activation_cosine_similarity": 3.9938464164733887,
        "activation_magnitude_ratio": -21.813020706176758,
        "activation_dot_product": 22.384389877319336,
        "encoder_gradient_cosine_similarity": 12.180599212646484,
        "encoder_gradient_l2_distance": -27.33077621459961,
        "encoder_gradient_dot_product": 13.756980895996094,
        "input_gradient_cosine_similarity": 7.270514488220215,
        "input_gradient_l2_distance": -30.77480697631836,
        "input_gradient_dot_product": 3.7465672492980957
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5462877983803647,
      "val_r": 0.06638855348031472,
      "n_iterations": 830,
      "coefficients": {
        "right_subspace_overlap_top_k": 20.101545333862305,
        "right_subspace_overlap_bottom_k": -4.670459270477295,
        "interaction_matrix_overlap_top_k": 4.121395587921143,
        "interaction_matrix_overlap_bottom_k": 6.266798973083496,
        "effective_rank": -2.8596513271331787,
        "effective_rank_mergeability_score": 5.272651195526123,
        "stable_rank": 9.409390449523926,
        "spectral_gap": 2.3062052726745605,
        "singular_value_ratio": -1.1185762882232666,
        "layerwise_effective_rank": 5.742580890655518,
        "layerwise_effective_rank_mergeability_score": 17.171152114868164,
        "singular_value_overlap": -14.429375648498535,
        "subspace_overlap": 1.740536093711853,
        "right_subspace_overlap": -0.2518955171108246,
        "activation_l2_distance": -6.7803239822387695,
        "activation_cosine_similarity": 9.962695121765137,
        "activation_magnitude_ratio": -1.969326138496399,
        "activation_dot_product": -1.0783077478408813,
        "encoder_gradient_cosine_similarity": 8.140018463134766,
        "encoder_gradient_l2_distance": -18.73501205444336,
        "encoder_gradient_dot_product": 4.55377197265625,
        "input_gradient_cosine_similarity": 2.8606271743774414,
        "input_gradient_l2_distance": -23.582368850708008,
        "input_gradient_dot_product": -21.175888061523438
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5010041868451925,
      "val_r": 0.5157814776660087,
      "n_iterations": 590,
      "coefficients": {
        "right_subspace_overlap_top_k": 16.04686164855957,
        "right_subspace_overlap_bottom_k": -25.659870147705078,
        "interaction_matrix_overlap_top_k": 14.289681434631348,
        "interaction_matrix_overlap_bottom_k": 33.90150833129883,
        "effective_rank": -2.6856346130371094,
        "effective_rank_mergeability_score": 21.041484832763672,
        "stable_rank": 1.9588543176651,
        "spectral_gap": -16.521240234375,
        "singular_value_ratio": -25.391742706298828,
        "layerwise_effective_rank": 46.17119216918945,
        "layerwise_effective_rank_mergeability_score": 34.028411865234375,
        "singular_value_overlap": -38.65129089355469,
        "subspace_overlap": 11.58993911743164,
        "right_subspace_overlap": 35.79671859741211,
        "activation_l2_distance": -12.963349342346191,
        "activation_cosine_similarity": 5.564289093017578,
        "activation_magnitude_ratio": -8.938560485839844,
        "activation_dot_product": 0.9871547818183899,
        "encoder_gradient_cosine_similarity": 12.271106719970703,
        "encoder_gradient_l2_distance": -35.7931022644043,
        "encoder_gradient_dot_product": 10.447818756103516,
        "input_gradient_cosine_similarity": 3.3294365406036377,
        "input_gradient_l2_distance": -36.235660552978516,
        "input_gradient_dot_product": -43.58653259277344
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5026142442995892,
      "val_r": 0.2448288042192334,
      "n_iterations": 655,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.814764022827148,
        "right_subspace_overlap_bottom_k": 4.796172618865967,
        "interaction_matrix_overlap_top_k": 4.378621578216553,
        "interaction_matrix_overlap_bottom_k": 9.21117877960205,
        "effective_rank": -9.806722640991211,
        "effective_rank_mergeability_score": 10.59415054321289,
        "stable_rank": 1.4740495681762695,
        "spectral_gap": 17.9252872467041,
        "singular_value_ratio": 14.042969703674316,
        "layerwise_effective_rank": 0.4206969141960144,
        "layerwise_effective_rank_mergeability_score": -11.481852531433105,
        "singular_value_overlap": -11.41766357421875,
        "subspace_overlap": 14.315881729125977,
        "right_subspace_overlap": -8.579792022705078,
        "activation_l2_distance": -9.758255004882812,
        "activation_cosine_similarity": 13.69425106048584,
        "activation_magnitude_ratio": -3.3749330043792725,
        "activation_dot_product": 8.704119682312012,
        "encoder_gradient_cosine_similarity": 0.9208440780639648,
        "encoder_gradient_l2_distance": -25.763463973999023,
        "encoder_gradient_dot_product": -3.315430164337158,
        "input_gradient_cosine_similarity": 8.999175071716309,
        "input_gradient_l2_distance": -19.400890350341797,
        "input_gradient_dot_product": -15.395469665527344
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.48100809722913146,
      "val_r": 0.36786251413269044,
      "n_iterations": 739,
      "coefficients": {
        "right_subspace_overlap_top_k": 13.015987396240234,
        "right_subspace_overlap_bottom_k": 4.547016620635986,
        "interaction_matrix_overlap_top_k": 13.453898429870605,
        "interaction_matrix_overlap_bottom_k": 20.518047332763672,
        "effective_rank": 7.128629684448242,
        "effective_rank_mergeability_score": 12.557836532592773,
        "stable_rank": 2.2873053550720215,
        "spectral_gap": 8.063555717468262,
        "singular_value_ratio": -17.185102462768555,
        "layerwise_effective_rank": -15.286038398742676,
        "layerwise_effective_rank_mergeability_score": -26.548070907592773,
        "singular_value_overlap": -34.34156036376953,
        "subspace_overlap": 33.052371978759766,
        "right_subspace_overlap": 15.17734432220459,
        "activation_l2_distance": 0.6535686254501343,
        "activation_cosine_similarity": 12.855071067810059,
        "activation_magnitude_ratio": -17.180130004882812,
        "activation_dot_product": 26.13164520263672,
        "encoder_gradient_cosine_similarity": 10.391432762145996,
        "encoder_gradient_l2_distance": -22.156707763671875,
        "encoder_gradient_dot_product": 17.99951934814453,
        "input_gradient_cosine_similarity": 21.324935913085938,
        "input_gradient_l2_distance": -34.35320281982422,
        "input_gradient_dot_product": -51.10947036743164
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.500140525439878,
      "val_r": 0.5187006504067804,
      "n_iterations": 930,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.205684661865234,
        "right_subspace_overlap_bottom_k": -7.976184844970703,
        "interaction_matrix_overlap_top_k": 6.913715362548828,
        "interaction_matrix_overlap_bottom_k": 17.038724899291992,
        "effective_rank": 7.991059303283691,
        "effective_rank_mergeability_score": -2.9873645305633545,
        "stable_rank": -5.410268306732178,
        "spectral_gap": 4.887261867523193,
        "singular_value_ratio": -2.815995454788208,
        "layerwise_effective_rank": 2.2783312797546387,
        "layerwise_effective_rank_mergeability_score": 6.687589645385742,
        "singular_value_overlap": -18.404014587402344,
        "subspace_overlap": 9.968561172485352,
        "right_subspace_overlap": -8.164932250976562,
        "activation_l2_distance": -5.236979961395264,
        "activation_cosine_similarity": 8.082941055297852,
        "activation_magnitude_ratio": -3.838413953781128,
        "activation_dot_product": 4.19374942779541,
        "encoder_gradient_cosine_similarity": 6.441166877746582,
        "encoder_gradient_l2_distance": -3.4438071250915527,
        "encoder_gradient_dot_product": 7.101759910583496,
        "input_gradient_cosine_similarity": 5.686378479003906,
        "input_gradient_l2_distance": -37.36528778076172,
        "input_gradient_dot_product": -12.835304260253906
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5221695048301316,
      "val_r": 0.6434024923215454,
      "n_iterations": 630,
      "coefficients": {
        "right_subspace_overlap_top_k": 14.548479080200195,
        "right_subspace_overlap_bottom_k": 1.6222083568572998,
        "interaction_matrix_overlap_top_k": 26.272836685180664,
        "interaction_matrix_overlap_bottom_k": -4.252975940704346,
        "effective_rank": -0.30378395318984985,
        "effective_rank_mergeability_score": 2.4934186935424805,
        "stable_rank": 7.9804229736328125,
        "spectral_gap": 1.635521411895752,
        "singular_value_ratio": -2.8908936977386475,
        "layerwise_effective_rank": 6.096875190734863,
        "layerwise_effective_rank_mergeability_score": 20.437593460083008,
        "singular_value_overlap": -26.513227462768555,
        "subspace_overlap": 3.9045755863189697,
        "right_subspace_overlap": 13.590985298156738,
        "activation_l2_distance": -10.31240463256836,
        "activation_cosine_similarity": 23.12145233154297,
        "activation_magnitude_ratio": -4.522274494171143,
        "activation_dot_product": -13.202826499938965,
        "encoder_gradient_cosine_similarity": 8.640678405761719,
        "encoder_gradient_l2_distance": -26.99661636352539,
        "encoder_gradient_dot_product": 15.403068542480469,
        "input_gradient_cosine_similarity": 5.481928825378418,
        "input_gradient_l2_distance": -33.71028518676758,
        "input_gradient_dot_product": -27.527109146118164
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4896686266088885,
      "val_r": 0.5829208081989534,
      "n_iterations": 846,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.04617166519165,
        "right_subspace_overlap_bottom_k": 4.405786991119385,
        "interaction_matrix_overlap_top_k": 14.152901649475098,
        "interaction_matrix_overlap_bottom_k": -5.780767440795898,
        "effective_rank": -0.056106481701135635,
        "effective_rank_mergeability_score": 17.20401382446289,
        "stable_rank": 14.999956130981445,
        "spectral_gap": 14.905328750610352,
        "singular_value_ratio": 1.902814269065857,
        "layerwise_effective_rank": -1.3214912414550781,
        "layerwise_effective_rank_mergeability_score": -3.2099311351776123,
        "singular_value_overlap": -8.849286079406738,
        "subspace_overlap": 8.895751953125,
        "right_subspace_overlap": 3.338717222213745,
        "activation_l2_distance": -7.655126571655273,
        "activation_cosine_similarity": 16.51741600036621,
        "activation_magnitude_ratio": -3.9898011684417725,
        "activation_dot_product": 1.8398492336273193,
        "encoder_gradient_cosine_similarity": 3.919687032699585,
        "encoder_gradient_l2_distance": -31.066755294799805,
        "encoder_gradient_dot_product": 8.620369911193848,
        "input_gradient_cosine_similarity": 2.985475540161133,
        "input_gradient_l2_distance": -31.002521514892578,
        "input_gradient_dot_product": -26.804256439208984
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.46949247734394556,
      "val_r": 0.35973416354973664,
      "n_iterations": 487,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.778474807739258,
        "right_subspace_overlap_bottom_k": -48.407371520996094,
        "interaction_matrix_overlap_top_k": 62.053794860839844,
        "interaction_matrix_overlap_bottom_k": 47.78425598144531,
        "effective_rank": 4.692432880401611,
        "effective_rank_mergeability_score": 3.9537241458892822,
        "stable_rank": -30.366424560546875,
        "spectral_gap": 6.540866374969482,
        "singular_value_ratio": 22.407272338867188,
        "layerwise_effective_rank": -46.3310661315918,
        "layerwise_effective_rank_mergeability_score": -34.59324264526367,
        "singular_value_overlap": -8.054335594177246,
        "subspace_overlap": 38.26561737060547,
        "right_subspace_overlap": -11.251408576965332,
        "activation_l2_distance": 12.184394836425781,
        "activation_cosine_similarity": 24.639284133911133,
        "activation_magnitude_ratio": -4.199883460998535,
        "activation_dot_product": 22.551513671875,
        "encoder_gradient_cosine_similarity": 13.91691780090332,
        "encoder_gradient_l2_distance": -25.372835159301758,
        "encoder_gradient_dot_product": 9.286083221435547,
        "input_gradient_cosine_similarity": 7.867395877838135,
        "input_gradient_l2_distance": -54.04069519042969,
        "input_gradient_dot_product": -38.30792236328125
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5048021903936567,
      "val_r": 0.3635926198699961,
      "n_iterations": 669,
      "coefficients": {
        "right_subspace_overlap_top_k": 24.011159896850586,
        "right_subspace_overlap_bottom_k": -14.26430606842041,
        "interaction_matrix_overlap_top_k": 29.115068435668945,
        "interaction_matrix_overlap_bottom_k": 13.114598274230957,
        "effective_rank": 15.155768394470215,
        "effective_rank_mergeability_score": 4.450618267059326,
        "stable_rank": -6.993777751922607,
        "spectral_gap": -2.653700590133667,
        "singular_value_ratio": -12.564436912536621,
        "layerwise_effective_rank": -6.9868550300598145,
        "layerwise_effective_rank_mergeability_score": 0.646597146987915,
        "singular_value_overlap": -21.136974334716797,
        "subspace_overlap": -1.5782440900802612,
        "right_subspace_overlap": 10.360011100769043,
        "activation_l2_distance": 4.645589828491211,
        "activation_cosine_similarity": 20.44314956665039,
        "activation_magnitude_ratio": -3.3144776821136475,
        "activation_dot_product": 8.726139068603516,
        "encoder_gradient_cosine_similarity": 10.63953971862793,
        "encoder_gradient_l2_distance": -26.117351531982422,
        "encoder_gradient_dot_product": 10.149064064025879,
        "input_gradient_cosine_similarity": 12.300726890563965,
        "input_gradient_l2_distance": -30.024229049682617,
        "input_gradient_dot_product": -37.1259880065918
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5644945640931007,
      "val_r": 0.4052663643434628,
      "n_iterations": 876,
      "coefficients": {
        "right_subspace_overlap_top_k": -9.83307933807373,
        "right_subspace_overlap_bottom_k": -20.709062576293945,
        "interaction_matrix_overlap_top_k": 1.8666051626205444,
        "interaction_matrix_overlap_bottom_k": 33.99951171875,
        "effective_rank": 21.884965896606445,
        "effective_rank_mergeability_score": -1.7419672012329102,
        "stable_rank": 7.296547889709473,
        "spectral_gap": 18.372098922729492,
        "singular_value_ratio": 4.518306255340576,
        "layerwise_effective_rank": -16.429763793945312,
        "layerwise_effective_rank_mergeability_score": 11.634916305541992,
        "singular_value_overlap": -13.58568000793457,
        "subspace_overlap": 15.590353965759277,
        "right_subspace_overlap": 11.03969669342041,
        "activation_l2_distance": -10.445063591003418,
        "activation_cosine_similarity": 17.563045501708984,
        "activation_magnitude_ratio": -3.359941005706787,
        "activation_dot_product": -13.574869155883789,
        "encoder_gradient_cosine_similarity": 2.923401117324829,
        "encoder_gradient_l2_distance": -27.17943572998047,
        "encoder_gradient_dot_product": 2.8247573375701904,
        "input_gradient_cosine_similarity": 12.160245895385742,
        "input_gradient_l2_distance": -26.762943267822266,
        "input_gradient_dot_product": -17.054109573364258
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8233188948042487,
      "val_r": 0.662957108585699,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.6014306545257568,
        "right_subspace_overlap_bottom_k": -4.074592590332031,
        "interaction_matrix_overlap_top_k": -0.826973557472229,
        "interaction_matrix_overlap_bottom_k": 2.800565481185913,
        "effective_rank": 1.5456328392028809,
        "effective_rank_mergeability_score": -0.5030186176300049,
        "stable_rank": -1.75128173828125,
        "spectral_gap": -0.053071681410074234,
        "singular_value_ratio": 0.6120737195014954,
        "layerwise_effective_rank": 0.47056424617767334,
        "layerwise_effective_rank_mergeability_score": 1.9905920028686523,
        "singular_value_overlap": -0.38808542490005493,
        "subspace_overlap": -1.7078936100006104,
        "right_subspace_overlap": 2.7808899879455566,
        "activation_l2_distance": 1.3504196405410767,
        "activation_cosine_similarity": 2.7628636360168457,
        "activation_magnitude_ratio": -0.08436201512813568,
        "activation_dot_product": 0.06497076153755188,
        "encoder_gradient_cosine_similarity": 0.6199696063995361,
        "encoder_gradient_l2_distance": -3.2614006996154785,
        "encoder_gradient_dot_product": 0.5155867338180542,
        "input_gradient_cosine_similarity": 0.053047869354486465,
        "input_gradient_l2_distance": -2.3905837535858154,
        "input_gradient_dot_product": -1.127741813659668
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5689216550128565,
      "val_r": 0.31101471059460883,
      "n_iterations": 791,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.787262439727783,
        "right_subspace_overlap_bottom_k": -9.559259414672852,
        "interaction_matrix_overlap_top_k": 1.5860812664031982,
        "interaction_matrix_overlap_bottom_k": 12.806756973266602,
        "effective_rank": 6.095808029174805,
        "effective_rank_mergeability_score": -10.761011123657227,
        "stable_rank": -0.2551737129688263,
        "spectral_gap": 17.736587524414062,
        "singular_value_ratio": 6.014580726623535,
        "layerwise_effective_rank": -1.9261447191238403,
        "layerwise_effective_rank_mergeability_score": 9.321532249450684,
        "singular_value_overlap": -9.698254585266113,
        "subspace_overlap": -1.3566738367080688,
        "right_subspace_overlap": 2.527284622192383,
        "activation_l2_distance": -0.3536030054092407,
        "activation_cosine_similarity": 12.974482536315918,
        "activation_magnitude_ratio": 0.8567826151847839,
        "activation_dot_product": -2.089740037918091,
        "encoder_gradient_cosine_similarity": 0.4816034436225891,
        "encoder_gradient_l2_distance": -17.030179977416992,
        "encoder_gradient_dot_product": 2.7707583904266357,
        "input_gradient_cosine_similarity": 5.494122505187988,
        "input_gradient_l2_distance": -18.53087615966797,
        "input_gradient_dot_product": -8.894416809082031
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}