{
  "aggregate_metrics": {
    "train_r": 0.24492452865003247,
    "train_p": 3.17402985637274e-45,
    "val_r": 0.10151357665093144,
    "val_p": 0.05498818033981994
  },
  "per_fold_stats": {
    "train_r_mean": 0.5304529973560933,
    "train_r_std": 0.09549791960836355,
    "val_r_mean": 0.4067349523981342,
    "val_r_std": 0.15799383070988898
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 15.251970291137695,
    "right_subspace_overlap_bottom_k": 2.760052442550659,
    "interaction_matrix_overlap_top_k": 21.560771942138672,
    "interaction_matrix_overlap_bottom_k": 26.4493408203125,
    "effective_rank": 0.7705947756767273,
    "effective_rank_mergeability_score": 0.6480341553688049,
    "stable_rank": -11.98284912109375,
    "spectral_gap": 2.6140217781066895,
    "singular_value_ratio": -3.7376303672790527,
    "layerwise_effective_rank": -9.341665267944336,
    "layerwise_effective_rank_mergeability_score": -9.396736145019531,
    "task_vector_cosine_similarity": 5.314227104187012,
    "task_vector_l2_distance": -20.004880905151367,
    "task_vector_dot_product": 0.18795600533485413,
    "weight_space_angle": 4.805553436279297,
    "task_vector_magnitude_ratio": -3.4575753211975098,
    "singular_value_overlap": -21.135501861572266,
    "subspace_overlap": 6.9286370277404785,
    "right_subspace_overlap": 15.611178398132324,
    "activation_l2_distance": 0.7871624827384949,
    "activation_cosine_similarity": 9.998977661132812,
    "activation_magnitude_ratio": -13.819186210632324,
    "activation_dot_product": 14.594337463378906,
    "encoder_gradient_cosine_similarity": 16.364322662353516,
    "encoder_gradient_l2_distance": -26.2069034576416,
    "encoder_gradient_dot_product": 20.15337562561035,
    "input_gradient_cosine_similarity": 15.079889297485352,
    "input_gradient_l2_distance": -31.532512664794922,
    "input_gradient_dot_product": -28.273250579833984
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 25.391090393066406,
    "right_subspace_overlap_bottom_k": 26.849031448364258,
    "interaction_matrix_overlap_top_k": 34.47611618041992,
    "interaction_matrix_overlap_bottom_k": 53.826541900634766,
    "effective_rank": 19.256519317626953,
    "effective_rank_mergeability_score": 43.10554122924805,
    "stable_rank": 30.524980545043945,
    "spectral_gap": 18.345239639282227,
    "singular_value_ratio": 23.031044006347656,
    "layerwise_effective_rank": 29.315549850463867,
    "layerwise_effective_rank_mergeability_score": 24.065414428710938,
    "task_vector_cosine_similarity": 14.401755332946777,
    "task_vector_l2_distance": 30.135807037353516,
    "task_vector_dot_product": 12.94448471069336,
    "weight_space_angle": 18.672029495239258,
    "task_vector_magnitude_ratio": 23.814903259277344,
    "singular_value_overlap": 27.911853790283203,
    "subspace_overlap": 19.685285568237305,
    "right_subspace_overlap": 23.904661178588867,
    "activation_l2_distance": 9.71066665649414,
    "activation_cosine_similarity": 16.80158042907715,
    "activation_magnitude_ratio": 30.308298110961914,
    "activation_dot_product": 18.696733474731445,
    "encoder_gradient_cosine_similarity": 24.65271759033203,
    "encoder_gradient_l2_distance": 26.553253173828125,
    "encoder_gradient_dot_product": 29.480791091918945,
    "input_gradient_cosine_similarity": 18.92156410217285,
    "input_gradient_l2_distance": 32.93882751464844,
    "input_gradient_dot_product": 43.21636199951172
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5012324981395968,
      "val_r": 0.44649294059644934,
      "n_iterations": 729,
      "coefficients": {
        "right_subspace_overlap_top_k": -10.79191780090332,
        "right_subspace_overlap_bottom_k": 13.634425163269043,
        "interaction_matrix_overlap_top_k": 60.871482849121094,
        "interaction_matrix_overlap_bottom_k": 104.17683410644531,
        "effective_rank": 56.96668243408203,
        "effective_rank_mergeability_score": -8.888720512390137,
        "stable_rank": -48.89186477661133,
        "spectral_gap": 36.626380920410156,
        "singular_value_ratio": -28.093387603759766,
        "layerwise_effective_rank": -37.48271942138672,
        "layerwise_effective_rank_mergeability_score": -22.41193389892578,
        "task_vector_cosine_similarity": 45.99231719970703,
        "task_vector_l2_distance": -78.60530853271484,
        "task_vector_dot_product": 25.38918113708496,
        "weight_space_angle": 8.991119384765625,
        "task_vector_magnitude_ratio": 9.583780288696289,
        "singular_value_overlap": -80.7516860961914,
        "subspace_overlap": 20.896488189697266,
        "right_subspace_overlap": 63.2941780090332,
        "activation_l2_distance": 11.50796890258789,
        "activation_cosine_similarity": 59.403541564941406,
        "activation_magnitude_ratio": -77.0784912109375,
        "activation_dot_product": 63.41400146484375,
        "encoder_gradient_cosine_similarity": 3.5290210247039795,
        "encoder_gradient_l2_distance": -53.77997589111328,
        "encoder_gradient_dot_product": 48.16864013671875,
        "input_gradient_cosine_similarity": 41.995452880859375,
        "input_gradient_l2_distance": -73.03117370605469,
        "input_gradient_dot_product": -153.63650512695312
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.593654161590368,
      "val_r": 0.5874444869340101,
      "n_iterations": 570,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.31997251510620117,
        "right_subspace_overlap_bottom_k": -0.27758461236953735,
        "interaction_matrix_overlap_top_k": 1.4864237308502197,
        "interaction_matrix_overlap_bottom_k": 2.2905962467193604,
        "effective_rank": 1.1336185932159424,
        "effective_rank_mergeability_score": -0.22717365622520447,
        "stable_rank": -1.0037786960601807,
        "spectral_gap": 2.3324623107910156,
        "singular_value_ratio": 1.5124247074127197,
        "layerwise_effective_rank": 0.034011393785476685,
        "layerwise_effective_rank_mergeability_score": 0.5514737963676453,
        "task_vector_cosine_similarity": -0.8334976434707642,
        "task_vector_l2_distance": -2.264190435409546,
        "task_vector_dot_product": 0.1455981433391571,
        "weight_space_angle": 0.9462910890579224,
        "task_vector_magnitude_ratio": 0.0732719898223877,
        "singular_value_overlap": -1.637311339378357,
        "subspace_overlap": 1.0001862049102783,
        "right_subspace_overlap": 0.3657078146934509,
        "activation_l2_distance": 0.6427633762359619,
        "activation_cosine_similarity": 1.2904913425445557,
        "activation_magnitude_ratio": -0.5059384107589722,
        "activation_dot_product": -0.034224916249513626,
        "encoder_gradient_cosine_similarity": 0.28630101680755615,
        "encoder_gradient_l2_distance": -3.492976188659668,
        "encoder_gradient_dot_product": 0.4521086513996124,
        "input_gradient_cosine_similarity": 0.30490005016326904,
        "input_gradient_l2_distance": -2.312614917755127,
        "input_gradient_dot_product": -0.9394665956497192
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5313387286287222,
      "val_r": 0.46858758581286847,
      "n_iterations": 464,
      "coefficients": {
        "right_subspace_overlap_top_k": 11.123887062072754,
        "right_subspace_overlap_bottom_k": 0.029667779803276062,
        "interaction_matrix_overlap_top_k": 23.423925399780273,
        "interaction_matrix_overlap_bottom_k": 2.130774974822998,
        "effective_rank": -2.7010529041290283,
        "effective_rank_mergeability_score": 13.231605529785156,
        "stable_rank": -3.2858808040618896,
        "spectral_gap": 12.699238777160645,
        "singular_value_ratio": 11.009332656860352,
        "layerwise_effective_rank": -23.111167907714844,
        "layerwise_effective_rank_mergeability_score": -19.52268409729004,
        "task_vector_cosine_similarity": 8.087801933288574,
        "task_vector_l2_distance": -6.100175380706787,
        "task_vector_dot_product": 1.6652311086654663,
        "weight_space_angle": 13.482682228088379,
        "task_vector_magnitude_ratio": 8.198013305664062,
        "singular_value_overlap": -23.924240112304688,
        "subspace_overlap": 2.852480173110962,
        "right_subspace_overlap": 16.227109909057617,
        "activation_l2_distance": 3.8984475135803223,
        "activation_cosine_similarity": 28.459529876708984,
        "activation_magnitude_ratio": -3.9972240924835205,
        "activation_dot_product": -3.5780906677246094,
        "encoder_gradient_cosine_similarity": 8.373799324035645,
        "encoder_gradient_l2_distance": -33.142974853515625,
        "encoder_gradient_dot_product": 4.9955153465271,
        "input_gradient_cosine_similarity": 9.240973472595215,
        "input_gradient_l2_distance": -26.504030227661133,
        "input_gradient_dot_product": -32.265594482421875
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.45377669717221586,
      "val_r": 0.27832254090156516,
      "n_iterations": 81,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.0154435634613037,
        "right_subspace_overlap_bottom_k": 1.3776071071624756,
        "interaction_matrix_overlap_top_k": 5.845307350158691,
        "interaction_matrix_overlap_bottom_k": -0.2982182800769806,
        "effective_rank": 2.3093607425689697,
        "effective_rank_mergeability_score": 8.558171272277832,
        "stable_rank": 8.705137252807617,
        "spectral_gap": 0.32301339507102966,
        "singular_value_ratio": 4.111536502838135,
        "layerwise_effective_rank": -7.359975814819336,
        "layerwise_effective_rank_mergeability_score": 0.7346417307853699,
        "task_vector_cosine_similarity": -3.121464729309082,
        "task_vector_l2_distance": -1.2421377897262573,
        "task_vector_dot_product": 1.3121707439422607,
        "weight_space_angle": -6.217233657836914,
        "task_vector_magnitude_ratio": -2.113738536834717,
        "singular_value_overlap": -4.401858806610107,
        "subspace_overlap": -3.642184257507324,
        "right_subspace_overlap": 3.49302339553833,
        "activation_l2_distance": 0.4021044373512268,
        "activation_cosine_similarity": 3.5068185329437256,
        "activation_magnitude_ratio": -0.2658998966217041,
        "activation_dot_product": -1.7939378023147583,
        "encoder_gradient_cosine_similarity": -2.369215726852417,
        "encoder_gradient_l2_distance": -4.715723991394043,
        "encoder_gradient_dot_product": 2.9081239700317383,
        "input_gradient_cosine_similarity": -0.9255454540252686,
        "input_gradient_l2_distance": -3.378329038619995,
        "input_gradient_dot_product": -1.7761293649673462
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4451218740758496,
      "val_r": 0.4238549746554788,
      "n_iterations": 64,
      "coefficients": {
        "right_subspace_overlap_top_k": 11.595870971679688,
        "right_subspace_overlap_bottom_k": -3.748995065689087,
        "interaction_matrix_overlap_top_k": -2.4964687824249268,
        "interaction_matrix_overlap_bottom_k": 5.219600677490234,
        "effective_rank": -2.0750129222869873,
        "effective_rank_mergeability_score": -0.505033552646637,
        "stable_rank": -6.758187294006348,
        "spectral_gap": -1.4749338626861572,
        "singular_value_ratio": 1.9493128061294556,
        "layerwise_effective_rank": 11.284605026245117,
        "layerwise_effective_rank_mergeability_score": -0.051148366183042526,
        "task_vector_cosine_similarity": 6.5288496017456055,
        "task_vector_l2_distance": 1.1087009906768799,
        "task_vector_dot_product": -11.556818962097168,
        "weight_space_angle": -11.314127922058105,
        "task_vector_magnitude_ratio": -8.214138984680176,
        "singular_value_overlap": -3.8234574794769287,
        "subspace_overlap": 4.424465179443359,
        "right_subspace_overlap": 3.725329637527466,
        "activation_l2_distance": -3.516353130340576,
        "activation_cosine_similarity": -1.6215287446975708,
        "activation_magnitude_ratio": 3.072103500366211,
        "activation_dot_product": 10.59032154083252,
        "encoder_gradient_cosine_similarity": 4.754327297210693,
        "encoder_gradient_l2_distance": -7.057869911193848,
        "encoder_gradient_dot_product": 9.328828811645508,
        "input_gradient_cosine_similarity": 8.898133277893066,
        "input_gradient_l2_distance": -6.174816131591797,
        "input_gradient_dot_product": -11.115640640258789
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.2939932432191886,
      "val_r": 0.4550408462957205,
      "n_iterations": 498,
      "coefficients": {
        "right_subspace_overlap_top_k": 96.02865600585938,
        "right_subspace_overlap_bottom_k": 104.18041229248047,
        "interaction_matrix_overlap_top_k": 46.062347412109375,
        "interaction_matrix_overlap_bottom_k": 219.11691284179688,
        "effective_rank": 8.256997108459473,
        "effective_rank_mergeability_score": -177.09092712402344,
        "stable_rank": -109.30901336669922,
        "spectral_gap": 44.407649993896484,
        "singular_value_ratio": 17.070711135864258,
        "layerwise_effective_rank": -120.34727478027344,
        "layerwise_effective_rank_mergeability_score": -29.33827781677246,
        "task_vector_cosine_similarity": -8.832879066467285,
        "task_vector_l2_distance": 5.395580291748047,
        "task_vector_dot_product": -42.051475524902344,
        "weight_space_angle": 22.45985221862793,
        "task_vector_magnitude_ratio": -99.68523406982422,
        "singular_value_overlap": 21.22843360900879,
        "subspace_overlap": -21.16972541809082,
        "right_subspace_overlap": 79.05936431884766,
        "activation_l2_distance": -22.346166610717773,
        "activation_cosine_similarity": -17.692142486572266,
        "activation_magnitude_ratio": -120.33917236328125,
        "activation_dot_product": 26.79765510559082,
        "encoder_gradient_cosine_similarity": 94.21806335449219,
        "encoder_gradient_l2_distance": -21.932159423828125,
        "encoder_gradient_dot_product": 125.28096008300781,
        "input_gradient_cosine_similarity": 56.382240295410156,
        "input_gradient_l2_distance": -101.91633605957031,
        "input_gradient_dot_product": -72.8982162475586
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5113859975555461,
      "val_r": 0.25617774178436953,
      "n_iterations": 97,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.184262752532959,
        "right_subspace_overlap_bottom_k": 0.7305101752281189,
        "interaction_matrix_overlap_top_k": 2.0509588718414307,
        "interaction_matrix_overlap_bottom_k": 1.7377036809921265,
        "effective_rank": 0.4482249319553375,
        "effective_rank_mergeability_score": -0.23211310803890228,
        "stable_rank": -1.1294587850570679,
        "spectral_gap": 0.27300772070884705,
        "singular_value_ratio": 0.15415610373020172,
        "layerwise_effective_rank": -0.822769820690155,
        "layerwise_effective_rank_mergeability_score": 0.8438687324523926,
        "task_vector_cosine_similarity": 1.1977683305740356,
        "task_vector_l2_distance": -2.1392838954925537,
        "task_vector_dot_product": -0.7376183867454529,
        "weight_space_angle": 0.815792977809906,
        "task_vector_magnitude_ratio": -0.30504655838012695,
        "singular_value_overlap": -3.76122784614563,
        "subspace_overlap": 2.7080202102661133,
        "right_subspace_overlap": 2.2668724060058594,
        "activation_l2_distance": -1.3317315578460693,
        "activation_cosine_similarity": 1.7916761636734009,
        "activation_magnitude_ratio": 1.1958757638931274,
        "activation_dot_product": 0.926642656326294,
        "encoder_gradient_cosine_similarity": 1.795755386352539,
        "encoder_gradient_l2_distance": -4.148499965667725,
        "encoder_gradient_dot_product": 2.5485646724700928,
        "input_gradient_cosine_similarity": -0.4985980987548828,
        "input_gradient_l2_distance": -2.5648796558380127,
        "input_gradient_dot_product": -4.021543979644775
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5132266436646721,
      "val_r": 0.16193475469113167,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5715122222900391,
        "right_subspace_overlap_bottom_k": 0.36822187900543213,
        "interaction_matrix_overlap_top_k": 0.8623564839363098,
        "interaction_matrix_overlap_bottom_k": 0.5379340052604675,
        "effective_rank": -0.03277076408267021,
        "effective_rank_mergeability_score": 0.20688888430595398,
        "stable_rank": 0.107296422123909,
        "spectral_gap": 0.37690794467926025,
        "singular_value_ratio": 0.3052588701248169,
        "layerwise_effective_rank": 0.1531652957201004,
        "layerwise_effective_rank_mergeability_score": -0.22701424360275269,
        "task_vector_cosine_similarity": 0.3762451708316803,
        "task_vector_l2_distance": -1.586079716682434,
        "task_vector_dot_product": -0.44973427057266235,
        "weight_space_angle": 0.48238956928253174,
        "task_vector_magnitude_ratio": -0.7285875082015991,
        "singular_value_overlap": -0.7342870235443115,
        "subspace_overlap": 0.07014630734920502,
        "right_subspace_overlap": 0.8906176090240479,
        "activation_l2_distance": 0.25547271966934204,
        "activation_cosine_similarity": 0.2424730658531189,
        "activation_magnitude_ratio": -0.5345813035964966,
        "activation_dot_product": 0.6122154593467712,
        "encoder_gradient_cosine_similarity": 0.7637238502502441,
        "encoder_gradient_l2_distance": -1.2367770671844482,
        "encoder_gradient_dot_product": 0.2771410048007965,
        "input_gradient_cosine_similarity": 0.6572659015655518,
        "input_gradient_l2_distance": -1.7181692123413086,
        "input_gradient_dot_product": 0.09289349615573883
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5737726871331964,
      "val_r": 0.13201139612222865,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -6.006141662597656,
        "right_subspace_overlap_bottom_k": -42.544677734375,
        "interaction_matrix_overlap_top_k": 39.30878448486328,
        "interaction_matrix_overlap_bottom_k": 89.86554718017578,
        "effective_rank": -21.1973934173584,
        "effective_rank_mergeability_score": 26.168140411376953,
        "stable_rank": -31.059797286987305,
        "spectral_gap": 1.0352425575256348,
        "singular_value_ratio": 26.509273529052734,
        "layerwise_effective_rank": -16.51115608215332,
        "layerwise_effective_rank_mergeability_score": -10.188654899597168,
        "task_vector_cosine_similarity": 3.0042481422424316,
        "task_vector_l2_distance": -95.53699493408203,
        "task_vector_dot_product": 20.180871963500977,
        "weight_space_angle": 29.214336395263672,
        "task_vector_magnitude_ratio": -3.755281925201416,
        "singular_value_overlap": -60.818058013916016,
        "subspace_overlap": 39.912960052490234,
        "right_subspace_overlap": 61.79894256591797,
        "activation_l2_distance": 27.09375,
        "activation_cosine_similarity": 32.27980422973633,
        "activation_magnitude_ratio": -23.819215774536133,
        "activation_dot_product": 29.03558921813965,
        "encoder_gradient_cosine_similarity": 56.24105453491211,
        "encoder_gradient_l2_distance": -82.97402954101562,
        "encoder_gradient_dot_product": 45.55881881713867,
        "input_gradient_cosine_similarity": 15.373163223266602,
        "input_gradient_l2_distance": -67.1937484741211,
        "input_gradient_dot_product": -79.97698211669922
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5709532265669062,
      "val_r": 0.18616669333363448,
      "n_iterations": 107,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.2578989267349243,
        "right_subspace_overlap_bottom_k": 0.7860862016677856,
        "interaction_matrix_overlap_top_k": 0.4259584844112396,
        "interaction_matrix_overlap_bottom_k": 1.4078952074050903,
        "effective_rank": -1.1506894826889038,
        "effective_rank_mergeability_score": 0.11196590214967728,
        "stable_rank": 0.4532654583454132,
        "spectral_gap": 1.6534819602966309,
        "singular_value_ratio": 0.4862794280052185,
        "layerwise_effective_rank": 1.0222465991973877,
        "layerwise_effective_rank_mergeability_score": 0.3751743733882904,
        "task_vector_cosine_similarity": -0.12530608475208282,
        "task_vector_l2_distance": -2.9436371326446533,
        "task_vector_dot_product": -1.5773545503616333,
        "weight_space_angle": 0.7641453742980957,
        "task_vector_magnitude_ratio": 0.12622609734535217,
        "singular_value_overlap": -2.5934207439422607,
        "subspace_overlap": 2.141533613204956,
        "right_subspace_overlap": 1.6770334243774414,
        "activation_l2_distance": 1.3849897384643555,
        "activation_cosine_similarity": -0.7299240827560425,
        "activation_magnitude_ratio": -0.2608647048473358,
        "activation_dot_product": 0.9160833954811096,
        "encoder_gradient_cosine_similarity": 1.0876399278640747,
        "encoder_gradient_l2_distance": -1.9491276741027832,
        "encoder_gradient_dot_product": 1.6850813627243042,
        "input_gradient_cosine_similarity": 0.06863052397966385,
        "input_gradient_l2_distance": -2.760892868041992,
        "input_gradient_dot_product": -2.7508385181427
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5313701186352027,
      "val_r": 0.4508946813975813,
      "n_iterations": 68,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0007844012579880655,
        "right_subspace_overlap_bottom_k": -0.38032266497612,
        "interaction_matrix_overlap_top_k": 0.4176298975944519,
        "interaction_matrix_overlap_bottom_k": 1.4714969396591187,
        "effective_rank": -0.6936475038528442,
        "effective_rank_mergeability_score": 0.3968293368816376,
        "stable_rank": -0.9043840765953064,
        "spectral_gap": 0.8286277651786804,
        "singular_value_ratio": 0.8637908101081848,
        "layerwise_effective_rank": 0.42571011185646057,
        "layerwise_effective_rank_mergeability_score": -0.34440290927886963,
        "task_vector_cosine_similarity": 1.1618462800979614,
        "task_vector_l2_distance": -1.46199631690979,
        "task_vector_dot_product": -0.4962731599807739,
        "weight_space_angle": 0.4852708578109741,
        "task_vector_magnitude_ratio": 0.7077045440673828,
        "singular_value_overlap": -1.5726157426834106,
        "subspace_overlap": 0.11052609235048294,
        "right_subspace_overlap": 1.1767241954803467,
        "activation_l2_distance": 0.2899045944213867,
        "activation_cosine_similarity": 0.5893514156341553,
        "activation_magnitude_ratio": -0.0565374530851841,
        "activation_dot_product": 0.6798562407493591,
        "encoder_gradient_cosine_similarity": 0.36888349056243896,
        "encoder_gradient_l2_distance": -1.5270048379898071,
        "encoder_gradient_dot_product": 0.6045596599578857,
        "input_gradient_cosine_similarity": 1.0318254232406616,
        "input_gradient_l2_distance": -1.7454596757888794,
        "input_gradient_dot_product": -1.4438565969467163
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5113189133190287,
      "val_r": 0.4725446510523773,
      "n_iterations": 963,
      "coefficients": {
        "right_subspace_overlap_top_k": 21.81405258178711,
        "right_subspace_overlap_bottom_k": -17.245391845703125,
        "interaction_matrix_overlap_top_k": 104.73380279541016,
        "interaction_matrix_overlap_bottom_k": 39.64406204223633,
        "effective_rank": -13.06257152557373,
        "effective_rank_mergeability_score": 29.754871368408203,
        "stable_rank": -4.831271171569824,
        "spectral_gap": 19.50666046142578,
        "singular_value_ratio": -48.79582977294922,
        "layerwise_effective_rank": 10.91087818145752,
        "layerwise_effective_rank_mergeability_score": -88.17958068847656,
        "task_vector_cosine_similarity": -17.741220474243164,
        "task_vector_l2_distance": -11.9109525680542,
        "task_vector_dot_product": -1.9762715101242065,
        "weight_space_angle": 46.440887451171875,
        "task_vector_magnitude_ratio": -4.90252161026001,
        "singular_value_overlap": -67.85932159423828,
        "subspace_overlap": 45.93583297729492,
        "right_subspace_overlap": 25.103830337524414,
        "activation_l2_distance": 10.437338829040527,
        "activation_cosine_similarity": 28.601667404174805,
        "activation_magnitude_ratio": -20.953296661376953,
        "activation_dot_product": 50.396873474121094,
        "encoder_gradient_cosine_similarity": 24.235715866088867,
        "encoder_gradient_l2_distance": -46.32015609741211,
        "encoder_gradient_dot_product": 38.867462158203125,
        "input_gradient_cosine_similarity": 37.85570526123047,
        "input_gradient_l2_distance": -75.21228790283203,
        "input_gradient_dot_product": -114.2506332397461
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.529984414858288,
      "val_r": 0.5649769927925103,
      "n_iterations": 529,
      "coefficients": {
        "right_subspace_overlap_top_k": 23.600393295288086,
        "right_subspace_overlap_bottom_k": 31.82444190979004,
        "interaction_matrix_overlap_top_k": -29.165292739868164,
        "interaction_matrix_overlap_bottom_k": 2.3587000370025635,
        "effective_rank": -27.044431686401367,
        "effective_rank_mergeability_score": 37.039310455322266,
        "stable_rank": 40.732669830322266,
        "spectral_gap": 1.738634467124939,
        "singular_value_ratio": -5.633970260620117,
        "layerwise_effective_rank": -7.073736667633057,
        "layerwise_effective_rank_mergeability_score": -20.203813552856445,
        "task_vector_cosine_similarity": 27.910823822021484,
        "task_vector_l2_distance": -36.86201095581055,
        "task_vector_dot_product": 6.175471305847168,
        "weight_space_angle": -2.1185474395751953,
        "task_vector_magnitude_ratio": -1.4808518886566162,
        "singular_value_overlap": -26.220434188842773,
        "subspace_overlap": -4.435115337371826,
        "right_subspace_overlap": 15.92049503326416,
        "activation_l2_distance": 7.85397481918335,
        "activation_cosine_similarity": 11.963473320007324,
        "activation_magnitude_ratio": -2.1039459705352783,
        "activation_dot_product": 21.180654525756836,
        "encoder_gradient_cosine_similarity": 9.964482307434082,
        "encoder_gradient_l2_distance": -70.5561752319336,
        "encoder_gradient_dot_product": 14.622990608215332,
        "input_gradient_cosine_similarity": 15.697757720947266,
        "input_gradient_l2_distance": -45.03114700317383,
        "input_gradient_dot_product": 10.342446327209473
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5863983397318245,
      "val_r": 0.7185201530776644,
      "n_iterations": 75,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.22949621081352234,
        "right_subspace_overlap_bottom_k": 0.7372342348098755,
        "interaction_matrix_overlap_top_k": 1.048509955406189,
        "interaction_matrix_overlap_bottom_k": 0.2272128015756607,
        "effective_rank": -0.059840962290763855,
        "effective_rank_mergeability_score": 1.0424593687057495,
        "stable_rank": 0.736874520778656,
        "spectral_gap": 0.4104516804218292,
        "singular_value_ratio": 0.6426733136177063,
        "layerwise_effective_rank": -0.11396905779838562,
        "layerwise_effective_rank_mergeability_score": -0.22193381190299988,
        "task_vector_cosine_similarity": 0.08296886086463928,
        "task_vector_l2_distance": -1.1360865831375122,
        "task_vector_dot_product": -0.2332024723291397,
        "weight_space_angle": 0.5937795042991638,
        "task_vector_magnitude_ratio": -0.5045027136802673,
        "singular_value_overlap": -0.9604610800743103,
        "subspace_overlap": 0.9034358263015747,
        "right_subspace_overlap": -0.05055968835949898,
        "activation_l2_distance": 0.20953433215618134,
        "activation_cosine_similarity": 0.5786482095718384,
        "activation_magnitude_ratio": -0.23294970393180847,
        "activation_dot_product": 0.11497335135936737,
        "encoder_gradient_cosine_similarity": 0.10637543350458145,
        "encoder_gradient_l2_distance": -1.4216049909591675,
        "encoder_gradient_dot_product": 0.3554185628890991,
        "input_gradient_cosine_similarity": 0.3625856041908264,
        "input_gradient_l2_distance": -1.4552268981933594,
        "input_gradient_dot_product": -0.5405555367469788
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.42984166605516255,
      "val_r": 0.5646495421265024,
      "n_iterations": 438,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.433302402496338,
        "right_subspace_overlap_bottom_k": -15.02072525024414,
        "interaction_matrix_overlap_top_k": 24.586803436279297,
        "interaction_matrix_overlap_bottom_k": 6.5257391929626465,
        "effective_rank": -6.383344650268555,
        "effective_rank_mergeability_score": -2.4300944805145264,
        "stable_rank": -25.756820678710938,
        "spectral_gap": -8.332119941711426,
        "singular_value_ratio": 17.411802291870117,
        "layerwise_effective_rank": -17.155841827392578,
        "layerwise_effective_rank_mergeability_score": 4.609292507171631,
        "task_vector_cosine_similarity": 3.939354419708252,
        "task_vector_l2_distance": -7.629650115966797,
        "task_vector_dot_product": 11.039752006530762,
        "weight_space_angle": -19.99427604675293,
        "task_vector_magnitude_ratio": -1.4426610469818115,
        "singular_value_overlap": -35.27433776855469,
        "subspace_overlap": 31.81615447998047,
        "right_subspace_overlap": 7.1423139572143555,
        "activation_l2_distance": -1.2926290035247803,
        "activation_cosine_similarity": 27.537405014038086,
        "activation_magnitude_ratio": 3.6190578937530518,
        "activation_dot_product": 18.28687858581543,
        "encoder_gradient_cosine_similarity": 17.682144165039062,
        "encoder_gradient_l2_distance": -26.523101806640625,
        "encoder_gradient_dot_product": 20.937314987182617,
        "input_gradient_cosine_similarity": 7.176882266998291,
        "input_gradient_l2_distance": -37.060768127441406,
        "input_gradient_dot_product": -4.451362609863281
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6117326349951087,
      "val_r": 0.33789015154372715,
      "n_iterations": 80,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.3756614029407501,
        "right_subspace_overlap_bottom_k": -0.09657428413629532,
        "interaction_matrix_overlap_top_k": 0.4100377857685089,
        "interaction_matrix_overlap_bottom_k": 1.1227062940597534,
        "effective_rank": -0.23210656642913818,
        "effective_rank_mergeability_score": 0.7255793213844299,
        "stable_rank": 0.3188837468624115,
        "spectral_gap": 0.5653424263000488,
        "singular_value_ratio": 0.1328507959842682,
        "layerwise_effective_rank": 0.6990109086036682,
        "layerwise_effective_rank_mergeability_score": 0.09151144325733185,
        "task_vector_cosine_similarity": -0.3508749008178711,
        "task_vector_l2_distance": -1.343299388885498,
        "task_vector_dot_product": 0.26839086413383484,
        "weight_space_angle": -0.13249699771404266,
        "task_vector_magnitude_ratio": 0.1334524154663086,
        "singular_value_overlap": -0.39304590225219727,
        "subspace_overlap": 0.15019068121910095,
        "right_subspace_overlap": -0.4290371537208557,
        "activation_l2_distance": 0.5685641169548035,
        "activation_cosine_similarity": 0.4363284409046173,
        "activation_magnitude_ratio": -0.2903215289115906,
        "activation_dot_product": -0.0013593065086752176,
        "encoder_gradient_cosine_similarity": 0.011363261379301548,
        "encoder_gradient_l2_distance": -0.3198665976524353,
        "encoder_gradient_dot_product": 0.2830903232097626,
        "input_gradient_cosine_similarity": 0.17974641919136047,
        "input_gradient_l2_distance": -1.4547208547592163,
        "input_gradient_dot_product": -0.43083423376083374
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.48176306968333166,
      "val_r": 0.30605573395470276,
      "n_iterations": 703,
      "coefficients": {
        "right_subspace_overlap_top_k": 58.113624572753906,
        "right_subspace_overlap_bottom_k": -0.9927545189857483,
        "interaction_matrix_overlap_top_k": 59.625267028808594,
        "interaction_matrix_overlap_bottom_k": -21.36684799194336,
        "effective_rank": -24.564672470092773,
        "effective_rank_mergeability_score": 31.207380294799805,
        "stable_rank": 19.893239974975586,
        "spectral_gap": -8.651460647583008,
        "singular_value_ratio": -44.8949089050293,
        "layerwise_effective_rank": 27.473487854003906,
        "layerwise_effective_rank_mergeability_score": -16.971118927001953,
        "task_vector_cosine_similarity": 35.29401397705078,
        "task_vector_l2_distance": -35.30446243286133,
        "task_vector_dot_product": -11.15161418914795,
        "weight_space_angle": -41.57389831542969,
        "task_vector_magnitude_ratio": 11.222352027893066,
        "singular_value_overlap": -27.29311752319336,
        "subspace_overlap": 13.44500732421875,
        "right_subspace_overlap": 11.141265869140625,
        "activation_l2_distance": -17.38459014892578,
        "activation_cosine_similarity": 13.301555633544922,
        "activation_magnitude_ratio": -25.366456985473633,
        "activation_dot_product": 9.022185325622559,
        "encoder_gradient_cosine_similarity": 47.647796630859375,
        "encoder_gradient_l2_distance": -48.10589599609375,
        "encoder_gradient_dot_product": 47.471927642822266,
        "input_gradient_cosine_similarity": 32.90009307861328,
        "input_gradient_l2_distance": -42.21186828613281,
        "input_gradient_dot_product": -50.927772521972656
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5607664199607235,
      "val_r": 0.3358186631815669,
      "n_iterations": 494,
      "coefficients": {
        "right_subspace_overlap_top_k": 43.42226791381836,
        "right_subspace_overlap_bottom_k": -5.159389019012451,
        "interaction_matrix_overlap_top_k": -5.458878040313721,
        "interaction_matrix_overlap_bottom_k": 28.872739791870117,
        "effective_rank": -3.6093039512634277,
        "effective_rank_mergeability_score": 29.47016143798828,
        "stable_rank": -20.013023376464844,
        "spectral_gap": 1.9388984441757202,
        "singular_value_ratio": 27.192256927490234,
        "layerwise_effective_rank": -22.749269485473633,
        "layerwise_effective_rank_mergeability_score": -32.782772064208984,
        "task_vector_cosine_similarity": -0.9126455187797546,
        "task_vector_l2_distance": -39.85596466064453,
        "task_vector_dot_product": -2.14682674407959,
        "weight_space_angle": 32.7115478515625,
        "task_vector_magnitude_ratio": -9.052151679992676,
        "singular_value_overlap": -30.911785125732422,
        "subspace_overlap": 39.520626068115234,
        "right_subspace_overlap": 27.657899856567383,
        "activation_l2_distance": -4.041533470153809,
        "activation_cosine_similarity": 3.1593644618988037,
        "activation_magnitude_ratio": 0.43649107217788696,
        "activation_dot_product": 23.939661026000977,
        "encoder_gradient_cosine_similarity": 13.697961807250977,
        "encoder_gradient_l2_distance": -62.95753860473633,
        "encoder_gradient_dot_product": 27.769390106201172,
        "input_gradient_cosine_similarity": 18.219295501708984,
        "input_gradient_l2_distance": -47.24363708496094,
        "input_gradient_dot_product": -30.11680030822754
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.812585287300356,
      "val_r": 0.6467254633942623,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.793140411376953,
        "right_subspace_overlap_bottom_k": -1.2897217273712158,
        "interaction_matrix_overlap_top_k": 1.8529996871948242,
        "interaction_matrix_overlap_bottom_k": -1.2109730243682861,
        "effective_rank": 3.571838617324829,
        "effective_rank_mergeability_score": -1.7696712017059326,
        "stable_rank": -3.7016959190368652,
        "spectral_gap": -0.6107546091079712,
        "singular_value_ratio": 2.3267807960510254,
        "layerwise_effective_rank": -3.5908656120300293,
        "layerwise_effective_rank_mergeability_score": 1.3794523477554321,
        "task_vector_cosine_similarity": -1.052841067314148,
        "task_vector_l2_distance": -0.8587320446968079,
        "task_vector_dot_product": 0.10492546111345291,
        "weight_space_angle": 3.5697076320648193,
        "task_vector_magnitude_ratio": -1.08588707447052,
        "singular_value_overlap": -0.48171502351760864,
        "subspace_overlap": -2.1755011081695557,
        "right_subspace_overlap": 1.7825735807418823,
        "activation_l2_distance": 2.6368894577026367,
        "activation_cosine_similarity": 3.8806114196777344,
        "activation_magnitude_ratio": -0.3411160409450531,
        "activation_dot_product": 1.9228086471557617,
        "encoder_gradient_cosine_similarity": 1.351078748703003,
        "encoder_gradient_l2_distance": -4.610458850860596,
        "encoder_gradient_dot_product": 1.2233377695083618,
        "input_gradient_cosine_similarity": -0.04032174125313759,
        "input_gradient_l2_distance": -5.260448455810547,
        "input_gradient_dot_product": -2.3165106773376465
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5648433248365791,
      "val_r": 0.3405890543143324,
      "n_iterations": 599,
      "coefficients": {
        "right_subspace_overlap_top_k": 39.05614471435547,
        "right_subspace_overlap_bottom_k": -11.711431503295898,
        "interaction_matrix_overlap_top_k": 95.32350158691406,
        "interaction_matrix_overlap_bottom_k": 45.15639114379883,
        "effective_rank": 45.53201675415039,
        "effective_rank_mergeability_score": 26.19104766845703,
        "stable_rank": -53.959163665771484,
        "spectral_gap": -53.366294860839844,
        "singular_value_ratio": -59.01295471191406,
        "layerwise_effective_rank": 17.482328414916992,
        "layerwise_effective_rank_mergeability_score": 43.923187255859375,
        "task_vector_cosine_similarity": 5.679020404815674,
        "task_vector_l2_distance": -79.82095336914062,
        "task_vector_dot_product": 9.854717254638672,
        "weight_space_angle": 16.503849029541016,
        "task_vector_magnitude_ratio": 34.074283599853516,
        "singular_value_overlap": -70.526123046875,
        "subspace_overlap": -35.892791748046875,
        "right_subspace_overlap": -10.020094871520996,
        "activation_l2_distance": -1.5254493951797485,
        "activation_cosine_similarity": 3.0004289150238037,
        "activation_magnitude_ratio": -8.561261177062988,
        "activation_dot_product": 39.457950592041016,
        "encoder_gradient_cosine_similarity": 43.54018020629883,
        "encoder_gradient_l2_distance": -47.36613464355469,
        "encoder_gradient_dot_product": 9.72825813293457,
        "input_gradient_cosine_similarity": 56.71759033203125,
        "input_gradient_l2_distance": -86.41972351074219,
        "input_gradient_dot_product": -12.041058540344238
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}