{
  "aggregate_metrics": {
    "train_r": 0.14263140035908786,
    "train_p": 4.132390682492131e-16,
    "val_r": 0.24997581780362269,
    "val_p": 1.6721953734313622e-06
  },
  "per_fold_stats": {
    "train_r_mean": 0.7403321946671069,
    "train_r_std": 0.08046908449510773,
    "val_r_mean": 0.6086115734157599,
    "val_r_std": 0.21265087770185623
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 10.898747444152832,
    "right_subspace_overlap_bottom_k": -0.8623163104057312,
    "interaction_matrix_overlap_top_k": 13.932268142700195,
    "interaction_matrix_overlap_bottom_k": -9.838746070861816,
    "effective_rank": -4.0033674240112305,
    "effective_rank_mergeability_score": -10.859968185424805,
    "stable_rank": -8.795872688293457,
    "spectral_gap": -5.87529993057251,
    "singular_value_ratio": 5.647424221038818,
    "layerwise_effective_rank": 0.3538892865180969,
    "layerwise_effective_rank_mergeability_score": 10.910131454467773,
    "task_vector_cosine_similarity": -6.186434745788574,
    "task_vector_l2_distance": -1.380467176437378,
    "task_vector_dot_product": -0.018287498503923416,
    "weight_space_angle": 2.259608745574951,
    "task_vector_magnitude_ratio": -4.586515426635742,
    "singular_value_overlap": 9.719736099243164,
    "subspace_overlap": 11.173913955688477,
    "right_subspace_overlap": 0.9220489263534546,
    "activation_l2_distance": -1.435880422592163,
    "activation_cosine_similarity": -0.10497410595417023,
    "activation_magnitude_ratio": -4.792350769042969,
    "activation_dot_product": 4.46563720703125,
    "encoder_gradient_cosine_similarity": 11.896528244018555,
    "encoder_gradient_l2_distance": -5.008673191070557,
    "encoder_gradient_dot_product": 3.3356165885925293,
    "input_gradient_cosine_similarity": 6.012997627258301,
    "input_gradient_l2_distance": -25.01630401611328,
    "input_gradient_dot_product": -1.7659467458724976
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 30.45414924621582,
    "right_subspace_overlap_bottom_k": 25.592998504638672,
    "interaction_matrix_overlap_top_k": 43.38706970214844,
    "interaction_matrix_overlap_bottom_k": 23.96672248840332,
    "effective_rank": 20.747159957885742,
    "effective_rank_mergeability_score": 36.237850189208984,
    "stable_rank": 33.910675048828125,
    "spectral_gap": 23.406068801879883,
    "singular_value_ratio": 15.290914535522461,
    "layerwise_effective_rank": 19.95014762878418,
    "layerwise_effective_rank_mergeability_score": 39.395782470703125,
    "task_vector_cosine_similarity": 23.70966148376465,
    "task_vector_l2_distance": 11.519659996032715,
    "task_vector_dot_product": 12.363191604614258,
    "weight_space_angle": 4.849324703216553,
    "task_vector_magnitude_ratio": 18.079519271850586,
    "singular_value_overlap": 23.75921058654785,
    "subspace_overlap": 42.58895492553711,
    "right_subspace_overlap": 22.849815368652344,
    "activation_l2_distance": 4.340395450592041,
    "activation_cosine_similarity": 19.99277687072754,
    "activation_magnitude_ratio": 15.983172416687012,
    "activation_dot_product": 7.099811553955078,
    "encoder_gradient_cosine_similarity": 40.4615364074707,
    "encoder_gradient_l2_distance": 14.822592735290527,
    "encoder_gradient_dot_product": 8.388590812683105,
    "input_gradient_cosine_similarity": 19.298471450805664,
    "input_gradient_l2_distance": 85.09378814697266,
    "input_gradient_dot_product": 7.366115093231201
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7383554426992431,
      "val_r": 0.6159762573182455,
      "n_iterations": 81,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.8599808216094971,
        "right_subspace_overlap_bottom_k": -1.8761943578720093,
        "interaction_matrix_overlap_top_k": 0.8256967663764954,
        "interaction_matrix_overlap_bottom_k": -0.4264709949493408,
        "effective_rank": 0.5607798099517822,
        "effective_rank_mergeability_score": -0.8031554222106934,
        "stable_rank": -1.1650354862213135,
        "spectral_gap": 0.3376457095146179,
        "singular_value_ratio": 0.007605420425534248,
        "layerwise_effective_rank": -0.28925126791000366,
        "layerwise_effective_rank_mergeability_score": 0.2522401511669159,
        "task_vector_cosine_similarity": 0.2491496056318283,
        "task_vector_l2_distance": -0.03962133824825287,
        "task_vector_dot_product": -0.10469424724578857,
        "weight_space_angle": 1.2046363353729248,
        "task_vector_magnitude_ratio": 0.6927991509437561,
        "singular_value_overlap": 0.37618547677993774,
        "subspace_overlap": 1.6706229448318481,
        "right_subspace_overlap": 0.3515515923500061,
        "activation_l2_distance": -0.30914369225502014,
        "activation_cosine_similarity": 1.284883975982666,
        "activation_magnitude_ratio": -0.342682421207428,
        "activation_dot_product": 0.02513796091079712,
        "encoder_gradient_cosine_similarity": 0.6299861669540405,
        "encoder_gradient_l2_distance": -1.4322997331619263,
        "encoder_gradient_dot_product": 0.5114133358001709,
        "input_gradient_cosine_similarity": 0.5808448791503906,
        "input_gradient_l2_distance": -1.480334758758545,
        "input_gradient_dot_product": -1.1690614223480225
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7285803828063417,
      "val_r": 0.8002321891190286,
      "n_iterations": 663,
      "coefficients": {
        "right_subspace_overlap_top_k": 17.95650863647461,
        "right_subspace_overlap_bottom_k": -16.40998077392578,
        "interaction_matrix_overlap_top_k": 1.7318484783172607,
        "interaction_matrix_overlap_bottom_k": -9.800074577331543,
        "effective_rank": -9.149293899536133,
        "effective_rank_mergeability_score": -4.9683451652526855,
        "stable_rank": 5.243716716766357,
        "spectral_gap": -2.1313912868499756,
        "singular_value_ratio": 6.235317707061768,
        "layerwise_effective_rank": -14.110591888427734,
        "layerwise_effective_rank_mergeability_score": -0.5545151233673096,
        "task_vector_cosine_similarity": -1.4194495677947998,
        "task_vector_l2_distance": -1.9114513397216797,
        "task_vector_dot_product": 2.719437599182129,
        "weight_space_angle": 8.779257774353027,
        "task_vector_magnitude_ratio": -0.44894614815711975,
        "singular_value_overlap": 12.152000427246094,
        "subspace_overlap": 1.8808887004852295,
        "right_subspace_overlap": 9.387431144714355,
        "activation_l2_distance": -4.254150867462158,
        "activation_cosine_similarity": 5.148298263549805,
        "activation_magnitude_ratio": -3.964618444442749,
        "activation_dot_product": 18.270103454589844,
        "encoder_gradient_cosine_similarity": 6.2301926612854,
        "encoder_gradient_l2_distance": -29.32243537902832,
        "encoder_gradient_dot_product": 2.7258198261260986,
        "input_gradient_cosine_similarity": 5.622804641723633,
        "input_gradient_l2_distance": -6.743100643157959,
        "input_gradient_dot_product": 2.102470874786377
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.814458764964025,
      "val_r": 0.8006011889385716,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.7703233361244202,
        "right_subspace_overlap_bottom_k": -1.7245465517044067,
        "interaction_matrix_overlap_top_k": 0.28143301606178284,
        "interaction_matrix_overlap_bottom_k": 0.6416876316070557,
        "effective_rank": 0.0056238677352666855,
        "effective_rank_mergeability_score": -0.44851693511009216,
        "stable_rank": 0.7608089447021484,
        "spectral_gap": -0.22757916152477264,
        "singular_value_ratio": 0.19374796748161316,
        "layerwise_effective_rank": -0.264925092458725,
        "layerwise_effective_rank_mergeability_score": 1.0271990299224854,
        "task_vector_cosine_similarity": 0.5214828252792358,
        "task_vector_l2_distance": 0.1732947677373886,
        "task_vector_dot_product": -0.2511220872402191,
        "weight_space_angle": 0.6577175855636597,
        "task_vector_magnitude_ratio": -0.5734212398529053,
        "singular_value_overlap": 0.129765123128891,
        "subspace_overlap": -0.7143340706825256,
        "right_subspace_overlap": 1.0032545328140259,
        "activation_l2_distance": 0.2257828563451767,
        "activation_cosine_similarity": 1.126695156097412,
        "activation_magnitude_ratio": -0.14397792518138885,
        "activation_dot_product": -0.21708446741104126,
        "encoder_gradient_cosine_similarity": 0.07804691046476364,
        "encoder_gradient_l2_distance": -1.3322222232818604,
        "encoder_gradient_dot_product": 0.0038278040010482073,
        "input_gradient_cosine_similarity": 0.1493416577577591,
        "input_gradient_l2_distance": -0.6024740934371948,
        "input_gradient_dot_product": -0.24743075668811798
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7439512638833096,
      "val_r": 0.7393575279148963,
      "n_iterations": 86,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.25708356499671936,
        "right_subspace_overlap_bottom_k": -0.562557578086853,
        "interaction_matrix_overlap_top_k": 0.38276976346969604,
        "interaction_matrix_overlap_bottom_k": -0.32962796092033386,
        "effective_rank": 0.580077588558197,
        "effective_rank_mergeability_score": 0.24707449972629547,
        "stable_rank": -0.43022996187210083,
        "spectral_gap": 0.41197606921195984,
        "singular_value_ratio": 0.3372579514980316,
        "layerwise_effective_rank": -0.2454700618982315,
        "layerwise_effective_rank_mergeability_score": 0.16796530783176422,
        "task_vector_cosine_similarity": -0.014073236845433712,
        "task_vector_l2_distance": -0.05108847841620445,
        "task_vector_dot_product": -0.26028624176979065,
        "weight_space_angle": -0.1775963008403778,
        "task_vector_magnitude_ratio": 0.4383961260318756,
        "singular_value_overlap": 0.5632049441337585,
        "subspace_overlap": -0.008646488189697266,
        "right_subspace_overlap": 0.8644238710403442,
        "activation_l2_distance": 0.20493347942829132,
        "activation_cosine_similarity": 0.8088462948799133,
        "activation_magnitude_ratio": -0.264634907245636,
        "activation_dot_product": 0.6715022921562195,
        "encoder_gradient_cosine_similarity": 0.2127343714237213,
        "encoder_gradient_l2_distance": -1.3631446361541748,
        "encoder_gradient_dot_product": -0.0863424688577652,
        "input_gradient_cosine_similarity": 0.1011810228228569,
        "input_gradient_l2_distance": -0.8474652767181396,
        "input_gradient_dot_product": -0.09299689531326294
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6369282748334341,
      "val_r": 0.7167848316332007,
      "n_iterations": 54,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00015725253615528345,
        "right_subspace_overlap_bottom_k": -0.20276634395122528,
        "interaction_matrix_overlap_top_k": 0.36845627427101135,
        "interaction_matrix_overlap_bottom_k": -0.19595159590244293,
        "effective_rank": 0.5299469232559204,
        "effective_rank_mergeability_score": 0.04440184310078621,
        "stable_rank": -0.5347023606300354,
        "spectral_gap": -1.362492561340332,
        "singular_value_ratio": 0.31119608879089355,
        "layerwise_effective_rank": -1.069807767868042,
        "layerwise_effective_rank_mergeability_score": 0.327812522649765,
        "task_vector_cosine_similarity": 1.001638650894165,
        "task_vector_l2_distance": 0.35426589846611023,
        "task_vector_dot_product": 0.20712129771709442,
        "weight_space_angle": -0.5622943043708801,
        "task_vector_magnitude_ratio": -0.8565579652786255,
        "singular_value_overlap": 1.276171326637268,
        "subspace_overlap": 0.882401704788208,
        "right_subspace_overlap": -0.3140789568424225,
        "activation_l2_distance": -0.02090362459421158,
        "activation_cosine_similarity": 1.363538146018982,
        "activation_magnitude_ratio": -0.6420818567276001,
        "activation_dot_product": 2.608773946762085,
        "encoder_gradient_cosine_similarity": 0.5392841696739197,
        "encoder_gradient_l2_distance": -0.9388313889503479,
        "encoder_gradient_dot_product": -0.3370216190814972,
        "input_gradient_cosine_similarity": 1.152563452720642,
        "input_gradient_l2_distance": -3.1436119079589844,
        "input_gradient_dot_product": 0.1947818100452423
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.784841100494872,
      "val_r": 0.7543917766430709,
      "n_iterations": 119,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.14015954732894897,
        "right_subspace_overlap_bottom_k": -0.36826521158218384,
        "interaction_matrix_overlap_top_k": 0.5627046823501587,
        "interaction_matrix_overlap_bottom_k": -0.1005922257900238,
        "effective_rank": 0.356578528881073,
        "effective_rank_mergeability_score": -0.5059483051300049,
        "stable_rank": -0.1882418841123581,
        "spectral_gap": 0.1290292590856552,
        "singular_value_ratio": 0.1617944836616516,
        "layerwise_effective_rank": -0.20669691264629364,
        "layerwise_effective_rank_mergeability_score": 0.616215705871582,
        "task_vector_cosine_similarity": -0.07018545269966125,
        "task_vector_l2_distance": -0.12079426646232605,
        "task_vector_dot_product": 0.08738153427839279,
        "weight_space_angle": 0.5735269784927368,
        "task_vector_magnitude_ratio": -0.04346427693963051,
        "singular_value_overlap": 0.11649559438228607,
        "subspace_overlap": -0.3223060369491577,
        "right_subspace_overlap": 0.46433764696121216,
        "activation_l2_distance": 0.21796290576457977,
        "activation_cosine_similarity": 0.5546327233314514,
        "activation_magnitude_ratio": -0.0720970630645752,
        "activation_dot_product": 0.1246950551867485,
        "encoder_gradient_cosine_similarity": 0.162993922829628,
        "encoder_gradient_l2_distance": -0.8842995762825012,
        "encoder_gradient_dot_product": 0.0328366793692112,
        "input_gradient_cosine_similarity": 0.09107409417629242,
        "input_gradient_l2_distance": -0.33793121576309204,
        "input_gradient_dot_product": -0.17545925080776215
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7627550054062622,
      "val_r": 0.6673386210606237,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.631526470184326,
        "right_subspace_overlap_bottom_k": -7.543515682220459,
        "interaction_matrix_overlap_top_k": 4.342350482940674,
        "interaction_matrix_overlap_bottom_k": -6.0165791511535645,
        "effective_rank": -3.2389256954193115,
        "effective_rank_mergeability_score": 1.612115502357483,
        "stable_rank": 2.889418363571167,
        "spectral_gap": -1.1984517574310303,
        "singular_value_ratio": -3.748995542526245,
        "layerwise_effective_rank": 3.8115146160125732,
        "layerwise_effective_rank_mergeability_score": 2.6017396450042725,
        "task_vector_cosine_similarity": -0.12843622267246246,
        "task_vector_l2_distance": -0.038674671202898026,
        "task_vector_dot_product": 1.6154935359954834,
        "weight_space_angle": 0.09744258970022202,
        "task_vector_magnitude_ratio": 2.209977388381958,
        "singular_value_overlap": 4.1422271728515625,
        "subspace_overlap": -1.1571201086044312,
        "right_subspace_overlap": 6.887217044830322,
        "activation_l2_distance": -2.426409959793091,
        "activation_cosine_similarity": 6.69526481628418,
        "activation_magnitude_ratio": -0.6725826859474182,
        "activation_dot_product": 0.034101828932762146,
        "encoder_gradient_cosine_similarity": 2.863192081451416,
        "encoder_gradient_l2_distance": -10.29025936126709,
        "encoder_gradient_dot_product": 3.2065813541412354,
        "input_gradient_cosine_similarity": 0.3954707682132721,
        "input_gradient_l2_distance": -8.761510848999023,
        "input_gradient_dot_product": -3.8154165744781494
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.46939297421922765,
      "val_r": 0.0034167290489222346,
      "n_iterations": 400,
      "coefficients": {
        "right_subspace_overlap_top_k": 141.59649658203125,
        "right_subspace_overlap_bottom_k": 102.40628814697266,
        "interaction_matrix_overlap_top_k": 199.716796875,
        "interaction_matrix_overlap_bottom_k": -110.19810485839844,
        "effective_rank": -92.86228942871094,
        "effective_rank_mergeability_score": -165.08184814453125,
        "stable_rank": -153.68568420410156,
        "spectral_gap": -106.51715087890625,
        "singular_value_ratio": 69.57646942138672,
        "layerwise_effective_rank": 80.4477767944336,
        "layerwise_effective_rank_mergeability_score": 181.79095458984375,
        "task_vector_cosine_similarity": -108.75445556640625,
        "task_vector_l2_distance": -48.7348747253418,
        "task_vector_dot_product": 46.96683120727539,
        "weight_space_angle": 13.6090726852417,
        "task_vector_magnitude_ratio": -82.66228485107422,
        "singular_value_overlap": 108.9786605834961,
        "subspace_overlap": 195.36883544921875,
        "right_subspace_overlap": -88.71089172363281,
        "activation_l2_distance": -18.84733009338379,
        "activation_cosine_similarity": -83.85076904296875,
        "activation_magnitude_ratio": -74.03280639648438,
        "activation_dot_product": 11.398058891296387,
        "encoder_gradient_cosine_similarity": 187.45240783691406,
        "encoder_gradient_l2_distance": 40.48320007324219,
        "encoder_gradient_dot_product": 38.50603103637695,
        "input_gradient_cosine_similarity": 89.32343292236328,
        "input_gradient_l2_distance": -394.6093444824219,
        "input_gradient_dot_product": 21.92269515991211
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.82248031722507,
      "val_r": 0.36439253904341495,
      "n_iterations": 377,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5170467495918274,
        "right_subspace_overlap_bottom_k": -0.5370767712593079,
        "interaction_matrix_overlap_top_k": -0.34696295857429504,
        "interaction_matrix_overlap_bottom_k": 0.01419755257666111,
        "effective_rank": 0.17614232003688812,
        "effective_rank_mergeability_score": -0.014251618646085262,
        "stable_rank": 0.1719784289598465,
        "spectral_gap": 0.07053565979003906,
        "singular_value_ratio": 0.32727789878845215,
        "layerwise_effective_rank": -0.06548409909009933,
        "layerwise_effective_rank_mergeability_score": 0.5169440507888794,
        "task_vector_cosine_similarity": -0.16694194078445435,
        "task_vector_l2_distance": 0.039012275636196136,
        "task_vector_dot_product": 0.056098952889442444,
        "weight_space_angle": 0.0052497293800115585,
        "task_vector_magnitude_ratio": -0.19991344213485718,
        "singular_value_overlap": 0.06698615103960037,
        "subspace_overlap": -0.19093704223632812,
        "right_subspace_overlap": 0.5246357917785645,
        "activation_l2_distance": 0.2533337473869324,
        "activation_cosine_similarity": 0.6489541530609131,
        "activation_magnitude_ratio": -0.028319841250777245,
        "activation_dot_product": -0.1849726289510727,
        "encoder_gradient_cosine_similarity": 0.09891825914382935,
        "encoder_gradient_l2_distance": -0.41954153776168823,
        "encoder_gradient_dot_product": 0.06658919900655746,
        "input_gradient_cosine_similarity": 0.03472165763378143,
        "input_gradient_l2_distance": -0.29487428069114685,
        "input_gradient_dot_product": -0.13794191181659698
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6242355754217341,
      "val_r": 0.4964838016667297,
      "n_iterations": 83,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.0007264614105225,
        "right_subspace_overlap_bottom_k": -0.30506816506385803,
        "interaction_matrix_overlap_top_k": 1.6147385835647583,
        "interaction_matrix_overlap_bottom_k": -1.5688122510910034,
        "effective_rank": -0.05712635815143585,
        "effective_rank_mergeability_score": 0.6208360195159912,
        "stable_rank": -0.13119317591190338,
        "spectral_gap": -0.35001105070114136,
        "singular_value_ratio": -0.3178909718990326,
        "layerwise_effective_rank": -0.26443129777908325,
        "layerwise_effective_rank_mergeability_score": 0.5565174221992493,
        "task_vector_cosine_similarity": 0.6043170690536499,
        "task_vector_l2_distance": -0.25768476724624634,
        "task_vector_dot_product": 0.20152686536312103,
        "weight_space_angle": -1.8603181838989258,
        "task_vector_magnitude_ratio": -0.43897297978401184,
        "singular_value_overlap": 1.6701860427856445,
        "subspace_overlap": 1.105432152748108,
        "right_subspace_overlap": 0.919734001159668,
        "activation_l2_distance": 1.8049802780151367,
        "activation_cosine_similarity": -0.8426432013511658,
        "activation_magnitude_ratio": -1.9045852422714233,
        "activation_dot_product": 1.229944109916687,
        "encoder_gradient_cosine_similarity": 1.7028918266296387,
        "encoder_gradient_l2_distance": -2.603431463241577,
        "encoder_gradient_dot_product": -0.5939882397651672,
        "input_gradient_cosine_similarity": 1.331223964691162,
        "input_gradient_l2_distance": -1.4313431978225708,
        "input_gradient_dot_product": -1.444578766822815
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7202745432950534,
      "val_r": 0.36322381301150136,
      "n_iterations": 55,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.8382185101509094,
        "right_subspace_overlap_bottom_k": -0.290496826171875,
        "interaction_matrix_overlap_top_k": -0.32542523741722107,
        "interaction_matrix_overlap_bottom_k": -0.9564939737319946,
        "effective_rank": -1.1294505596160889,
        "effective_rank_mergeability_score": 0.84788578748703,
        "stable_rank": 1.1540778875350952,
        "spectral_gap": 1.3246238231658936,
        "singular_value_ratio": 1.407307505607605,
        "layerwise_effective_rank": 0.14137598872184753,
        "layerwise_effective_rank_mergeability_score": -0.12423339486122131,
        "task_vector_cosine_similarity": 0.5756468772888184,
        "task_vector_l2_distance": 0.08129749447107315,
        "task_vector_dot_product": -0.1251916140317917,
        "weight_space_angle": -0.7230595946311951,
        "task_vector_magnitude_ratio": 0.32038089632987976,
        "singular_value_overlap": -0.03287998214364052,
        "subspace_overlap": -0.5715649127960205,
        "right_subspace_overlap": 1.0185221433639526,
        "activation_l2_distance": -0.40512052178382874,
        "activation_cosine_similarity": 0.8904086351394653,
        "activation_magnitude_ratio": -0.43639490008354187,
        "activation_dot_product": 0.7800513505935669,
        "encoder_gradient_cosine_similarity": 0.20058459043502808,
        "encoder_gradient_l2_distance": -1.9285696744918823,
        "encoder_gradient_dot_product": -0.3422018885612488,
        "input_gradient_cosine_similarity": 0.07296761870384216,
        "input_gradient_l2_distance": -0.48126938939094543,
        "input_gradient_dot_product": -0.7711891531944275
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7668618993933283,
      "val_r": 0.7745048037795558,
      "n_iterations": 170,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.6065739989280701,
        "right_subspace_overlap_bottom_k": -1.1304945945739746,
        "interaction_matrix_overlap_top_k": 0.35128656029701233,
        "interaction_matrix_overlap_bottom_k": -0.440475195646286,
        "effective_rank": -0.13997270166873932,
        "effective_rank_mergeability_score": -0.144754096865654,
        "stable_rank": 0.09058045595884323,
        "spectral_gap": 0.012523237615823746,
        "singular_value_ratio": -0.39696064591407776,
        "layerwise_effective_rank": 0.1595853567123413,
        "layerwise_effective_rank_mergeability_score": 0.3266293406486511,
        "task_vector_cosine_similarity": -0.5235448479652405,
        "task_vector_l2_distance": 0.09412981569766998,
        "task_vector_dot_product": -0.724187433719635,
        "weight_space_angle": 0.3975623846054077,
        "task_vector_magnitude_ratio": 0.48031875491142273,
        "singular_value_overlap": 0.6570349335670471,
        "subspace_overlap": 0.5303064584732056,
        "right_subspace_overlap": 1.092384696006775,
        "activation_l2_distance": 0.3596855103969574,
        "activation_cosine_similarity": 1.012281894683838,
        "activation_magnitude_ratio": -0.20580154657363892,
        "activation_dot_product": 0.8852450251579285,
        "encoder_gradient_cosine_similarity": 0.3327920436859131,
        "encoder_gradient_l2_distance": -1.3431345224380493,
        "encoder_gradient_dot_product": 0.11316125094890594,
        "input_gradient_cosine_similarity": 0.3198155462741852,
        "input_gradient_l2_distance": -1.2963374853134155,
        "input_gradient_dot_product": -0.479441374540329
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7772141585556772,
      "val_r": 0.7550268763444333,
      "n_iterations": 578,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.6414774656295776,
        "right_subspace_overlap_bottom_k": -0.4175901412963867,
        "interaction_matrix_overlap_top_k": 0.34028589725494385,
        "interaction_matrix_overlap_bottom_k": -0.6677236557006836,
        "effective_rank": -0.03823114559054375,
        "effective_rank_mergeability_score": -0.5688915848731995,
        "stable_rank": 0.44755443930625916,
        "spectral_gap": 0.4657021760940552,
        "singular_value_ratio": 0.3926992416381836,
        "layerwise_effective_rank": -0.5052085518836975,
        "layerwise_effective_rank_mergeability_score": 0.48555365204811096,
        "task_vector_cosine_similarity": 0.4957779049873352,
        "task_vector_l2_distance": 0.18475177884101868,
        "task_vector_dot_product": -0.5848254561424255,
        "weight_space_angle": -0.08107452094554901,
        "task_vector_magnitude_ratio": 0.03271012380719185,
        "singular_value_overlap": 0.32423925399780273,
        "subspace_overlap": -0.8063180446624756,
        "right_subspace_overlap": 0.836395800113678,
        "activation_l2_distance": 0.5379195809364319,
        "activation_cosine_similarity": 1.2373279333114624,
        "activation_magnitude_ratio": -0.0916992574930191,
        "activation_dot_product": 0.12208123505115509,
        "encoder_gradient_cosine_similarity": 0.2630910575389862,
        "encoder_gradient_l2_distance": -1.2188090085983276,
        "encoder_gradient_dot_product": 0.17824271321296692,
        "input_gradient_cosine_similarity": 0.17189663648605347,
        "input_gradient_l2_distance": -0.7645813226699829,
        "input_gradient_dot_product": -0.41002729535102844
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7802159643191242,
      "val_r": 0.6957931426781955,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.534635543823242,
        "right_subspace_overlap_bottom_k": -4.791340351104736,
        "interaction_matrix_overlap_top_k": -0.4141785502433777,
        "interaction_matrix_overlap_bottom_k": -2.5086512565612793,
        "effective_rank": -1.639542579650879,
        "effective_rank_mergeability_score": 1.3214038610458374,
        "stable_rank": 1.420405387878418,
        "spectral_gap": -0.8260352611541748,
        "singular_value_ratio": 1.3217395544052124,
        "layerwise_effective_rank": 2.39548659324646,
        "layerwise_effective_rank_mergeability_score": 2.809840202331543,
        "task_vector_cosine_similarity": -0.43567830324172974,
        "task_vector_l2_distance": 0.9339990615844727,
        "task_vector_dot_product": -3.2536208629608154,
        "weight_space_angle": -0.4617769718170166,
        "task_vector_magnitude_ratio": -0.8816072344779968,
        "singular_value_overlap": 1.847948431968689,
        "subspace_overlap": -4.7411980628967285,
        "right_subspace_overlap": 6.2520952224731445,
        "activation_l2_distance": 0.567791223526001,
        "activation_cosine_similarity": 5.3441877365112305,
        "activation_magnitude_ratio": -0.9866385459899902,
        "activation_dot_product": 0.6921970248222351,
        "encoder_gradient_cosine_similarity": 1.4737465381622314,
        "encoder_gradient_l2_distance": -4.908179759979248,
        "encoder_gradient_dot_product": 1.0558913946151733,
        "input_gradient_cosine_similarity": 0.8632148504257202,
        "input_gradient_l2_distance": -6.171273708343506,
        "input_gradient_dot_product": -2.815858840942383
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7686375065504705,
      "val_r": 0.7220507129324346,
      "n_iterations": 839,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.434907913208008,
        "right_subspace_overlap_bottom_k": -5.6143412590026855,
        "interaction_matrix_overlap_top_k": 9.220990180969238,
        "interaction_matrix_overlap_bottom_k": -12.268839836120605,
        "effective_rank": 10.996553421020508,
        "effective_rank_mergeability_score": 6.245359897613525,
        "stable_rank": 0.05753515288233757,
        "spectral_gap": 3.581733465194702,
        "singular_value_ratio": 16.233675003051758,
        "layerwise_effective_rank": -11.840104103088379,
        "layerwise_effective_rank_mergeability_score": -2.0902743339538574,
        "task_vector_cosine_similarity": -10.082344055175781,
        "task_vector_l2_distance": -0.5183813571929932,
        "task_vector_dot_product": -2.562161922454834,
        "weight_space_angle": -0.2822372615337372,
        "task_vector_magnitude_ratio": -10.207364082336426,
        "singular_value_overlap": 4.831968307495117,
        "subspace_overlap": -4.55422306060791,
        "right_subspace_overlap": 12.679512977600098,
        "activation_l2_distance": -1.1799428462982178,
        "activation_cosine_similarity": 7.478572368621826,
        "activation_magnitude_ratio": -2.1248860359191895,
        "activation_dot_product": 3.489264726638794,
        "encoder_gradient_cosine_similarity": 3.682676076889038,
        "encoder_gradient_l2_distance": -8.375967979431152,
        "encoder_gradient_dot_product": 3.442612409591675,
        "input_gradient_cosine_similarity": 1.3827177286148071,
        "input_gradient_l2_distance": -13.561165809631348,
        "input_gradient_dot_product": -4.497481346130371
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7710592762468432,
      "val_r": 0.1929069175766156,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.938537120819092,
        "right_subspace_overlap_bottom_k": -10.62357234954834,
        "interaction_matrix_overlap_top_k": 8.424174308776855,
        "interaction_matrix_overlap_bottom_k": -8.693180084228516,
        "effective_rank": 1.9239379167556763,
        "effective_rank_mergeability_score": -6.317979335784912,
        "stable_rank": -0.9088044762611389,
        "spectral_gap": 3.210578680038452,
        "singular_value_ratio": 5.200541019439697,
        "layerwise_effective_rank": -8.569297790527344,
        "layerwise_effective_rank_mergeability_score": 3.423205852508545,
        "task_vector_cosine_similarity": -2.2912843227386475,
        "task_vector_l2_distance": -1.3478140830993652,
        "task_vector_dot_product": -5.857793807983398,
        "weight_space_angle": 0.9827899932861328,
        "task_vector_magnitude_ratio": 0.44938939809799194,
        "singular_value_overlap": 13.609474182128906,
        "subspace_overlap": 4.177717208862305,
        "right_subspace_overlap": 11.524093627929688,
        "activation_l2_distance": 1.1244566440582275,
        "activation_cosine_similarity": 11.463760375976562,
        "activation_magnitude_ratio": -7.000340461730957,
        "activation_dot_product": 7.446649551391602,
        "encoder_gradient_cosine_similarity": 5.634867191314697,
        "encoder_gradient_l2_distance": -9.527174949645996,
        "encoder_gradient_dot_product": 4.18528413772583,
        "input_gradient_cosine_similarity": 3.18565034866333,
        "input_gradient_l2_distance": -17.11208152770996,
        "input_gradient_dot_product": -12.65704345703125
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8444992880440614,
      "val_r": 0.7774920342535097,
      "n_iterations": 649,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.10101386904716492,
        "right_subspace_overlap_bottom_k": -1.7705843448638916,
        "interaction_matrix_overlap_top_k": -1.0248291492462158,
        "interaction_matrix_overlap_bottom_k": 1.4498335123062134,
        "effective_rank": 1.5248569250106812,
        "effective_rank_mergeability_score": -0.6213370561599731,
        "stable_rank": -2.001974582672119,
        "spectral_gap": -0.04138418287038803,
        "singular_value_ratio": 0.4463617205619812,
        "layerwise_effective_rank": 0.40672627091407776,
        "layerwise_effective_rank_mergeability_score": 0.8130173087120056,
        "task_vector_cosine_similarity": 0.25118744373321533,
        "task_vector_l2_distance": 0.078894704580307,
        "task_vector_dot_product": 0.13390709459781647,
        "weight_space_angle": 0.21177338063716888,
        "task_vector_magnitude_ratio": -0.10941901057958603,
        "singular_value_overlap": 0.032252635806798935,
        "subspace_overlap": -0.12712551653385162,
        "right_subspace_overlap": 1.1061851978302002,
        "activation_l2_distance": 0.2941477298736572,
        "activation_cosine_similarity": 0.6982026696205139,
        "activation_magnitude_ratio": -0.03413499891757965,
        "activation_dot_product": -0.23342019319534302,
        "encoder_gradient_cosine_similarity": 0.07020867615938187,
        "encoder_gradient_l2_distance": -0.3299295902252197,
        "encoder_gradient_dot_product": 0.04541376978158951,
        "input_gradient_cosine_similarity": 0.00831126980483532,
        "input_gradient_l2_distance": -0.2893446385860443,
        "input_gradient_dot_product": -0.08524586260318756
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7570149554787955,
      "val_r": 0.690081142653354,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.3806281089782715,
        "right_subspace_overlap_bottom_k": -25.277414321899414,
        "interaction_matrix_overlap_top_k": 20.178415298461914,
        "interaction_matrix_overlap_bottom_k": -20.21345329284668,
        "effective_rank": 3.1346864700317383,
        "effective_rank_mergeability_score": -29.704946517944336,
        "stable_rank": 1.306363821029663,
        "spectral_gap": 2.0728626251220703,
        "singular_value_ratio": 10.028116226196289,
        "layerwise_effective_rank": -29.1379451751709,
        "layerwise_effective_rank_mergeability_score": 16.831382751464844,
        "task_vector_cosine_similarity": -7.606662750244141,
        "task_vector_l2_distance": 7.665400505065918,
        "task_vector_dot_product": -16.620914459228516,
        "weight_space_angle": 14.993346214294434,
        "task_vector_magnitude_ratio": -2.8272852897644043,
        "singular_value_overlap": 18.913448333740234,
        "subspace_overlap": 10.380049705505371,
        "right_subspace_overlap": 45.51665496826172,
        "activation_l2_distance": -5.542779445648193,
        "activation_cosine_similarity": 13.412094116210938,
        "activation_magnitude_ratio": -3.334458351135254,
        "activation_dot_product": 18.969858169555664,
        "encoder_gradient_cosine_similarity": 9.871773719787598,
        "encoder_gradient_l2_distance": -23.94488525390625,
        "encoder_gradient_dot_product": 8.686716079711914,
        "input_gradient_cosine_similarity": 3.4365320205688477,
        "input_gradient_l2_distance": -28.12262535095215,
        "input_gradient_dot_product": -17.446521759033203
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7450042055738386,
      "val_r": 0.600108311518476,
      "n_iterations": 810,
      "coefficients": {
        "right_subspace_overlap_top_k": 17.990571975708008,
        "right_subspace_overlap_bottom_k": -38.47515106201172,
        "interaction_matrix_overlap_top_k": 32.456905364990234,
        "interaction_matrix_overlap_bottom_k": -22.257125854492188,
        "effective_rank": 8.364747047424316,
        "effective_rank_mergeability_score": -19.412843704223633,
        "stable_rank": -29.62567710876465,
        "spectral_gap": -16.214012145996094,
        "singular_value_ratio": 4.9333696365356445,
        "layerwise_effective_rank": -14.368188858032227,
        "layerwise_effective_rank_mergeability_score": 7.386672019958496,
        "task_vector_cosine_similarity": 3.250889778137207,
        "task_vector_l2_distance": 15.855782508850098,
        "task_vector_dot_product": -22.62419319152832,
        "weight_space_angle": 8.745805740356445,
        "task_vector_magnitude_ratio": 1.8317362070083618,
        "singular_value_overlap": 23.708158493041992,
        "subspace_overlap": 20.603736877441406,
        "right_subspace_overlap": 6.472228050231934,
        "activation_l2_distance": -0.6157020330429077,
        "activation_cosine_similarity": 21.990934371948242,
        "activation_magnitude_ratio": 1.0358260869979858,
        "activation_dot_product": 22.459550857543945,
        "encoder_gradient_cosine_similarity": 15.427347183227539,
        "encoder_gradient_l2_distance": -38.84358215332031,
        "encoder_gradient_dot_product": 4.719310760498047,
        "input_gradient_cosine_similarity": 11.52390193939209,
        "input_gradient_l2_distance": -13.096048355102539,
        "input_gradient_dot_product": -12.226838111877441
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7498829939314262,
      "val_r": 0.6420682511804204,
      "n_iterations": 85,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.2925390005111694,
        "right_subspace_overlap_bottom_k": -1.7316539287567139,
        "interaction_matrix_overlap_top_k": -0.042100269347429276,
        "interaction_matrix_overlap_bottom_k": -2.238473892211914,
        "effective_rank": 0.03356708213686943,
        "effective_rank_mergeability_score": 0.45435672998428345,
        "stable_rank": -0.7883796691894531,
        "spectral_gap": -0.2546977400779724,
        "singular_value_ratio": 0.2978520691394806,
        "layerwise_effective_rank": 0.6527330279350281,
        "layerwise_effective_rank_mergeability_score": 1.0377532243728638,
        "task_vector_cosine_similarity": 0.8142478466033936,
        "task_vector_l2_distance": -0.04979197308421135,
        "task_vector_dot_product": 0.6154378652572632,
        "weight_space_angle": -0.9176499247550964,
        "task_vector_magnitude_ratio": 1.063230037689209,
        "singular_value_overlap": 1.0311915874481201,
        "subspace_overlap": 0.07205931842327118,
        "right_subspace_overlap": 0.5652957558631897,
        "activation_l2_distance": -0.7071212530136108,
        "activation_cosine_similarity": 1.4350351095199585,
        "activation_magnitude_ratio": -0.6001010537147522,
        "activation_dot_product": 0.7410061359405518,
        "encoder_gradient_cosine_similarity": 1.0028109550476074,
        "encoder_gradient_l2_distance": -1.6499661207199097,
        "encoder_gradient_dot_product": 0.5921555757522583,
        "input_gradient_cosine_similarity": 0.5122826099395752,
        "input_gradient_l2_distance": -1.1793991327285767,
        "input_gradient_dot_product": -1.0663542747497559
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}