{
  "aggregate_metrics": {
    "train_r": 0.05954233306423309,
    "train_p": 0.0007209904182372171,
    "val_r": 0.0469438283885926,
    "val_p": 0.3758326100172263
  },
  "per_fold_stats": {
    "train_r_mean": 0.7129151001074575,
    "train_r_std": 0.16907927705911063,
    "val_r_mean": 0.5720938309057051,
    "val_r_std": 0.23617021174911804
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": -12.388481140136719,
    "right_subspace_overlap_bottom_k": -11.933205604553223,
    "interaction_matrix_overlap_top_k": 5.7680559158325195,
    "interaction_matrix_overlap_bottom_k": -8.316106796264648,
    "effective_rank": 0.47337284684181213,
    "effective_rank_mergeability_score": -1.0554158687591553,
    "stable_rank": -10.754512786865234,
    "spectral_gap": -23.823974609375,
    "singular_value_ratio": 1.5519731044769287,
    "layerwise_effective_rank": 0.012254871428012848,
    "layerwise_effective_rank_mergeability_score": 15.130328178405762,
    "task_vector_cosine_similarity": 4.670492649078369,
    "task_vector_l2_distance": 14.24102783203125,
    "task_vector_dot_product": 8.995806694030762,
    "weight_space_angle": -11.339395523071289,
    "task_vector_magnitude_ratio": 14.741411209106445,
    "singular_value_overlap": -17.28042221069336,
    "subspace_overlap": 13.968194961547852,
    "activation_l2_distance": 9.226186752319336,
    "activation_cosine_similarity": -6.3594489097595215,
    "activation_magnitude_ratio": 3.034186840057373,
    "activation_dot_product": 22.95903205871582,
    "encoder_gradient_cosine_similarity": 2.6662843227386475,
    "encoder_gradient_l2_distance": -19.534786224365234,
    "encoder_gradient_dot_product": -4.558012008666992,
    "input_gradient_cosine_similarity": 25.422176361083984,
    "input_gradient_l2_distance": -17.593320846557617,
    "input_gradient_dot_product": -0.2432471215724945
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 85.73963928222656,
    "right_subspace_overlap_bottom_k": 40.53670883178711,
    "interaction_matrix_overlap_top_k": 10.846409797668457,
    "interaction_matrix_overlap_bottom_k": 15.87845230102539,
    "effective_rank": 8.724222183227539,
    "effective_rank_mergeability_score": 6.377950668334961,
    "stable_rank": 60.409114837646484,
    "spectral_gap": 97.44283294677734,
    "singular_value_ratio": 17.737674713134766,
    "layerwise_effective_rank": 34.30923080444336,
    "layerwise_effective_rank_mergeability_score": 55.59535598754883,
    "task_vector_cosine_similarity": 16.87018585205078,
    "task_vector_l2_distance": 67.7674560546875,
    "task_vector_dot_product": 49.82279968261719,
    "weight_space_angle": 42.487518310546875,
    "task_vector_magnitude_ratio": 59.512245178222656,
    "singular_value_overlap": 84.89936828613281,
    "subspace_overlap": 41.159912109375,
    "activation_l2_distance": 45.68316650390625,
    "activation_cosine_similarity": 57.81329345703125,
    "activation_magnitude_ratio": 31.20709991455078,
    "activation_dot_product": 57.749549865722656,
    "encoder_gradient_cosine_similarity": 6.593928337097168,
    "encoder_gradient_l2_distance": 31.765899658203125,
    "encoder_gradient_dot_product": 28.25765037536621,
    "input_gradient_cosine_similarity": 97.25479888916016,
    "input_gradient_l2_distance": 45.520912170410156,
    "input_gradient_dot_product": 33.859439849853516
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8432119734357177,
      "val_r": 0.624437176259883,
      "n_iterations": 755,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.33606666326522827,
        "right_subspace_overlap_bottom_k": -1.0041613578796387,
        "interaction_matrix_overlap_top_k": -0.7056594491004944,
        "interaction_matrix_overlap_bottom_k": 0.9330753684043884,
        "effective_rank": 0.6500583291053772,
        "effective_rank_mergeability_score": 0.4315315783023834,
        "stable_rank": -0.2584449350833893,
        "spectral_gap": 0.14966988563537598,
        "singular_value_ratio": 0.538177490234375,
        "layerwise_effective_rank": -0.16582907736301422,
        "layerwise_effective_rank_mergeability_score": -0.18861281871795654,
        "task_vector_cosine_similarity": 0.13793116807937622,
        "task_vector_l2_distance": 0.026381783187389374,
        "task_vector_dot_product": 0.00037112005520612,
        "weight_space_angle": -0.06730930507183075,
        "task_vector_magnitude_ratio": -0.3531762957572937,
        "singular_value_overlap": 0.004861094988882542,
        "subspace_overlap": 0.0638647973537445,
        "activation_l2_distance": 0.22673289477825165,
        "activation_cosine_similarity": 0.4214169979095459,
        "activation_magnitude_ratio": -0.022505760192871094,
        "activation_dot_product": -0.12779507040977478,
        "encoder_gradient_cosine_similarity": 0.004277511965483427,
        "encoder_gradient_l2_distance": -0.15009954571723938,
        "encoder_gradient_dot_product": 0.01455824263393879,
        "input_gradient_cosine_similarity": 0.023242291063070297,
        "input_gradient_l2_distance": -0.1382378190755844,
        "input_gradient_dot_product": -0.03127328306436539
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.63062546750235,
      "val_r": 0.7611123010730378,
      "n_iterations": 453,
      "coefficients": {
        "right_subspace_overlap_top_k": 31.715438842773438,
        "right_subspace_overlap_bottom_k": 21.20713996887207,
        "interaction_matrix_overlap_top_k": 36.18305587768555,
        "interaction_matrix_overlap_bottom_k": -29.097318649291992,
        "effective_rank": 5.864509582519531,
        "effective_rank_mergeability_score": -8.737882614135742,
        "stable_rank": -4.031283378601074,
        "spectral_gap": 4.853992938995361,
        "singular_value_ratio": 1.5875275135040283,
        "layerwise_effective_rank": -37.5926513671875,
        "layerwise_effective_rank_mergeability_score": 11.817087173461914,
        "task_vector_cosine_similarity": 15.764738082885742,
        "task_vector_l2_distance": -30.673200607299805,
        "task_vector_dot_product": -20.981246948242188,
        "weight_space_angle": -18.515642166137695,
        "task_vector_magnitude_ratio": 20.449289321899414,
        "singular_value_overlap": -21.93105125427246,
        "subspace_overlap": 18.121793746948242,
        "activation_l2_distance": 20.349842071533203,
        "activation_cosine_similarity": 41.32864761352539,
        "activation_magnitude_ratio": -23.571611404418945,
        "activation_dot_product": 69.19512176513672,
        "encoder_gradient_cosine_similarity": 0.9970342516899109,
        "encoder_gradient_l2_distance": -69.29620361328125,
        "encoder_gradient_dot_product": -0.05914083495736122,
        "input_gradient_cosine_similarity": 19.975317001342773,
        "input_gradient_l2_distance": -34.353981018066406,
        "input_gradient_dot_product": -51.72001647949219
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7875025351026855,
      "val_r": 0.7681276555980405,
      "n_iterations": 925,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.811177968978882,
        "right_subspace_overlap_bottom_k": -6.979704856872559,
        "interaction_matrix_overlap_top_k": 3.829671859741211,
        "interaction_matrix_overlap_bottom_k": -3.289543628692627,
        "effective_rank": 1.1648082733154297,
        "effective_rank_mergeability_score": -1.7032721042633057,
        "stable_rank": -0.1537436693906784,
        "spectral_gap": 0.0006213507149368525,
        "singular_value_ratio": 1.047438621520996,
        "layerwise_effective_rank": -2.394702434539795,
        "layerwise_effective_rank_mergeability_score": 3.039781093597412,
        "task_vector_cosine_similarity": -0.5889833569526672,
        "task_vector_l2_distance": 0.31290584802627563,
        "task_vector_dot_product": -0.054278817027807236,
        "weight_space_angle": 4.007694244384766,
        "task_vector_magnitude_ratio": 0.02193390764296055,
        "singular_value_overlap": 2.7103660106658936,
        "subspace_overlap": -1.2861822843551636,
        "activation_l2_distance": -0.3660050630569458,
        "activation_cosine_similarity": 5.676599979400635,
        "activation_magnitude_ratio": -1.2510045766830444,
        "activation_dot_product": 2.32784366607666,
        "encoder_gradient_cosine_similarity": 1.340073823928833,
        "encoder_gradient_l2_distance": -9.995052337646484,
        "encoder_gradient_dot_product": 0.3848118185997009,
        "input_gradient_cosine_similarity": 1.792297124862671,
        "input_gradient_l2_distance": -5.563611030578613,
        "input_gradient_dot_product": -4.114187717437744
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.767179669576615,
      "val_r": 0.7122568817862339,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.9688374996185303,
        "right_subspace_overlap_bottom_k": -3.3981096744537354,
        "interaction_matrix_overlap_top_k": 3.1760213375091553,
        "interaction_matrix_overlap_bottom_k": -3.6064774990081787,
        "effective_rank": -0.5191564559936523,
        "effective_rank_mergeability_score": 0.0243811197578907,
        "stable_rank": 1.8598450422286987,
        "spectral_gap": 0.9282793998718262,
        "singular_value_ratio": 1.3504478931427002,
        "layerwise_effective_rank": -0.9644550681114197,
        "layerwise_effective_rank_mergeability_score": 1.7526496648788452,
        "task_vector_cosine_similarity": -2.376957416534424,
        "task_vector_l2_distance": -0.18450286984443665,
        "task_vector_dot_product": -0.7777758240699768,
        "weight_space_angle": 1.7584434747695923,
        "task_vector_magnitude_ratio": -0.1653328686952591,
        "singular_value_overlap": 2.196282386779785,
        "subspace_overlap": -3.0841007232666016,
        "activation_l2_distance": 0.1244383230805397,
        "activation_cosine_similarity": 3.778412103652954,
        "activation_magnitude_ratio": -1.0314241647720337,
        "activation_dot_product": 1.9947893619537354,
        "encoder_gradient_cosine_similarity": 1.8992784023284912,
        "encoder_gradient_l2_distance": -8.863323211669922,
        "encoder_gradient_dot_product": 0.3002949357032776,
        "input_gradient_cosine_similarity": 0.44082796573638916,
        "input_gradient_l2_distance": -2.9008638858795166,
        "input_gradient_dot_product": -2.3724520206451416
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.07267915202221355,
      "val_r": -0.10818127572371926,
      "n_iterations": 586,
      "coefficients": {
        "right_subspace_overlap_top_k": -382.7597351074219,
        "right_subspace_overlap_bottom_k": -175.78106689453125,
        "interaction_matrix_overlap_top_k": 11.432040214538574,
        "interaction_matrix_overlap_bottom_k": -52.605308532714844,
        "effective_rank": 4.118983268737793,
        "effective_rank_mergeability_score": -21.146501541137695,
        "stable_rank": -268.9131774902344,
        "spectral_gap": -444.63323974609375,
        "singular_value_ratio": 52.32694625854492,
        "layerwise_effective_rank": 127.77559661865234,
        "layerwise_effective_rank_mergeability_score": 256.7837829589844,
        "task_vector_cosine_similarity": 22.515165328979492,
        "task_vector_l2_distance": 307.40716552734375,
        "task_vector_dot_product": 218.1765594482422,
        "weight_space_angle": -189.11685180664062,
        "task_vector_magnitude_ratio": 272.19097900390625,
        "singular_value_overlap": -384.61480712890625,
        "subspace_overlap": 181.02410888671875,
        "activation_l2_distance": 205.77243041992188,
        "activation_cosine_similarity": -253.8848876953125,
        "activation_magnitude_ratio": 135.4272918701172,
        "activation_dot_product": 259.70806884765625,
        "encoder_gradient_cosine_similarity": -9.003602027893066,
        "encoder_gradient_l2_distance": -97.89197540283203,
        "encoder_gradient_dot_product": -125.3955078125,
        "input_gradient_cosine_similarity": 448.21270751953125,
        "input_gradient_l2_distance": -209.84432983398438,
        "input_gradient_dot_product": 121.61296844482422
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7814192560200434,
      "val_r": 0.7546687866917964,
      "n_iterations": 576,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.248471975326538,
        "right_subspace_overlap_bottom_k": -2.3772852420806885,
        "interaction_matrix_overlap_top_k": 0.1750672459602356,
        "interaction_matrix_overlap_bottom_k": -0.6715528964996338,
        "effective_rank": 0.6981467008590698,
        "effective_rank_mergeability_score": -0.43726229667663574,
        "stable_rank": -0.2408614605665207,
        "spectral_gap": 0.4666108787059784,
        "singular_value_ratio": 0.10980278253555298,
        "layerwise_effective_rank": -0.1552230566740036,
        "layerwise_effective_rank_mergeability_score": 1.4796572923660278,
        "task_vector_cosine_similarity": -0.8627086877822876,
        "task_vector_l2_distance": -0.11240343004465103,
        "task_vector_dot_product": -1.0197749137878418,
        "weight_space_angle": 0.6700095534324646,
        "task_vector_magnitude_ratio": 0.5794897675514221,
        "singular_value_overlap": 0.890555739402771,
        "subspace_overlap": -0.4794408679008484,
        "activation_l2_distance": -0.3980556130409241,
        "activation_cosine_similarity": 1.7928202152252197,
        "activation_magnitude_ratio": -0.5573523044586182,
        "activation_dot_product": 0.9316542744636536,
        "encoder_gradient_cosine_similarity": 0.9341663122177124,
        "encoder_gradient_l2_distance": -2.736616849899292,
        "encoder_gradient_dot_product": 0.13359694182872772,
        "input_gradient_cosine_similarity": 0.42676734924316406,
        "input_gradient_l2_distance": -1.9818482398986816,
        "input_gradient_dot_product": -0.9481483101844788
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.47019737373259846,
      "val_r": 0.5183859513951935,
      "n_iterations": 249,
      "coefficients": {
        "right_subspace_overlap_top_k": 12.632804870605469,
        "right_subspace_overlap_bottom_k": 28.190765380859375,
        "interaction_matrix_overlap_top_k": 1.5586925745010376,
        "interaction_matrix_overlap_bottom_k": -3.7606561183929443,
        "effective_rank": 16.667537689208984,
        "effective_rank_mergeability_score": -4.5084381103515625,
        "stable_rank": 11.64055061340332,
        "spectral_gap": -9.279661178588867,
        "singular_value_ratio": -23.65556526184082,
        "layerwise_effective_rank": -16.256179809570312,
        "layerwise_effective_rank_mergeability_score": 10.174481391906738,
        "task_vector_cosine_similarity": 49.073158264160156,
        "task_vector_l2_distance": 1.5771174430847168,
        "task_vector_dot_product": 24.491500854492188,
        "weight_space_angle": -11.255659103393555,
        "task_vector_magnitude_ratio": -19.95644187927246,
        "singular_value_overlap": -8.511641502380371,
        "subspace_overlap": 11.99013614654541,
        "activation_l2_distance": -16.20970916748047,
        "activation_cosine_similarity": 15.287354469299316,
        "activation_magnitude_ratio": -17.396617889404297,
        "activation_dot_product": 25.722171783447266,
        "encoder_gradient_cosine_similarity": 10.175907135009766,
        "encoder_gradient_l2_distance": -38.39264678955078,
        "encoder_gradient_dot_product": 22.401691436767578,
        "input_gradient_cosine_similarity": -4.499596118927002,
        "input_gradient_l2_distance": -32.98612594604492,
        "input_gradient_dot_product": -55.57188415527344
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6821303179574187,
      "val_r": 0.3134516404374732,
      "n_iterations": 67,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5568249821662903,
        "right_subspace_overlap_bottom_k": -0.8913367986679077,
        "interaction_matrix_overlap_top_k": -0.029069121927022934,
        "interaction_matrix_overlap_bottom_k": -0.015556562691926956,
        "effective_rank": -0.8194679021835327,
        "effective_rank_mergeability_score": -0.4953983724117279,
        "stable_rank": 0.32977762818336487,
        "spectral_gap": 0.06076183542609215,
        "singular_value_ratio": 0.4422184228897095,
        "layerwise_effective_rank": -0.6323999166488647,
        "layerwise_effective_rank_mergeability_score": 0.012510208413004875,
        "task_vector_cosine_similarity": 0.7419904470443726,
        "task_vector_l2_distance": -0.3826580047607422,
        "task_vector_dot_product": -0.8241767883300781,
        "weight_space_angle": -0.22767159342765808,
        "task_vector_magnitude_ratio": 0.14985086023807526,
        "singular_value_overlap": 0.4343312978744507,
        "subspace_overlap": 0.28241458535194397,
        "activation_l2_distance": 0.863508939743042,
        "activation_cosine_similarity": 0.8625921607017517,
        "activation_magnitude_ratio": -0.24546346068382263,
        "activation_dot_product": 0.9967506527900696,
        "encoder_gradient_cosine_similarity": -0.1658569574356079,
        "encoder_gradient_l2_distance": -0.5127027034759521,
        "encoder_gradient_dot_product": -0.36434102058410645,
        "input_gradient_cosine_similarity": 0.21348734200000763,
        "input_gradient_l2_distance": -0.5916507244110107,
        "input_gradient_dot_product": 0.41983747482299805
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7792882052109729,
      "val_r": 0.4176106122687662,
      "n_iterations": 83,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.49815258383750916,
        "right_subspace_overlap_bottom_k": -0.3691945970058441,
        "interaction_matrix_overlap_top_k": 0.06109943240880966,
        "interaction_matrix_overlap_bottom_k": -0.46079668402671814,
        "effective_rank": 0.12778982520103455,
        "effective_rank_mergeability_score": 0.03150952607393265,
        "stable_rank": 0.1293434500694275,
        "spectral_gap": -0.11231713742017746,
        "singular_value_ratio": -0.030985193327069283,
        "layerwise_effective_rank": -0.3765500783920288,
        "layerwise_effective_rank_mergeability_score": 0.2699086368083954,
        "task_vector_cosine_similarity": -0.14612920582294464,
        "task_vector_l2_distance": -0.14380039274692535,
        "task_vector_dot_product": 0.17046009004116058,
        "weight_space_angle": 0.45651283860206604,
        "task_vector_magnitude_ratio": 0.033576373010873795,
        "singular_value_overlap": 0.3439098000526428,
        "subspace_overlap": 0.06068603694438934,
        "activation_l2_distance": 0.18471668660640717,
        "activation_cosine_similarity": 0.5175228714942932,
        "activation_magnitude_ratio": -0.09087852388620377,
        "activation_dot_product": 0.5247889757156372,
        "encoder_gradient_cosine_similarity": 0.24694199860095978,
        "encoder_gradient_l2_distance": -0.9272489547729492,
        "encoder_gradient_dot_product": 0.1533416509628296,
        "input_gradient_cosine_similarity": 0.24651360511779785,
        "input_gradient_l2_distance": -0.6524206399917603,
        "input_gradient_dot_product": -0.2849400043487549
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7428344066610473,
      "val_r": 0.3334998920391954,
      "n_iterations": 98,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.1285083293914795,
        "right_subspace_overlap_bottom_k": -1.5169998407363892,
        "interaction_matrix_overlap_top_k": 1.472669243812561,
        "interaction_matrix_overlap_bottom_k": -1.4228301048278809,
        "effective_rank": -0.2836264669895172,
        "effective_rank_mergeability_score": -0.14255455136299133,
        "stable_rank": 0.45327070355415344,
        "spectral_gap": 0.07190871238708496,
        "singular_value_ratio": 1.0072267055511475,
        "layerwise_effective_rank": -1.3287073373794556,
        "layerwise_effective_rank_mergeability_score": 1.4955896139144897,
        "task_vector_cosine_similarity": -1.1221261024475098,
        "task_vector_l2_distance": -0.8661501407623291,
        "task_vector_dot_product": -1.263140082359314,
        "weight_space_angle": -0.20089906454086304,
        "task_vector_magnitude_ratio": 0.49102136492729187,
        "singular_value_overlap": 1.0105040073394775,
        "subspace_overlap": 1.0835074186325073,
        "activation_l2_distance": 1.3904787302017212,
        "activation_cosine_similarity": -0.1306711584329605,
        "activation_magnitude_ratio": 0.2874927222728729,
        "activation_dot_product": 0.3111374080181122,
        "encoder_gradient_cosine_similarity": 1.4891165494918823,
        "encoder_gradient_l2_distance": -2.3057124614715576,
        "encoder_gradient_dot_product": 0.12048022449016571,
        "input_gradient_cosine_similarity": 0.6223673820495605,
        "input_gradient_l2_distance": -1.654996633529663,
        "input_gradient_dot_product": -1.3016875982284546
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8050093023203586,
      "val_r": 0.36517788480854707,
      "n_iterations": 59,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.34528571367263794,
        "right_subspace_overlap_bottom_k": -0.17004962265491486,
        "interaction_matrix_overlap_top_k": 0.13024722039699554,
        "interaction_matrix_overlap_bottom_k": -0.20672288537025452,
        "effective_rank": 0.0643543154001236,
        "effective_rank_mergeability_score": 0.11906665563583374,
        "stable_rank": -0.0034359225537627935,
        "spectral_gap": 0.19067691266536713,
        "singular_value_ratio": 0.17988118529319763,
        "layerwise_effective_rank": 0.17682047188282013,
        "layerwise_effective_rank_mergeability_score": 0.1938333660364151,
        "task_vector_cosine_similarity": 0.038492415100336075,
        "task_vector_l2_distance": 0.03888577222824097,
        "task_vector_dot_product": -0.1843956857919693,
        "weight_space_angle": 0.1907113641500473,
        "task_vector_magnitude_ratio": 0.07073375582695007,
        "singular_value_overlap": 0.20203319191932678,
        "subspace_overlap": -0.27167555689811707,
        "activation_l2_distance": -0.11740323156118393,
        "activation_cosine_similarity": 0.18900999426841736,
        "activation_magnitude_ratio": -0.06985064595937729,
        "activation_dot_product": 0.18560239672660828,
        "encoder_gradient_cosine_similarity": 0.03710922226309776,
        "encoder_gradient_l2_distance": -0.3647317886352539,
        "encoder_gradient_dot_product": -0.016661206260323524,
        "input_gradient_cosine_similarity": 0.05926552042365074,
        "input_gradient_l2_distance": -0.18397466838359833,
        "input_gradient_dot_product": -0.07067599892616272
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7653375458191876,
      "val_r": 0.7689686951069947,
      "n_iterations": 114,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.6563475728034973,
        "right_subspace_overlap_bottom_k": -1.7885732650756836,
        "interaction_matrix_overlap_top_k": -0.013325436972081661,
        "interaction_matrix_overlap_bottom_k": 0.7397395968437195,
        "effective_rank": 0.1088065505027771,
        "effective_rank_mergeability_score": 0.10253474116325378,
        "stable_rank": 0.30016303062438965,
        "spectral_gap": -0.1620228886604309,
        "singular_value_ratio": -0.064505934715271,
        "layerwise_effective_rank": -0.38041162490844727,
        "layerwise_effective_rank_mergeability_score": 0.08031825721263885,
        "task_vector_cosine_similarity": -0.17221160233020782,
        "task_vector_l2_distance": 0.04762644320726395,
        "task_vector_dot_product": -0.2607119679450989,
        "weight_space_angle": 0.6261075735092163,
        "task_vector_magnitude_ratio": 0.023814763873815536,
        "singular_value_overlap": 0.4097749590873718,
        "subspace_overlap": 0.4164641499519348,
        "activation_l2_distance": 0.17390364408493042,
        "activation_cosine_similarity": 0.79929119348526,
        "activation_magnitude_ratio": -0.18801969289779663,
        "activation_dot_product": 0.3590519428253174,
        "encoder_gradient_cosine_similarity": 0.19224494695663452,
        "encoder_gradient_l2_distance": -0.40040844678878784,
        "encoder_gradient_dot_product": 0.21358661353588104,
        "input_gradient_cosine_similarity": 0.1886124610900879,
        "input_gradient_l2_distance": -1.3603184223175049,
        "input_gradient_dot_product": -0.33263346552848816
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7768612932876333,
      "val_r": 0.7592335106905898,
      "n_iterations": 449,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.257063627243042,
        "right_subspace_overlap_bottom_k": -1.4787765741348267,
        "interaction_matrix_overlap_top_k": 0.39840275049209595,
        "interaction_matrix_overlap_bottom_k": -1.3234899044036865,
        "effective_rank": 2.63679575920105,
        "effective_rank_mergeability_score": -0.23547302186489105,
        "stable_rank": -0.17532889544963837,
        "spectral_gap": 0.14372332394123077,
        "singular_value_ratio": 0.6966351866722107,
        "layerwise_effective_rank": -1.172267198562622,
        "layerwise_effective_rank_mergeability_score": 1.6594934463500977,
        "task_vector_cosine_similarity": 0.2770856022834778,
        "task_vector_l2_distance": 0.7784809470176697,
        "task_vector_dot_product": -1.0250219106674194,
        "weight_space_angle": -0.4491916298866272,
        "task_vector_magnitude_ratio": -0.41211140155792236,
        "singular_value_overlap": 0.7372311353683472,
        "subspace_overlap": -1.1444933414459229,
        "activation_l2_distance": -0.5137264728546143,
        "activation_cosine_similarity": 1.1621599197387695,
        "activation_magnitude_ratio": -0.22136101126670837,
        "activation_dot_product": 0.4000649154186249,
        "encoder_gradient_cosine_similarity": 0.5194888114929199,
        "encoder_gradient_l2_distance": -1.8845518827438354,
        "encoder_gradient_dot_product": 0.5514780879020691,
        "input_gradient_cosine_similarity": 0.28792452812194824,
        "input_gradient_l2_distance": -1.6835750341415405,
        "input_gradient_dot_product": -0.8967610597610474
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8234862777753255,
      "val_r": 0.8279428280953943,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.7759451866149902,
        "right_subspace_overlap_bottom_k": -5.454409122467041,
        "interaction_matrix_overlap_top_k": -0.7295991778373718,
        "interaction_matrix_overlap_bottom_k": 3.4413137435913086,
        "effective_rank": 1.146902084350586,
        "effective_rank_mergeability_score": -3.5537109375,
        "stable_rank": -2.589496374130249,
        "spectral_gap": 0.12014088779687881,
        "singular_value_ratio": 1.7137197256088257,
        "layerwise_effective_rank": -0.5486184358596802,
        "layerwise_effective_rank_mergeability_score": 2.0950522422790527,
        "task_vector_cosine_similarity": 1.9685311317443848,
        "task_vector_l2_distance": 0.46248582005500793,
        "task_vector_dot_product": 0.02997428923845291,
        "weight_space_angle": 2.502856731414795,
        "task_vector_magnitude_ratio": -1.2056981325149536,
        "singular_value_overlap": 0.15672358870506287,
        "subspace_overlap": -1.818886399269104,
        "activation_l2_distance": 0.61348956823349,
        "activation_cosine_similarity": 2.6784424781799316,
        "activation_magnitude_ratio": -0.12747640907764435,
        "activation_dot_product": -0.6694826483726501,
        "encoder_gradient_cosine_similarity": 0.30019086599349976,
        "encoder_gradient_l2_distance": -2.473510503768921,
        "encoder_gradient_dot_product": 0.15945257246494293,
        "input_gradient_cosine_similarity": 0.24722513556480408,
        "input_gradient_l2_distance": -1.3300011157989502,
        "input_gradient_dot_product": -0.696929395198822
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7911974470555729,
      "val_r": 0.7499612881760296,
      "n_iterations": 468,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.2640007734298706,
        "right_subspace_overlap_bottom_k": -2.2648446559906006,
        "interaction_matrix_overlap_top_k": 1.247021198272705,
        "interaction_matrix_overlap_bottom_k": 0.4710179567337036,
        "effective_rank": 0.5449826121330261,
        "effective_rank_mergeability_score": -0.33369243144989014,
        "stable_rank": -0.459612637758255,
        "spectral_gap": 0.6186997294425964,
        "singular_value_ratio": 0.8442904949188232,
        "layerwise_effective_rank": 0.12367784976959229,
        "layerwise_effective_rank_mergeability_score": 0.8937597870826721,
        "task_vector_cosine_similarity": 0.8319021463394165,
        "task_vector_l2_distance": 0.4928478002548218,
        "task_vector_dot_product": -1.9842305183410645,
        "weight_space_angle": 0.6357865929603577,
        "task_vector_magnitude_ratio": 0.09694930911064148,
        "singular_value_overlap": 0.5672030448913574,
        "subspace_overlap": -0.29356124997138977,
        "activation_l2_distance": -0.7156702280044556,
        "activation_cosine_similarity": 0.47695454955101013,
        "activation_magnitude_ratio": -0.24923381209373474,
        "activation_dot_product": 0.5270642042160034,
        "encoder_gradient_cosine_similarity": 0.3504374623298645,
        "encoder_gradient_l2_distance": -2.1046767234802246,
        "encoder_gradient_dot_product": 0.07488670200109482,
        "input_gradient_cosine_similarity": 0.1969723254442215,
        "input_gradient_l2_distance": -1.0494369268417358,
        "input_gradient_dot_product": -0.38037028908729553
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.8003169226035622,
      "val_r": 0.23382663201100617,
      "n_iterations": 73,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.4405422508716583,
        "right_subspace_overlap_bottom_k": -0.3783400356769562,
        "interaction_matrix_overlap_top_k": 0.20754587650299072,
        "interaction_matrix_overlap_bottom_k": -0.35982412099838257,
        "effective_rank": -0.03520474582910538,
        "effective_rank_mergeability_score": 0.13445375859737396,
        "stable_rank": 0.10339535772800446,
        "spectral_gap": 0.005936863832175732,
        "singular_value_ratio": 0.18527960777282715,
        "layerwise_effective_rank": 0.17103919386863708,
        "layerwise_effective_rank_mergeability_score": 0.2715774476528168,
        "task_vector_cosine_similarity": -0.3091590106487274,
        "task_vector_l2_distance": -0.22188463807106018,
        "task_vector_dot_product": 0.09798107296228409,
        "weight_space_angle": 0.3918997645378113,
        "task_vector_magnitude_ratio": -0.12369544059038162,
        "singular_value_overlap": 0.5315550565719604,
        "subspace_overlap": -0.2879129648208618,
        "activation_l2_distance": 0.21031300723552704,
        "activation_cosine_similarity": 0.4232300817966461,
        "activation_magnitude_ratio": -0.13471995294094086,
        "activation_dot_product": 0.24012838304042816,
        "encoder_gradient_cosine_similarity": 0.16983895003795624,
        "encoder_gradient_l2_distance": -0.7211109399795532,
        "encoder_gradient_dot_product": 0.13337980210781097,
        "input_gradient_cosine_similarity": 0.013480677269399166,
        "input_gradient_l2_distance": -0.39178887009620667,
        "input_gradient_dot_product": -0.4398265480995178
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6726940707065312,
      "val_r": 0.7067085469378984,
      "n_iterations": 176,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.7010505199432373,
        "right_subspace_overlap_bottom_k": -4.5249433517456055,
        "interaction_matrix_overlap_top_k": 3.777621269226074,
        "interaction_matrix_overlap_bottom_k": -4.307299613952637,
        "effective_rank": -0.672272801399231,
        "effective_rank_mergeability_score": 2.264430284500122,
        "stable_rank": -3.2354109287261963,
        "spectral_gap": -0.17994500696659088,
        "singular_value_ratio": 2.0955984592437744,
        "layerwise_effective_rank": 0.1913464069366455,
        "layerwise_effective_rank_mergeability_score": 0.25054091215133667,
        "task_vector_cosine_similarity": 3.4590234756469727,
        "task_vector_l2_distance": -1.2249521017074585,
        "task_vector_dot_product": -2.0723907947540283,
        "weight_space_angle": -3.750706672668457,
        "task_vector_magnitude_ratio": 2.0985517501831055,
        "singular_value_overlap": 1.7181135416030884,
        "subspace_overlap": 4.342205047607422,
        "activation_l2_distance": -2.0523650646209717,
        "activation_cosine_similarity": 1.5822925567626953,
        "activation_magnitude_ratio": -2.2410662174224854,
        "activation_dot_product": 1.881619930267334,
        "encoder_gradient_cosine_similarity": 3.8484485149383545,
        "encoder_gradient_l2_distance": -4.505284309387207,
        "encoder_gradient_dot_product": 1.9934821128845215,
        "input_gradient_cosine_similarity": 0.9724401235580444,
        "input_gradient_l2_distance": -3.7949178218841553,
        "input_gradient_dot_product": -3.2499125003814697
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7077298201911597,
      "val_r": 0.5865321666679474,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.065814971923828,
        "right_subspace_overlap_bottom_k": -26.50501251220703,
        "interaction_matrix_overlap_top_k": 31.798152923583984,
        "interaction_matrix_overlap_bottom_k": -48.020076751708984,
        "effective_rank": -32.8642692565918,
        "effective_rank_mergeability_score": 16.401031494140625,
        "stable_rank": -3.596881151199341,
        "spectral_gap": 22.830904006958008,
        "singular_value_ratio": 34.44514846801758,
        "layerwise_effective_rank": 7.446932792663574,
        "layerwise_effective_rank_mergeability_score": -4.326684951782227,
        "task_vector_cosine_similarity": -36.501129150390625,
        "task_vector_l2_distance": -10.353500366210938,
        "task_vector_dot_product": 15.505178451538086,
        "weight_space_angle": -41.6796989440918,
        "task_vector_magnitude_ratio": 16.009382247924805,
        "singular_value_overlap": 31.4888916015625,
        "subspace_overlap": 5.136775016784668,
        "activation_l2_distance": -4.136829376220703,
        "activation_cosine_similarity": 22.929670333862305,
        "activation_magnitude_ratio": -20.046144485473633,
        "activation_dot_product": 47.299072265625,
        "encoder_gradient_cosine_similarity": 22.894670486450195,
        "encoder_gradient_l2_distance": -44.52397155761719,
        "encoder_gradient_dot_product": 11.714661598205566,
        "input_gradient_cosine_similarity": 15.047340393066406,
        "input_gradient_l2_distance": -29.959510803222656,
        "input_gradient_dot_product": -35.933250427246094
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7161586021992824,
      "val_r": 0.6237890205923665,
      "n_iterations": 682,
      "coefficients": {
        "right_subspace_overlap_top_k": 43.28005599975586,
        "right_subspace_overlap_bottom_k": -52.294471740722656,
        "interaction_matrix_overlap_top_k": 22.779083251953125,
        "interaction_matrix_overlap_bottom_k": -20.65715980529785,
        "effective_rank": 10.235139846801758,
        "effective_rank_mergeability_score": 1.1312564611434937,
        "stable_rank": 52.88890075683594,
        "spectral_gap": -54.0393180847168,
        "singular_value_ratio": -42.897335052490234,
        "layerwise_effective_rank": -73.97225189208984,
        "layerwise_effective_rank_mergeability_score": 12.919535636901855,
        "task_vector_cosine_similarity": 40.083438873291016,
        "task_vector_l2_distance": 18.722503662109375,
        "task_vector_dot_product": -48.678279876708984,
        "weight_space_angle": 25.68428611755371,
        "task_vector_magnitude_ratio": 3.1902575492858887,
        "singular_value_overlap": 25.249874114990234,
        "subspace_overlap": 66.9190902709961,
        "activation_l2_distance": -19.892440795898438,
        "activation_cosine_similarity": 25.828508377075195,
        "activation_magnitude_ratio": -7.260921955108643,
        "activation_dot_product": 45.698665618896484,
        "encoder_gradient_cosine_similarity": 16.669776916503906,
        "encoder_gradient_l2_distance": -98.63422393798828,
        "encoder_gradient_dot_product": -4.15535306930542,
        "input_gradient_cosine_similarity": 23.447471618652344,
        "input_gradient_l2_distance": -18.91252899169922,
        "input_gradient_dot_product": 32.368995666503906
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8424423629688731,
      "val_r": 0.7243664232014276,
      "n_iterations": 567,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.3077350854873657,
        "right_subspace_overlap_bottom_k": -0.8847150802612305,
        "interaction_matrix_overlap_top_k": -1.3876277208328247,
        "interaction_matrix_overlap_bottom_k": -2.1026530265808105,
        "effective_rank": 0.6326413154602051,
        "effective_rank_mergeability_score": -0.4543275237083435,
        "stable_rank": 0.8622092008590698,
        "spectral_gap": 1.4850059747695923,
        "singular_value_ratio": -0.8824792504310608,
        "layerwise_effective_rank": 0.2999298870563507,
        "layerwise_effective_rank_mergeability_score": 1.932347059249878,
        "task_vector_cosine_similarity": 0.5978073477745056,
        "task_vector_l2_distance": -0.882856011390686,
        "task_vector_dot_product": 0.5695643424987793,
        "weight_space_angle": 1.551405429840088,
        "task_vector_magnitude_ratio": 1.6388468742370605,
        "singular_value_overlap": 0.7968055605888367,
        "subspace_overlap": -1.4108506441116333,
        "activation_l2_distance": -0.9839158058166504,
        "activation_cosine_similarity": 1.0916756391525269,
        "activation_magnitude_ratio": -0.3254091143608093,
        "activation_dot_product": 1.6743332147598267,
        "encoder_gradient_cosine_similarity": 0.4261419475078583,
        "encoder_gradient_l2_distance": -4.011712551116943,
        "encoder_gradient_dot_product": 0.4810596704483032,
        "input_gradient_cosine_similarity": 0.5288380980491638,
        "input_gradient_l2_distance": -2.5323522090911865,
        "input_gradient_dot_product": -0.9217965602874756
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}