{
  "weight_avg": {
    "aggregate_metrics": {
      "train_mse": 65.79623127721104,
      "train_r2": -16117.626068648115,
      "train_pearson_r": 0.07062355252309695,
      "train_pearson_p": 6.0146370816548416e-05,
      "val_mse": 90.3225586423997,
      "val_r2": -22126.03541227111,
      "val_pearson_r": -0.06616280631831493,
      "val_pearson_p": 0.21172002583663055
    },
    "per_fold_stats": {
      "train_mse_mean": 66.0003218085351,
      "train_mse_std": 196.43723756756944,
      "val_mse_mean": 88.44176990727794,
      "val_mse_std": 285.64235820484515,
      "train_r_mean": 0.23314818778393867,
      "train_r_std": 0.22833233962500848,
      "val_r_mean": 0.18687256302310465,
      "val_r_std": 0.35235980022069285
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 1.8058252334594727,
      "right_subspace_overlap_bottom_k": -1.3870881795883179,
      "interaction_matrix_overlap_top_k": 0.8444067239761353,
      "interaction_matrix_overlap_bottom_k": 1.2753050327301025,
      "effective_rank": 1.5006048679351807,
      "effective_rank_mergeability_score": 0.00985858403146267,
      "stable_rank": 1.307286024093628,
      "spectral_gap": -1.4312965869903564,
      "singular_value_ratio": -2.8738560676574707,
      "layerwise_effective_rank": -1.5182852745056152,
      "layerwise_effective_rank_mergeability_score": -0.5700728297233582,
      "task_vector_cosine_similarity": -0.6403070688247681,
      "task_vector_l2_distance": 0.09525584429502487,
      "task_vector_dot_product": 0.39443689584732056,
      "weight_space_angle": -1.3025461435317993,
      "task_vector_magnitude_ratio": 0.3075953423976898,
      "singular_value_overlap": 1.067650556564331,
      "subspace_overlap": 1.3921890258789062,
      "right_subspace_overlap": -1.7947447299957275,
      "activation_l2_distance": -0.5298110246658325,
      "activation_cosine_similarity": 0.8698446154594421,
      "activation_magnitude_ratio": 0.5118957757949829,
      "activation_dot_product": 0.2537786066532135,
      "encoder_gradient_cosine_similarity": 1.532606601715088,
      "encoder_gradient_l2_distance": -0.5751479864120483,
      "encoder_gradient_dot_product": 0.4765914976596832,
      "input_gradient_cosine_similarity": -1.2081639766693115,
      "input_gradient_l2_distance": -0.41626840829849243,
      "input_gradient_dot_product": 1.5912938117980957
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 5.105084419250488,
      "right_subspace_overlap_bottom_k": 7.868483543395996,
      "interaction_matrix_overlap_top_k": 3.99006724357605,
      "interaction_matrix_overlap_bottom_k": 3.1081314086914062,
      "effective_rank": 4.639261245727539,
      "effective_rank_mergeability_score": 1.9102100133895874,
      "stable_rank": 5.668040752410889,
      "spectral_gap": 8.164864540100098,
      "singular_value_ratio": 8.715383529663086,
      "layerwise_effective_rank": 6.2415900230407715,
      "layerwise_effective_rank_mergeability_score": 3.7116498947143555,
      "task_vector_cosine_similarity": 5.086080551147461,
      "task_vector_l2_distance": 1.4514036178588867,
      "task_vector_dot_product": 3.163069725036621,
      "weight_space_angle": 6.166738033294678,
      "task_vector_magnitude_ratio": 5.634439945220947,
      "singular_value_overlap": 4.105656623840332,
      "subspace_overlap": 7.451869487762451,
      "right_subspace_overlap": 5.263078212738037,
      "activation_l2_distance": 3.455319404602051,
      "activation_cosine_similarity": 6.879420757293701,
      "activation_magnitude_ratio": 1.882379174232483,
      "activation_dot_product": 3.6240499019622803,
      "encoder_gradient_cosine_similarity": 5.814236164093018,
      "encoder_gradient_l2_distance": 4.5888872146606445,
      "encoder_gradient_dot_product": 3.2293033599853516,
      "input_gradient_cosine_similarity": 5.052158355712891,
      "input_gradient_l2_distance": 8.169217109680176,
      "input_gradient_dot_product": 4.96410608291626
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.006494030915670673,
        "train_r2": -0.6421228444603617,
        "train_pearson_r": 0.5502301533513804,
        "val_mse": 0.005995544139338355,
        "val_r2": -2.0396282759634987,
        "val_pearson_r": 0.5412642194579437,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.5015450716018677,
          "right_subspace_overlap_bottom_k": 0.10363337397575378,
          "interaction_matrix_overlap_top_k": -0.6193697452545166,
          "interaction_matrix_overlap_bottom_k": -0.2125515341758728,
          "effective_rank": 0.22710831463336945,
          "effective_rank_mergeability_score": -0.045060690492391586,
          "stable_rank": 0.04158557951450348,
          "spectral_gap": 0.054597336798906326,
          "singular_value_ratio": -0.3537108898162842,
          "layerwise_effective_rank": 0.060531772673130035,
          "layerwise_effective_rank_mergeability_score": 0.24425353109836578,
          "task_vector_cosine_similarity": -0.06813260912895203,
          "task_vector_l2_distance": 0.048835862427949905,
          "task_vector_dot_product": -0.11705438792705536,
          "weight_space_angle": 0.04085724055767059,
          "task_vector_magnitude_ratio": 0.2987034320831299,
          "singular_value_overlap": 0.040603116154670715,
          "subspace_overlap": 0.04257604479789734,
          "right_subspace_overlap": 0.08585675805807114,
          "activation_l2_distance": 0.5054065585136414,
          "activation_cosine_similarity": 0.7095668315887451,
          "activation_magnitude_ratio": 0.004388925153762102,
          "activation_dot_product": -0.2056703418493271,
          "encoder_gradient_cosine_similarity": 0.028838496655225754,
          "encoder_gradient_l2_distance": -0.1839449405670166,
          "encoder_gradient_dot_product": 0.06832937151193619,
          "input_gradient_cosine_similarity": -0.10361086577177048,
          "input_gradient_l2_distance": -0.11409493535757065,
          "input_gradient_dot_product": -0.08384513854980469
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.017618485366996044,
        "train_r2": -3.230767285701382,
        "train_pearson_r": 0.3611250928545767,
        "val_mse": 0.016266523948033147,
        "val_r2": -7.318835538134424,
        "val_pearson_r": 0.11486767448792917,
        "n_iterations": 60,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.04346197098493576,
          "right_subspace_overlap_bottom_k": -0.028818411752581596,
          "interaction_matrix_overlap_top_k": -0.13633374869823456,
          "interaction_matrix_overlap_bottom_k": -0.04926997423171997,
          "effective_rank": 0.0968763530254364,
          "effective_rank_mergeability_score": 0.21399913728237152,
          "stable_rank": 0.09424205869436264,
          "spectral_gap": 0.1959235817193985,
          "singular_value_ratio": -0.24144825339317322,
          "layerwise_effective_rank": -0.14591005444526672,
          "layerwise_effective_rank_mergeability_score": -0.036461781710386276,
          "task_vector_cosine_similarity": -0.06280477344989777,
          "task_vector_l2_distance": 0.11381185799837112,
          "task_vector_dot_product": -0.5055162906646729,
          "weight_space_angle": -0.06947128474712372,
          "task_vector_magnitude_ratio": 0.600864052772522,
          "singular_value_overlap": 0.1628025770187378,
          "subspace_overlap": 0.16535358130931854,
          "right_subspace_overlap": -0.045025456696748734,
          "activation_l2_distance": 0.2148231565952301,
          "activation_cosine_similarity": 0.3410813808441162,
          "activation_magnitude_ratio": 0.12666359543800354,
          "activation_dot_product": 0.024881675839424133,
          "encoder_gradient_cosine_similarity": 0.0681108832359314,
          "encoder_gradient_l2_distance": -0.28165772557258606,
          "encoder_gradient_dot_product": 0.23950369656085968,
          "input_gradient_cosine_similarity": 0.01158287562429905,
          "input_gradient_l2_distance": -0.11265236884355545,
          "input_gradient_dot_product": 0.08559601753950119
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 12.766052528450437,
        "train_r2": -3008.6953853661917,
        "train_pearson_r": -0.12457106631186576,
        "val_mse": 10.10043942656666,
        "val_r2": -4599.186835708717,
        "val_pearson_r": -0.22364587011934592,
        "n_iterations": 52,
        "coefficients": {
          "right_subspace_overlap_top_k": 8.217000007629395,
          "right_subspace_overlap_bottom_k": 3.439969778060913,
          "interaction_matrix_overlap_top_k": -1.489062786102295,
          "interaction_matrix_overlap_bottom_k": 4.684792995452881,
          "effective_rank": 6.010285377502441,
          "effective_rank_mergeability_score": 4.348766803741455,
          "stable_rank": -2.834906816482544,
          "spectral_gap": -0.9944260716438293,
          "singular_value_ratio": -2.6480660438537598,
          "layerwise_effective_rank": -4.101172924041748,
          "layerwise_effective_rank_mergeability_score": -2.681809663772583,
          "task_vector_cosine_similarity": 3.7345471382141113,
          "task_vector_l2_distance": -3.0967466831207275,
          "task_vector_dot_product": -1.1798949241638184,
          "weight_space_angle": 7.961326599121094,
          "task_vector_magnitude_ratio": 5.037882328033447,
          "singular_value_overlap": -2.5016603469848633,
          "subspace_overlap": -8.176319122314453,
          "right_subspace_overlap": -0.5958988070487976,
          "activation_l2_distance": -5.12571907043457,
          "activation_cosine_similarity": -3.780369520187378,
          "activation_magnitude_ratio": -1.6821027994155884,
          "activation_dot_product": 2.2067089080810547,
          "encoder_gradient_cosine_similarity": -4.560495376586914,
          "encoder_gradient_l2_distance": -3.5891568660736084,
          "encoder_gradient_dot_product": 0.9575493931770325,
          "input_gradient_cosine_similarity": -0.4814671576023102,
          "input_gradient_l2_distance": 2.0050418376922607,
          "input_gradient_dot_product": 1.8827824592590332
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.8359693014179114,
        "train_r2": -203.05431680509224,
        "train_pearson_r": -0.10394448987677578,
        "val_mse": 0.42983159869450355,
        "val_r2": -212.65934671486062,
        "val_pearson_r": -0.36396651198520646,
        "n_iterations": 140,
        "coefficients": {
          "right_subspace_overlap_top_k": 1.5302114486694336,
          "right_subspace_overlap_bottom_k": -0.5816190838813782,
          "interaction_matrix_overlap_top_k": -2.069439649581909,
          "interaction_matrix_overlap_bottom_k": -1.7333592176437378,
          "effective_rank": -1.4569010734558105,
          "effective_rank_mergeability_score": -2.258430242538452,
          "stable_rank": -0.4789849519729614,
          "spectral_gap": 3.926006317138672,
          "singular_value_ratio": 3.3322715759277344,
          "layerwise_effective_rank": 0.9888357520103455,
          "layerwise_effective_rank_mergeability_score": 0.6629985570907593,
          "task_vector_cosine_similarity": -0.696834921836853,
          "task_vector_l2_distance": 2.529909372329712,
          "task_vector_dot_product": -2.3062338829040527,
          "weight_space_angle": -2.8664565086364746,
          "task_vector_magnitude_ratio": 0.45339176058769226,
          "singular_value_overlap": 0.8926398754119873,
          "subspace_overlap": -0.10864519327878952,
          "right_subspace_overlap": 2.247804641723633,
          "activation_l2_distance": -2.3866171836853027,
          "activation_cosine_similarity": -0.4901508390903473,
          "activation_magnitude_ratio": -0.7885288000106812,
          "activation_dot_product": -1.2396271228790283,
          "encoder_gradient_cosine_similarity": 0.3621945083141327,
          "encoder_gradient_l2_distance": 1.1537203788757324,
          "encoder_gradient_dot_product": 2.4894931316375732,
          "input_gradient_cosine_similarity": 0.671427309513092,
          "input_gradient_l2_distance": 0.8815101385116577,
          "input_gradient_dot_product": -1.6711146831512451
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.008709599238155272,
        "train_r2": -1.1134529581463704,
        "train_pearson_r": 0.47406820269825706,
        "val_mse": 0.016556172314183975,
        "val_r2": -5.337283508445506,
        "val_pearson_r": 0.5598055133047942,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.07785766571760178,
          "right_subspace_overlap_bottom_k": -0.1901814043521881,
          "interaction_matrix_overlap_top_k": -0.5809399485588074,
          "interaction_matrix_overlap_bottom_k": 0.0470866933465004,
          "effective_rank": 0.12265483289957047,
          "effective_rank_mergeability_score": -0.06759938597679138,
          "stable_rank": 0.30898961424827576,
          "spectral_gap": 0.274494469165802,
          "singular_value_ratio": -0.17514237761497498,
          "layerwise_effective_rank": 0.04871784895658493,
          "layerwise_effective_rank_mergeability_score": 0.43862536549568176,
          "task_vector_cosine_similarity": -0.6122279167175293,
          "task_vector_l2_distance": 0.07628201693296432,
          "task_vector_dot_product": -0.07129103690385818,
          "weight_space_angle": -0.0798344761133194,
          "task_vector_magnitude_ratio": 0.3191929757595062,
          "singular_value_overlap": 0.0846552699804306,
          "subspace_overlap": 0.7021064758300781,
          "right_subspace_overlap": 0.26953980326652527,
          "activation_l2_distance": 0.25857555866241455,
          "activation_cosine_similarity": 0.4702267348766327,
          "activation_magnitude_ratio": 0.015008204616606236,
          "activation_dot_product": -0.10106448829174042,
          "encoder_gradient_cosine_similarity": 0.05184703320264816,
          "encoder_gradient_l2_distance": -0.21650637686252594,
          "encoder_gradient_dot_product": 0.040335625410079956,
          "input_gradient_cosine_similarity": -0.19937364757061005,
          "input_gradient_l2_distance": -0.08643071353435516,
          "input_gradient_dot_product": -0.06962601840496063
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 0.22738131496138178,
        "train_r2": -53.899894521297185,
        "train_pearson_r": -0.07884424390987158,
        "val_mse": 0.09477467640436288,
        "val_r2": -42.4756400096251,
        "val_pearson_r": -0.22063925725182637,
        "n_iterations": 160,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.9845483899116516,
          "right_subspace_overlap_bottom_k": -0.007197195664048195,
          "interaction_matrix_overlap_top_k": -0.28488847613334656,
          "interaction_matrix_overlap_bottom_k": -0.2673262655735016,
          "effective_rank": 0.8626580834388733,
          "effective_rank_mergeability_score": -0.8152667284011841,
          "stable_rank": 0.45300164818763733,
          "spectral_gap": 0.9303023219108582,
          "singular_value_ratio": -0.02795748971402645,
          "layerwise_effective_rank": -0.4817885756492615,
          "layerwise_effective_rank_mergeability_score": 0.34374478459358215,
          "task_vector_cosine_similarity": 0.3980044424533844,
          "task_vector_l2_distance": 0.33917030692100525,
          "task_vector_dot_product": 0.15200018882751465,
          "weight_space_angle": 0.3846574127674103,
          "task_vector_magnitude_ratio": -0.2021251916885376,
          "singular_value_overlap": -0.8046612739562988,
          "subspace_overlap": 0.8721202611923218,
          "right_subspace_overlap": 0.3012221157550812,
          "activation_l2_distance": -0.5389862656593323,
          "activation_cosine_similarity": 0.245595782995224,
          "activation_magnitude_ratio": 0.3652581572532654,
          "activation_dot_product": -0.3724941313266754,
          "encoder_gradient_cosine_similarity": -0.000722814816981554,
          "encoder_gradient_l2_distance": -0.14944183826446533,
          "encoder_gradient_dot_product": 0.32912489771842957,
          "input_gradient_cosine_similarity": 0.00222951197065413,
          "input_gradient_l2_distance": 0.06534621864557266,
          "input_gradient_dot_product": -0.1062127947807312
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_mse": 0.07715142973030652,
        "train_r2": -18.350480722785026,
        "train_pearson_r": 0.04258242332034279,
        "val_mse": 0.17407325942701377,
        "val_r2": -95.11120718332711,
        "val_pearson_r": 0.16523711450517764,
        "n_iterations": 62,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.050340160727500916,
          "right_subspace_overlap_bottom_k": -0.11002074182033539,
          "interaction_matrix_overlap_top_k": -0.3335300385951996,
          "interaction_matrix_overlap_bottom_k": 0.13023170828819275,
          "effective_rank": -0.0021546429488807917,
          "effective_rank_mergeability_score": 0.0038985502906143665,
          "stable_rank": 0.5357245206832886,
          "spectral_gap": -0.2187800407409668,
          "singular_value_ratio": 0.015362914651632309,
          "layerwise_effective_rank": -0.16645604372024536,
          "layerwise_effective_rank_mergeability_score": 0.4061454236507416,
          "task_vector_cosine_similarity": 0.21020154654979706,
          "task_vector_l2_distance": 0.263214111328125,
          "task_vector_dot_product": 0.07244568318128586,
          "weight_space_angle": 0.2254849076271057,
          "task_vector_magnitude_ratio": -0.2686350345611572,
          "singular_value_overlap": 0.7414997816085815,
          "subspace_overlap": 0.14183814823627472,
          "right_subspace_overlap": -0.17304667830467224,
          "activation_l2_distance": -0.12136116623878479,
          "activation_cosine_similarity": -0.004341526888310909,
          "activation_magnitude_ratio": 0.16559019684791565,
          "activation_dot_product": 0.007339825853705406,
          "encoder_gradient_cosine_similarity": 0.017921313643455505,
          "encoder_gradient_l2_distance": -0.019042152911424637,
          "encoder_gradient_dot_product": -0.02745748870074749,
          "input_gradient_cosine_similarity": -0.25587528944015503,
          "input_gradient_l2_distance": -0.0316561795771122,
          "input_gradient_dot_product": -0.16206450760364532
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 790.2211886136038,
        "train_r2": -220078.69557729142,
        "train_pearson_r": 0.21821325787578505,
        "val_mse": 1268.7345558885254,
        "val_r2": -663189.3748691857,
        "val_pearson_r": 0.023490154904212746,
        "n_iterations": 51,
        "coefficients": {
          "right_subspace_overlap_top_k": 2.009305715560913,
          "right_subspace_overlap_bottom_k": -34.6861572265625,
          "interaction_matrix_overlap_top_k": 16.970306396484375,
          "interaction_matrix_overlap_bottom_k": 4.202853202819824,
          "effective_rank": 5.205721855163574,
          "effective_rank_mergeability_score": -6.134680271148682,
          "stable_rank": 25.40328598022461,
          "spectral_gap": -36.555938720703125,
          "singular_value_ratio": -33.41578674316406,
          "layerwise_effective_rank": -23.56412124633789,
          "layerwise_effective_rank_mergeability_score": -10.626612663269043,
          "task_vector_cosine_similarity": -2.5167434215545654,
          "task_vector_l2_distance": 4.684350490570068,
          "task_vector_dot_product": 12.558123588562012,
          "weight_space_angle": -9.546321868896484,
          "task_vector_magnitude_ratio": 15.725997924804688,
          "singular_value_overlap": 18.427377700805664,
          "subspace_overlap": 32.693763732910156,
          "right_subspace_overlap": -21.106319427490234,
          "activation_l2_distance": -3.740892171859741,
          "activation_cosine_similarity": 29.25728416442871,
          "activation_magnitude_ratio": 0.6357885003089905,
          "activation_dot_product": -4.809090614318848,
          "encoder_gradient_cosine_similarity": 14.781245231628418,
          "encoder_gradient_l2_distance": -16.753376007080078,
          "encoder_gradient_dot_product": -9.132038116455078,
          "input_gradient_cosine_similarity": -14.364052772521973,
          "input_gradient_l2_distance": 24.429950714111328,
          "input_gradient_dot_product": 20.89995574951172
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 0.008190921941981911,
        "train_r2": -0.960411718356533,
        "train_pearson_r": 0.4864551354404168,
        "val_mse": 0.007883520365991381,
        "val_r2": -2.295904720193254,
        "val_pearson_r": 0.5740658718205838,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0811174288392067,
          "right_subspace_overlap_bottom_k": 0.1496574729681015,
          "interaction_matrix_overlap_top_k": -0.12665148079395294,
          "interaction_matrix_overlap_bottom_k": -0.31740668416023254,
          "effective_rank": 0.11684655398130417,
          "effective_rank_mergeability_score": -0.017690453678369522,
          "stable_rank": 0.5691369771957397,
          "spectral_gap": 0.15639087557792664,
          "singular_value_ratio": 0.14784710109233856,
          "layerwise_effective_rank": -0.1444728672504425,
          "layerwise_effective_rank_mergeability_score": 0.41319698095321655,
          "task_vector_cosine_similarity": -0.22827987372875214,
          "task_vector_l2_distance": 0.09267397224903107,
          "task_vector_dot_product": -0.1668136864900589,
          "weight_space_angle": 0.11161430925130844,
          "task_vector_magnitude_ratio": -0.18548016250133514,
          "singular_value_overlap": 0.07599227130413055,
          "subspace_overlap": 0.17968812584877014,
          "right_subspace_overlap": 0.32365626096725464,
          "activation_l2_distance": 0.11460516601800919,
          "activation_cosine_similarity": 0.29382216930389404,
          "activation_magnitude_ratio": -0.0013622479746118188,
          "activation_dot_product": -0.07440344989299774,
          "encoder_gradient_cosine_similarity": 0.03336207941174507,
          "encoder_gradient_l2_distance": -0.241509348154068,
          "encoder_gradient_dot_product": 0.11271486431360245,
          "input_gradient_cosine_similarity": -0.13750885426998138,
          "input_gradient_l2_distance": -0.08531773835420609,
          "input_gradient_dot_product": -0.08262838423252106
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 30.480466468112304,
        "train_r2": -7721.196746188418,
        "train_pearson_r": 0.1032860590550282,
        "val_mse": 70.52953206072127,
        "val_r2": -23953.083242817604,
        "val_pearson_r": -0.13505421595863687,
        "n_iterations": 51,
        "coefficients": {
          "right_subspace_overlap_top_k": 1.5628321170806885,
          "right_subspace_overlap_bottom_k": -2.194441556930542,
          "interaction_matrix_overlap_top_k": 3.1257903575897217,
          "interaction_matrix_overlap_bottom_k": 8.487127304077148,
          "effective_rank": -2.8871192932128906,
          "effective_rank_mergeability_score": 0.8939045071601868,
          "stable_rank": 4.099572658538818,
          "spectral_gap": 4.238776683807373,
          "singular_value_ratio": -3.2769062519073486,
          "layerwise_effective_rank": 10.047021865844727,
          "layerwise_effective_rank_mergeability_score": 8.43239688873291,
          "task_vector_cosine_similarity": 6.704230785369873,
          "task_vector_l2_distance": -1.295399785041809,
          "task_vector_dot_product": 4.290590763092041,
          "weight_space_angle": -0.5699487924575806,
          "task_vector_magnitude_ratio": 3.8975348472595215,
          "singular_value_overlap": -0.61711585521698,
          "subspace_overlap": -1.998716950416565,
          "right_subspace_overlap": -4.783637523651123,
          "activation_l2_distance": -10.123641014099121,
          "activation_cosine_similarity": -2.6867570877075195,
          "activation_magnitude_ratio": 1.4996728897094727,
          "activation_dot_product": -5.669218063354492,
          "encoder_gradient_cosine_similarity": -0.8821572065353394,
          "encoder_gradient_l2_distance": -0.5064927935600281,
          "encoder_gradient_dot_product": 2.3351547718048096,
          "input_gradient_cosine_similarity": -16.712331771850586,
          "input_gradient_l2_distance": -6.22330379486084,
          "input_gradient_dot_product": 1.7647422552108765
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.008914298319485066,
        "train_r2": -1.5391685274862281,
        "train_pearson_r": 0.4822302498540507,
        "val_mse": 0.011550898448410458,
        "val_r2": -5.920606845472527,
        "val_pearson_r": 0.4520083941971499,
        "n_iterations": 567,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.18293428421020508,
          "right_subspace_overlap_bottom_k": -0.18692001700401306,
          "interaction_matrix_overlap_top_k": 0.08366822451353073,
          "interaction_matrix_overlap_bottom_k": 0.03771665692329407,
          "effective_rank": 0.2193940281867981,
          "effective_rank_mergeability_score": -0.2656913995742798,
          "stable_rank": -0.10567401349544525,
          "spectral_gap": 0.07903212308883667,
          "singular_value_ratio": -0.0006082195322960615,
          "layerwise_effective_rank": 0.1999851018190384,
          "layerwise_effective_rank_mergeability_score": 0.4826907217502594,
          "task_vector_cosine_similarity": -0.1089906096458435,
          "task_vector_l2_distance": 0.015750987455248833,
          "task_vector_dot_product": 0.2447122484445572,
          "weight_space_angle": 0.42036131024360657,
          "task_vector_magnitude_ratio": -0.028608379885554314,
          "singular_value_overlap": 0.07582012563943863,
          "subspace_overlap": -0.12130072712898254,
          "right_subspace_overlap": -0.09205377101898193,
          "activation_l2_distance": 0.13660269975662231,
          "activation_cosine_similarity": 0.3839362859725952,
          "activation_magnitude_ratio": 0.019505122676491737,
          "activation_dot_product": -0.18729165196418762,
          "encoder_gradient_cosine_similarity": 0.03237801045179367,
          "encoder_gradient_l2_distance": -0.1992858648300171,
          "encoder_gradient_dot_product": 0.14459802210330963,
          "input_gradient_cosine_similarity": -0.15804991126060486,
          "input_gradient_l2_distance": -0.09388505667448044,
          "input_gradient_dot_product": -0.2105865627527237
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.019149383341182054,
        "train_r2": -3.6084033411560297,
        "train_pearson_r": 0.2200561445405937,
        "val_mse": 0.022661796011881376,
        "val_r2": -10.14438253810115,
        "val_pearson_r": 0.08390384455341292,
        "n_iterations": 248,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.27666279673576355,
          "right_subspace_overlap_bottom_k": 0.18792949616909027,
          "interaction_matrix_overlap_top_k": -0.06309544295072556,
          "interaction_matrix_overlap_bottom_k": -0.3646450936794281,
          "effective_rank": 0.3512739837169647,
          "effective_rank_mergeability_score": -0.3554307818412781,
          "stable_rank": 0.3314375579357147,
          "spectral_gap": 0.3314051628112793,
          "singular_value_ratio": -0.4250406324863434,
          "layerwise_effective_rank": -0.2722756862640381,
          "layerwise_effective_rank_mergeability_score": 0.2668405771255493,
          "task_vector_cosine_similarity": 0.3138699233531952,
          "task_vector_l2_distance": 0.08469494432210922,
          "task_vector_dot_product": 0.3001410961151123,
          "weight_space_angle": 0.40639904141426086,
          "task_vector_magnitude_ratio": 0.25414642691612244,
          "singular_value_overlap": 0.1404152810573578,
          "subspace_overlap": -0.17061026394367218,
          "right_subspace_overlap": 0.19634214043617249,
          "activation_l2_distance": -0.08530935645103455,
          "activation_cosine_similarity": 0.21539151668548584,
          "activation_magnitude_ratio": 0.02747342549264431,
          "activation_dot_product": -0.2075960636138916,
          "encoder_gradient_cosine_similarity": 0.023540543392300606,
          "encoder_gradient_l2_distance": -0.22208160161972046,
          "encoder_gradient_dot_product": 0.18840713798999786,
          "input_gradient_cosine_similarity": -0.026091113686561584,
          "input_gradient_l2_distance": -0.047991253435611725,
          "input_gradient_dot_product": -0.10526027530431747
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 483.0389718128666,
        "train_r2": -122779.53724427204,
        "train_pearson_r": 0.1659078141421891,
        "val_mse": 416.53661077233886,
        "val_r2": -206528.25304895968,
        "val_pearson_r": 0.29625609615623205,
        "n_iterations": 52,
        "coefficients": {
          "right_subspace_overlap_top_k": 22.54905128479004,
          "right_subspace_overlap_bottom_k": 7.427090644836426,
          "interaction_matrix_overlap_top_k": 4.97927713394165,
          "interaction_matrix_overlap_bottom_k": 10.497476577758789,
          "effective_rank": 19.934619903564453,
          "effective_rank_mergeability_score": 2.2789947986602783,
          "stable_rank": -2.076051712036133,
          "spectral_gap": -1.25151789188385,
          "singular_value_ratio": -23.099252700805664,
          "layerwise_effective_rank": -12.26413345336914,
          "layerwise_effective_rank_mergeability_score": -9.359789848327637,
          "task_vector_cosine_similarity": -21.369659423828125,
          "task_vector_l2_distance": -1.3216900825500488,
          "task_vector_dot_product": -4.338826656341553,
          "weight_space_angle": -25.0842342376709,
          "task_vector_magnitude_ratio": -18.61222267150879,
          "singular_value_overlap": 3.3477306365966797,
          "subspace_overlap": 2.7042360305786133,
          "right_subspace_overlap": -11.923957824707031,
          "activation_l2_distance": 9.72875690460205,
          "activation_cosine_similarity": -8.923073768615723,
          "activation_magnitude_ratio": 8.25240421295166,
          "activation_dot_product": 14.189093589782715,
          "encoder_gradient_cosine_similarity": 21.836345672607422,
          "encoder_gradient_l2_distance": 11.45976734161377,
          "encoder_gradient_dot_product": 10.793251991271973,
          "input_gradient_cosine_similarity": 7.105270862579346,
          "input_gradient_l2_distance": -26.329198837280273,
          "input_gradient_dot_product": 9.82205581665039
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.25757817469329625,
        "train_r2": -60.17602549828345,
        "train_pearson_r": 0.45944111255731035,
        "val_mse": 0.14413720465806978,
        "val_r2": -56.07052414347014,
        "val_pearson_r": 0.6556563510173351,
        "n_iterations": 77,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.36649617552757263,
          "right_subspace_overlap_bottom_k": -0.2784446179866791,
          "interaction_matrix_overlap_top_k": -0.008806105703115463,
          "interaction_matrix_overlap_bottom_k": -0.05355469882488251,
          "effective_rank": 0.7377135157585144,
          "effective_rank_mergeability_score": 0.46871641278266907,
          "stable_rank": 0.11825310438871384,
          "spectral_gap": -0.09907730668783188,
          "singular_value_ratio": -0.15386778116226196,
          "layerwise_effective_rank": 0.1316457986831665,
          "layerwise_effective_rank_mergeability_score": -0.35481786727905273,
          "task_vector_cosine_similarity": -0.05425296723842621,
          "task_vector_l2_distance": -0.243205264210701,
          "task_vector_dot_product": 0.0139019088819623,
          "weight_space_angle": 0.16105276346206665,
          "task_vector_magnitude_ratio": -0.9024935960769653,
          "singular_value_overlap": -0.030772453173995018,
          "subspace_overlap": 0.463822603225708,
          "right_subspace_overlap": 0.5235461592674255,
          "activation_l2_distance": 0.03128408268094063,
          "activation_cosine_similarity": 0.015114519745111465,
          "activation_magnitude_ratio": 0.15386229753494263,
          "activation_dot_product": 0.22191938757896423,
          "encoder_gradient_cosine_similarity": 0.8542152643203735,
          "encoder_gradient_l2_distance": -0.5381020307540894,
          "encoder_gradient_dot_product": 0.3815673291683197,
          "input_gradient_cosine_similarity": -0.6423994898796082,
          "input_gradient_l2_distance": -0.27435964345932007,
          "input_gradient_dot_product": -0.01728706806898117
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.007088999115769163,
        "train_r2": -0.764666824171816,
        "train_pearson_r": 0.5178070346556815,
        "val_mse": 0.009506088978558659,
        "val_r2": -2.170314911519515,
        "val_pearson_r": 0.36081768240959045,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.08908762782812119,
          "right_subspace_overlap_bottom_k": 0.00542212650179863,
          "interaction_matrix_overlap_top_k": -0.03958059847354889,
          "interaction_matrix_overlap_bottom_k": -0.20513668656349182,
          "effective_rank": 0.144802987575531,
          "effective_rank_mergeability_score": -0.10307519137859344,
          "stable_rank": 0.13496220111846924,
          "spectral_gap": 0.4039575755596161,
          "singular_value_ratio": -0.07327494770288467,
          "layerwise_effective_rank": 0.09514009207487106,
          "layerwise_effective_rank_mergeability_score": 0.3227781355381012,
          "task_vector_cosine_similarity": -0.038999151438474655,
          "task_vector_l2_distance": 0.11154060810804367,
          "task_vector_dot_product": -0.17056122422218323,
          "weight_space_angle": 0.1465829759836197,
          "task_vector_magnitude_ratio": 0.34627026319503784,
          "singular_value_overlap": 0.0713743194937706,
          "subspace_overlap": -0.15693838894367218,
          "right_subspace_overlap": 0.19932085275650024,
          "activation_l2_distance": 0.0032601880375295877,
          "activation_cosine_similarity": 0.21561549603939056,
          "activation_magnitude_ratio": 0.008615673519670963,
          "activation_dot_product": -0.11034021526575089,
          "encoder_gradient_cosine_similarity": 0.04654063656926155,
          "encoder_gradient_l2_distance": -0.2303743213415146,
          "encoder_gradient_dot_product": 0.09122782945632935,
          "input_gradient_cosine_similarity": -0.13327334821224213,
          "input_gradient_l2_distance": -0.07694897055625916,
          "input_gradient_dot_product": -0.097508504986763
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_mse": 0.0385358539900475,
        "train_r2": -8.112332290859714,
        "train_pearson_r": 0.09196075438093838,
        "val_mse": 0.03844176737693187,
        "val_r2": -14.781497799346775,
        "val_pearson_r": -0.595489948189134,
        "n_iterations": 146,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.15562564134597778,
          "right_subspace_overlap_bottom_k": 0.44669678807258606,
          "interaction_matrix_overlap_top_k": -0.6155273914337158,
          "interaction_matrix_overlap_bottom_k": -0.051556333899497986,
          "effective_rank": 0.7715209722518921,
          "effective_rank_mergeability_score": 0.20296114683151245,
          "stable_rank": -0.36917418241500854,
          "spectral_gap": 0.12538568675518036,
          "singular_value_ratio": 0.5030401945114136,
          "layerwise_effective_rank": 0.13848330080509186,
          "layerwise_effective_rank_mergeability_score": 0.27951833605766296,
          "task_vector_cosine_similarity": 0.1103639230132103,
          "task_vector_l2_distance": -0.18866443634033203,
          "task_vector_dot_product": 0.015484495088458061,
          "weight_space_angle": 0.40175676345825195,
          "task_vector_magnitude_ratio": -0.4313904345035553,
          "singular_value_overlap": 0.03406348451972008,
          "subspace_overlap": -0.1950450986623764,
          "right_subspace_overlap": 0.01399340108036995,
          "activation_l2_distance": -0.11147083342075348,
          "activation_cosine_similarity": -0.23570358753204346,
          "activation_magnitude_ratio": -0.04420734569430351,
          "activation_dot_product": 0.41736388206481934,
          "encoder_gradient_cosine_similarity": -0.07659336924552917,
          "encoder_gradient_l2_distance": 0.07627225667238235,
          "encoder_gradient_dot_product": 0.2440914362668991,
          "input_gradient_cosine_similarity": 0.03755611181259155,
          "input_gradient_l2_distance": -0.2676520347595215,
          "input_gradient_dot_product": -0.38554540276527405
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.010228235786176144,
        "train_r2": -1.4053076087720227,
        "train_pearson_r": 0.48577769765098117,
        "val_mse": 0.0074377520816650946,
        "val_r2": -2.1211595646778965,
        "val_pearson_r": 0.5586120664903695,
        "n_iterations": 345,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.13803917169570923,
          "right_subspace_overlap_bottom_k": -0.17891088128089905,
          "interaction_matrix_overlap_top_k": 0.21925729513168335,
          "interaction_matrix_overlap_bottom_k": 0.005509282927960157,
          "effective_rank": 0.30700239539146423,
          "effective_rank_mergeability_score": 0.16402755677700043,
          "stable_rank": 0.11458805948495865,
          "spectral_gap": 0.2638954222202301,
          "singular_value_ratio": 0.21088187396526337,
          "layerwise_effective_rank": -0.07645384967327118,
          "layerwise_effective_rank_mergeability_score": 0.05673651769757271,
          "task_vector_cosine_similarity": -0.16174942255020142,
          "task_vector_l2_distance": 0.07730579376220703,
          "task_vector_dot_product": -0.049913741648197174,
          "weight_space_angle": 0.3033444285392761,
          "task_vector_magnitude_ratio": -0.06537418067455292,
          "singular_value_overlap": 0.1118941605091095,
          "subspace_overlap": -0.051867496222257614,
          "right_subspace_overlap": -0.07735401391983032,
          "activation_l2_distance": 0.03582616522908211,
          "activation_cosine_similarity": 0.23547285795211792,
          "activation_magnitude_ratio": 0.001753176562488079,
          "activation_dot_product": -0.10080750286579132,
          "encoder_gradient_cosine_similarity": 0.06684447079896927,
          "encoder_gradient_l2_distance": -0.23351289331912994,
          "encoder_gradient_dot_product": 0.07952415943145752,
          "input_gradient_cosine_similarity": -0.1651258021593094,
          "input_gradient_l2_distance": -0.08456519991159439,
          "input_gradient_dot_product": -0.1461227983236313
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.04734283898294622,
        "train_r2": -10.893478182173492,
        "train_pearson_r": -0.06250984067793834,
        "val_mse": 0.12189492610290811,
        "val_r2": -49.303750287631026,
        "val_pearson_r": 0.058006786296928126,
        "n_iterations": 90,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.10434316098690033,
          "right_subspace_overlap_bottom_k": -0.02318265475332737,
          "interaction_matrix_overlap_top_k": -0.21814373135566711,
          "interaction_matrix_overlap_bottom_k": 0.18677540123462677,
          "effective_rank": 0.4899005591869354,
          "effective_rank_mergeability_score": 0.025957278907299042,
          "stable_rank": 0.3019057810306549,
          "spectral_gap": 0.16941404342651367,
          "singular_value_ratio": -0.14827415347099304,
          "layerwise_effective_rank": -0.354532390832901,
          "layerwise_effective_rank_mergeability_score": 0.08288277685642242,
          "task_vector_cosine_similarity": 0.12443062663078308,
          "task_vector_l2_distance": 0.057022351771593094,
          "task_vector_dot_product": 0.38631290197372437,
          "weight_space_angle": 0.2655068337917328,
          "task_vector_magnitude_ratio": -0.0991905927658081,
          "singular_value_overlap": 0.3681139349937439,
          "subspace_overlap": -0.2184048295021057,
          "right_subspace_overlap": -0.2936374843120575,
          "activation_l2_distance": 0.1309366226196289,
          "activation_cosine_similarity": -0.09346876293420792,
          "activation_magnitude_ratio": 0.15795373916625977,
          "activation_dot_product": 0.31821408867836,
          "encoder_gradient_cosine_similarity": 0.17174215614795685,
          "encoder_gradient_l2_distance": -0.24789246916770935,
          "encoder_gradient_dot_product": -0.2728075683116913,
          "input_gradient_cosine_similarity": -0.21304456889629364,
          "input_gradient_l2_distance": 0.24864834547042847,
          "input_gradient_dot_product": -0.2029271125793457
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.03720138076406366,
        "train_r2": -7.545245952907997,
        "train_pearson_r": 0.05116232663733686,
        "val_mse": 0.03030174090456845,
        "val_r2": -17.603830586566783,
        "val_pearson_r": 0.2165329673086095,
        "n_iterations": 189,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.3158283233642578,
          "right_subspace_overlap_bottom_k": -0.03691960498690605,
          "interaction_matrix_overlap_top_k": -0.5229999423027039,
          "interaction_matrix_overlap_bottom_k": -0.1604398787021637,
          "effective_rank": 0.13891205191612244,
          "effective_rank_mergeability_score": -0.3434264361858368,
          "stable_rank": 0.2833690941333771,
          "spectral_gap": 0.07643812149763107,
          "singular_value_ratio": 0.23823659121990204,
          "layerwise_effective_rank": -0.01870160549879074,
          "layerwise_effective_rank_mergeability_score": 0.3640023469924927,
          "task_vector_cosine_similarity": -0.026235029101371765,
          "task_vector_l2_distance": 0.28716567158699036,
          "task_vector_dot_product": -0.8751488327980042,
          "weight_space_angle": 0.22091174125671387,
          "task_vector_magnitude_ratio": -0.4583037197589874,
          "singular_value_overlap": 0.2495511919260025,
          "subspace_overlap": 0.4137667417526245,
          "right_subspace_overlap": 0.30703005194664,
          "activation_l2_distance": -0.23015642166137695,
          "activation_cosine_similarity": -0.43491512537002563,
          "activation_magnitude_ratio": 0.027337398380041122,
          "activation_dot_product": 0.5279589295387268,
          "encoder_gradient_cosine_similarity": 0.093532033264637,
          "encoder_gradient_l2_distance": 0.12165442854166031,
          "encoder_gradient_dot_product": 0.30076146125793457,
          "input_gradient_cosine_similarity": 0.11590798944234848,
          "input_gradient_l2_distance": -0.046727411448955536,
          "input_gradient_dot_product": 0.06809061020612717
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 1.8922024991034248,
        "train_r2": -459.6934872519553,
        "train_pearson_r": 0.32252993744035663,
        "val_mse": 1.8029465275504242,
        "val_r2": -885.0359931425609,
        "val_pearson_r": 0.6157223270559734,
        "n_iterations": 73,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.11687815189361572,
          "right_subspace_overlap_bottom_k": -0.9993511438369751,
          "interaction_matrix_overlap_top_k": -1.3817944526672363,
          "interaction_matrix_overlap_bottom_k": 0.6417780518531799,
          "effective_rank": -1.3790174722671509,
          "effective_rank_mergeability_score": 2.0022971630096436,
          "stable_rank": -0.7795419692993164,
          "spectral_gap": -0.7322129607200623,
          "singular_value_ratio": 2.114574670791626,
          "layerwise_effective_rank": -0.486050546169281,
          "layerwise_effective_rank_mergeability_score": -1.1387742757797241,
          "task_vector_cosine_similarity": 1.543121337890625,
          "task_vector_l2_distance": -0.7309049367904663,
          "task_vector_dot_product": -0.36372095346450806,
          "weight_space_angle": 1.1154882907867432,
          "task_vector_magnitude_ratio": 0.4717479646205902,
          "singular_value_overlap": 0.4826827943325043,
          "subspace_overlap": 0.6623576879501343,
          "right_subspace_overlap": -1.272273063659668,
          "activation_l2_distance": 0.7078567743301392,
          "activation_cosine_similarity": 1.6625676155090332,
          "activation_magnitude_ratio": 1.2928431034088135,
          "activation_dot_product": 0.23969514667987823,
          "encoder_gradient_cosine_similarity": -2.2965569496154785,
          "encoder_gradient_l2_distance": -0.7019978165626526,
          "encoder_gradient_dot_product": 0.16849876940250397,
          "input_gradient_cosine_similarity": 1.484951376914978,
          "input_gradient_l2_distance": -2.0810816287994385,
          "input_gradient_dot_product": 0.6433829069137573
        }
      }
    ],
    "optimization_params": {
      "objective": "MSE",
      "n_iterations": 1000,
      "learning_rate": 0.01,
      "patience": 50,
      "convergence_threshold": 1e-06
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_mse": 7.748566128456837,
      "train_r2": -903.0621185052875,
      "train_pearson_r": -0.004435322480634275,
      "train_pearson_p": 0.8013005793442622,
      "val_mse": 6.266125107102048,
      "val_r2": -730.0986612000323,
      "val_pearson_r": 0.03637226992983513,
      "val_pearson_p": 0.4927030912361285
    },
    "per_fold_stats": {
      "train_mse_mean": 7.785679473939362,
      "train_mse_std": 27.991657859689575,
      "val_mse_mean": 6.264667772012818,
      "val_mse_std": 17.102180088520186,
      "train_r_mean": 0.10170009319010813,
      "train_r_std": 0.19678522423537795,
      "val_r_mean": 0.10072819546139247,
      "val_r_std": 0.21969355558474982
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": -0.13346895575523376,
      "right_subspace_overlap_bottom_k": 0.801952064037323,
      "interaction_matrix_overlap_top_k": 0.015142029151320457,
      "interaction_matrix_overlap_bottom_k": 0.1017412543296814,
      "effective_rank": -0.40794315934181213,
      "effective_rank_mergeability_score": -0.30881112813949585,
      "stable_rank": 0.2858622372150421,
      "spectral_gap": 0.5077435374259949,
      "singular_value_ratio": 0.7349931597709656,
      "layerwise_effective_rank": 0.3374524712562561,
      "layerwise_effective_rank_mergeability_score": -0.22803525626659393,
      "task_vector_cosine_similarity": -0.5163270235061646,
      "task_vector_l2_distance": -0.16178396344184875,
      "task_vector_dot_product": 0.005480554886162281,
      "weight_space_angle": -0.4533427655696869,
      "task_vector_magnitude_ratio": -0.25782716274261475,
      "singular_value_overlap": 0.47403138875961304,
      "subspace_overlap": -0.3630792796611786,
      "right_subspace_overlap": 0.42741769552230835,
      "activation_l2_distance": -0.2318987101316452,
      "activation_cosine_similarity": -0.17596180737018585,
      "activation_magnitude_ratio": 0.4634707570075989,
      "activation_dot_product": -0.32706981897354126,
      "encoder_gradient_cosine_similarity": 0.597573459148407,
      "encoder_gradient_l2_distance": -0.26550760865211487,
      "encoder_gradient_dot_product": 0.039665985852479935,
      "input_gradient_cosine_similarity": -0.2483637034893036,
      "input_gradient_l2_distance": 0.05654103681445122,
      "input_gradient_dot_product": 0.21809574961662292
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 1.05595862865448,
      "right_subspace_overlap_bottom_k": 2.5282018184661865,
      "interaction_matrix_overlap_top_k": 0.5454081892967224,
      "interaction_matrix_overlap_bottom_k": 1.908506155014038,
      "effective_rank": 2.287868022918701,
      "effective_rank_mergeability_score": 1.3828524351119995,
      "stable_rank": 1.1957604885101318,
      "spectral_gap": 1.0807991027832031,
      "singular_value_ratio": 2.306943416595459,
      "layerwise_effective_rank": 1.036375641822815,
      "layerwise_effective_rank_mergeability_score": 2.0031468868255615,
      "task_vector_cosine_similarity": 2.061363697052002,
      "task_vector_l2_distance": 1.241172432899475,
      "task_vector_dot_product": 1.131712794303894,
      "weight_space_angle": 1.7113909721374512,
      "task_vector_magnitude_ratio": 1.2406337261199951,
      "singular_value_overlap": 1.7094738483428955,
      "subspace_overlap": 1.1407569646835327,
      "right_subspace_overlap": 1.1976432800292969,
      "activation_l2_distance": 1.0394514799118042,
      "activation_cosine_similarity": 0.8770217895507812,
      "activation_magnitude_ratio": 1.28190279006958,
      "activation_dot_product": 1.5811413526535034,
      "encoder_gradient_cosine_similarity": 1.9154295921325684,
      "encoder_gradient_l2_distance": 1.0226759910583496,
      "encoder_gradient_dot_product": 0.7070204019546509,
      "input_gradient_cosine_similarity": 1.1871641874313354,
      "input_gradient_l2_distance": 1.4546291828155518,
      "input_gradient_dot_product": 1.4257041215896606
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 4.317343478680121,
        "train_r2": -489.4973297823858,
        "train_pearson_r": -0.26956521251121945,
        "val_mse": 5.799067369983885,
        "val_r2": -1341.135300842326,
        "val_pearson_r": 0.0805822360905511,
        "n_iterations": 56,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.41842108964920044,
          "right_subspace_overlap_bottom_k": -0.7860199213027954,
          "interaction_matrix_overlap_top_k": -0.22450286149978638,
          "interaction_matrix_overlap_bottom_k": -0.27667611837387085,
          "effective_rank": -0.27836817502975464,
          "effective_rank_mergeability_score": 0.5995857119560242,
          "stable_rank": 0.05337550491094589,
          "spectral_gap": 0.5099117159843445,
          "singular_value_ratio": -0.5517200827598572,
          "layerwise_effective_rank": 1.3101770877838135,
          "layerwise_effective_rank_mergeability_score": 0.07760204374790192,
          "task_vector_cosine_similarity": -1.085546612739563,
          "task_vector_l2_distance": 2.1403555870056152,
          "task_vector_dot_product": 0.9818156957626343,
          "weight_space_angle": -1.787272572517395,
          "task_vector_magnitude_ratio": 1.2892879247665405,
          "singular_value_overlap": -1.586434006690979,
          "subspace_overlap": 0.6883716583251953,
          "right_subspace_overlap": -2.1882174015045166,
          "activation_l2_distance": 2.06469988822937,
          "activation_cosine_similarity": 1.02432382106781,
          "activation_magnitude_ratio": 2.4211857318878174,
          "activation_dot_product": -2.579026699066162,
          "encoder_gradient_cosine_similarity": 2.446728229522705,
          "encoder_gradient_l2_distance": -2.6195144653320312,
          "encoder_gradient_dot_product": -2.070119857788086,
          "input_gradient_cosine_similarity": -0.522734522819519,
          "input_gradient_l2_distance": 3.4419639110565186,
          "input_gradient_dot_product": -1.0928771495819092
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 2.4812251349076058,
        "train_r2": -277.6096450086962,
        "train_pearson_r": 0.16018807449475667,
        "val_mse": 3.135318074130921,
        "val_r2": -708.1586544222575,
        "val_pearson_r": -0.08497188075226458,
        "n_iterations": 51,
        "coefficients": {
          "right_subspace_overlap_top_k": -1.2976070642471313,
          "right_subspace_overlap_bottom_k": 0.9106310606002808,
          "interaction_matrix_overlap_top_k": -0.18253958225250244,
          "interaction_matrix_overlap_bottom_k": 2.005849838256836,
          "effective_rank": -1.5946650505065918,
          "effective_rank_mergeability_score": -1.0627785921096802,
          "stable_rank": -0.09323051571846008,
          "spectral_gap": 0.2550690174102783,
          "singular_value_ratio": 0.1462738811969757,
          "layerwise_effective_rank": 1.325525164604187,
          "layerwise_effective_rank_mergeability_score": 0.23930422961711884,
          "task_vector_cosine_similarity": -0.7657480835914612,
          "task_vector_l2_distance": -0.6895484328269958,
          "task_vector_dot_product": -0.6190858483314514,
          "weight_space_angle": -1.0264662504196167,
          "task_vector_magnitude_ratio": -0.6978583335876465,
          "singular_value_overlap": 0.47594815492630005,
          "subspace_overlap": -2.2436318397521973,
          "right_subspace_overlap": 2.483961343765259,
          "activation_l2_distance": -0.29216697812080383,
          "activation_cosine_similarity": -0.7438372373580933,
          "activation_magnitude_ratio": 2.0042827129364014,
          "activation_dot_product": 0.5238903164863586,
          "encoder_gradient_cosine_similarity": 0.3218074142932892,
          "encoder_gradient_l2_distance": -0.03120957687497139,
          "encoder_gradient_dot_product": 0.4376228451728821,
          "input_gradient_cosine_similarity": 1.4968998432159424,
          "input_gradient_l2_distance": -1.4142149686813354,
          "input_gradient_dot_product": 1.100847601890564
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.028166152940227694,
        "train_r2": -2.126878779373693,
        "train_pearson_r": 0.4299618465356089,
        "val_mse": 0.029534181907534925,
        "val_r2": -5.751681278618217,
        "val_pearson_r": 0.34588452531754416,
        "n_iterations": 714,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.5660187602043152,
          "right_subspace_overlap_bottom_k": 0.2873707711696625,
          "interaction_matrix_overlap_top_k": -0.8133692145347595,
          "interaction_matrix_overlap_bottom_k": -0.27986064553260803,
          "effective_rank": 0.36888185143470764,
          "effective_rank_mergeability_score": 0.18632367253303528,
          "stable_rank": 0.031132841482758522,
          "spectral_gap": -0.01393261831253767,
          "singular_value_ratio": -0.18417280912399292,
          "layerwise_effective_rank": 0.12424533069133759,
          "layerwise_effective_rank_mergeability_score": 0.26164525747299194,
          "task_vector_cosine_similarity": -0.02852298505604267,
          "task_vector_l2_distance": -0.07362305372953415,
          "task_vector_dot_product": 0.11559975147247314,
          "weight_space_angle": 0.2305494248867035,
          "task_vector_magnitude_ratio": 0.041404709219932556,
          "singular_value_overlap": 0.002875123405829072,
          "subspace_overlap": 0.07814729958772659,
          "right_subspace_overlap": 0.13307516276836395,
          "activation_l2_distance": 0.21153968572616577,
          "activation_cosine_similarity": 0.31804224848747253,
          "activation_magnitude_ratio": -0.016850624233484268,
          "activation_dot_product": -0.08725526183843613,
          "encoder_gradient_cosine_similarity": 0.01493415329605341,
          "encoder_gradient_l2_distance": -0.20786231756210327,
          "encoder_gradient_dot_product": 0.06084669753909111,
          "input_gradient_cosine_similarity": -0.12622423470020294,
          "input_gradient_l2_distance": -0.11475346982479095,
          "input_gradient_dot_product": -0.09521811455488205
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.05376414320438446,
        "train_r2": -5.205487264421823,
        "train_pearson_r": -0.24697325632954337,
        "val_mse": 0.01687261370015171,
        "val_r2": -2.9233581936602353,
        "val_pearson_r": 0.030873710943239586,
        "n_iterations": 59,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.08600408583879471,
          "right_subspace_overlap_bottom_k": 0.09765946120023727,
          "interaction_matrix_overlap_top_k": -0.2306084930896759,
          "interaction_matrix_overlap_bottom_k": -0.028628528118133545,
          "effective_rank": -0.14057856798171997,
          "effective_rank_mergeability_score": 0.2019900232553482,
          "stable_rank": 0.7413424253463745,
          "spectral_gap": -0.10037045925855637,
          "singular_value_ratio": -0.27289506793022156,
          "layerwise_effective_rank": -0.4178771674633026,
          "layerwise_effective_rank_mergeability_score": -0.13090001046657562,
          "task_vector_cosine_similarity": 0.20426128804683685,
          "task_vector_l2_distance": 0.18569286167621613,
          "task_vector_dot_product": -0.03772622346878052,
          "weight_space_angle": 0.3237472474575043,
          "task_vector_magnitude_ratio": 0.028044989332556725,
          "singular_value_overlap": 0.2234000712633133,
          "subspace_overlap": -0.05911234766244888,
          "right_subspace_overlap": -0.3303649127483368,
          "activation_l2_distance": 0.11053276062011719,
          "activation_cosine_similarity": 0.21524077653884888,
          "activation_magnitude_ratio": 0.13557887077331543,
          "activation_dot_product": 0.03231358900666237,
          "encoder_gradient_cosine_similarity": 0.2530689835548401,
          "encoder_gradient_l2_distance": -0.11460348963737488,
          "encoder_gradient_dot_product": -0.053831346333026886,
          "input_gradient_cosine_similarity": -0.22005335986614227,
          "input_gradient_l2_distance": 0.0739578977227211,
          "input_gradient_dot_product": 0.21996326744556427
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.018177952243161304,
        "train_r2": -1.0646374617231547,
        "train_pearson_r": 0.22362658196414809,
        "val_mse": 0.020212861489873606,
        "val_r2": -3.4116930031328936,
        "val_pearson_r": -0.013833465217357885,
        "n_iterations": 309,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.13213986158370972,
          "right_subspace_overlap_bottom_k": 0.2064487189054489,
          "interaction_matrix_overlap_top_k": -0.14026200771331787,
          "interaction_matrix_overlap_bottom_k": -0.252236932516098,
          "effective_rank": 0.01786554791033268,
          "effective_rank_mergeability_score": 0.694832444190979,
          "stable_rank": 0.8143946528434753,
          "spectral_gap": 0.7167618274688721,
          "singular_value_ratio": -0.18334685266017914,
          "layerwise_effective_rank": 0.10409419238567352,
          "layerwise_effective_rank_mergeability_score": -0.014093405567109585,
          "task_vector_cosine_similarity": -0.011943642050027847,
          "task_vector_l2_distance": 0.059089962393045425,
          "task_vector_dot_product": -0.3446301519870758,
          "weight_space_angle": -0.009867863729596138,
          "task_vector_magnitude_ratio": 0.6280083060264587,
          "singular_value_overlap": 0.12538890540599823,
          "subspace_overlap": -0.3300522565841675,
          "right_subspace_overlap": 0.17266981303691864,
          "activation_l2_distance": -0.5940287709236145,
          "activation_cosine_similarity": -0.5923134684562683,
          "activation_magnitude_ratio": 0.03817326948046684,
          "activation_dot_product": 0.26038500666618347,
          "encoder_gradient_cosine_similarity": 0.03818816319108009,
          "encoder_gradient_l2_distance": -0.4543135464191437,
          "encoder_gradient_dot_product": 0.09837622940540314,
          "input_gradient_cosine_similarity": -0.048445433378219604,
          "input_gradient_l2_distance": 0.060275766998529434,
          "input_gradient_dot_product": -0.19327735900878906
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 0.03298891324071599,
        "train_r2": -2.6513770950748556,
        "train_pearson_r": 0.20100487471457115,
        "val_mse": 0.016723572441040058,
        "val_r2": -4.640173760876944,
        "val_pearson_r": 0.5121024896699936,
        "n_iterations": 80,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.41642332077026367,
          "right_subspace_overlap_bottom_k": 0.47172409296035767,
          "interaction_matrix_overlap_top_k": -0.49041110277175903,
          "interaction_matrix_overlap_bottom_k": -0.14860893785953522,
          "effective_rank": 0.21776802837848663,
          "effective_rank_mergeability_score": 0.25498074293136597,
          "stable_rank": -0.05286429449915886,
          "spectral_gap": -0.05064934492111206,
          "singular_value_ratio": 0.04487953335046768,
          "layerwise_effective_rank": 0.10129202902317047,
          "layerwise_effective_rank_mergeability_score": -0.046617697924375534,
          "task_vector_cosine_similarity": -0.3494229316711426,
          "task_vector_l2_distance": -0.211480513215065,
          "task_vector_dot_product": -0.131384015083313,
          "weight_space_angle": -0.3431922495365143,
          "task_vector_magnitude_ratio": -0.18981309235095978,
          "singular_value_overlap": 0.19061145186424255,
          "subspace_overlap": 0.21941255033016205,
          "right_subspace_overlap": 0.18180036544799805,
          "activation_l2_distance": 0.8107679486274719,
          "activation_cosine_similarity": 0.6599052548408508,
          "activation_magnitude_ratio": 0.12343764305114746,
          "activation_dot_product": 0.1691121906042099,
          "encoder_gradient_cosine_similarity": 0.08392070233821869,
          "encoder_gradient_l2_distance": -0.19615232944488525,
          "encoder_gradient_dot_product": 0.18240804970264435,
          "input_gradient_cosine_similarity": 0.1923581063747406,
          "input_gradient_l2_distance": -0.26539814472198486,
          "input_gradient_dot_product": -0.016138067469000816
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_mse": 1.1513756593794764,
        "train_r2": -137.2252345126865,
        "train_pearson_r": -0.03025893683993378,
        "val_mse": 1.241270224049991,
        "val_r2": -290.09953717751,
        "val_pearson_r": 0.12069244414172982,
        "n_iterations": 206,
        "coefficients": {
          "right_subspace_overlap_top_k": 2.5502896308898926,
          "right_subspace_overlap_bottom_k": 0.5849870443344116,
          "interaction_matrix_overlap_top_k": -0.31319597363471985,
          "interaction_matrix_overlap_bottom_k": -1.5693198442459106,
          "effective_rank": 3.944392204284668,
          "effective_rank_mergeability_score": -1.5911939144134521,
          "stable_rank": 0.7671626806259155,
          "spectral_gap": 0.1016959697008133,
          "singular_value_ratio": -0.5944372415542603,
          "layerwise_effective_rank": -1.4904135465621948,
          "layerwise_effective_rank_mergeability_score": 3.304548978805542,
          "task_vector_cosine_similarity": -0.19412408769130707,
          "task_vector_l2_distance": 0.9801937937736511,
          "task_vector_dot_product": -2.978447198867798,
          "weight_space_angle": -1.6957229375839233,
          "task_vector_magnitude_ratio": -0.8222857117652893,
          "singular_value_overlap": -0.0035353354178369045,
          "subspace_overlap": 0.9361830353736877,
          "right_subspace_overlap": 0.15110310912132263,
          "activation_l2_distance": -1.426888346672058,
          "activation_cosine_similarity": -1.976518154144287,
          "activation_magnitude_ratio": -0.6579588651657104,
          "activation_dot_product": 0.5647348761558533,
          "encoder_gradient_cosine_similarity": 2.5720226764678955,
          "encoder_gradient_l2_distance": 1.1532189846038818,
          "encoder_gradient_dot_product": 0.7173742651939392,
          "input_gradient_cosine_similarity": -0.871402382850647,
          "input_gradient_l2_distance": -0.03598248213529587,
          "input_gradient_dot_product": -1.1127115488052368
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.49753891099959313,
        "train_r2": -61.91214124675254,
        "train_pearson_r": -0.12056235290485327,
        "val_mse": 0.618738279708686,
        "val_r2": -178.00530386054322,
        "val_pearson_r": -0.2759210545093806,
        "n_iterations": 149,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.6304349303245544,
          "right_subspace_overlap_bottom_k": 0.5048612952232361,
          "interaction_matrix_overlap_top_k": 0.9499167203903198,
          "interaction_matrix_overlap_bottom_k": -0.8613185286521912,
          "effective_rank": 0.1582455337047577,
          "effective_rank_mergeability_score": -0.37386733293533325,
          "stable_rank": 0.731697678565979,
          "spectral_gap": -0.5648202896118164,
          "singular_value_ratio": 0.15731768310070038,
          "layerwise_effective_rank": -0.950439453125,
          "layerwise_effective_rank_mergeability_score": 0.3105989098548889,
          "task_vector_cosine_similarity": -0.7244613170623779,
          "task_vector_l2_distance": 0.8638401031494141,
          "task_vector_dot_product": -0.5704941153526306,
          "weight_space_angle": 0.815262496471405,
          "task_vector_magnitude_ratio": -0.6953144669532776,
          "singular_value_overlap": -0.35085099935531616,
          "subspace_overlap": 0.6887421011924744,
          "right_subspace_overlap": 0.010146185755729675,
          "activation_l2_distance": -0.9911388754844666,
          "activation_cosine_similarity": 0.6988699436187744,
          "activation_magnitude_ratio": -0.12800750136375427,
          "activation_dot_product": -0.4880423843860626,
          "encoder_gradient_cosine_similarity": 0.958825409412384,
          "encoder_gradient_l2_distance": 1.3497878313064575,
          "encoder_gradient_dot_product": -0.4674294590950012,
          "input_gradient_cosine_similarity": 0.843874990940094,
          "input_gradient_l2_distance": -0.6618340611457825,
          "input_gradient_dot_product": 0.4132261872291565
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 12.950171585128563,
        "train_r2": -1452.9803689977957,
        "train_pearson_r": -0.06343750309580443,
        "val_mse": 41.987894925319566,
        "val_r2": -9548.335032231493,
        "val_pearson_r": 0.35594841714429376,
        "n_iterations": 63,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.014436899684369564,
          "right_subspace_overlap_bottom_k": 0.3163350522518158,
          "interaction_matrix_overlap_top_k": 0.1707332581281662,
          "interaction_matrix_overlap_bottom_k": -1.0626534223556519,
          "effective_rank": -0.45589256286621094,
          "effective_rank_mergeability_score": -0.0176740363240242,
          "stable_rank": 3.9233410358428955,
          "spectral_gap": 0.7201052904129028,
          "singular_value_ratio": 1.2178759574890137,
          "layerwise_effective_rank": 2.1323704719543457,
          "layerwise_effective_rank_mergeability_score": -2.7220802307128906,
          "task_vector_cosine_similarity": 3.2582666873931885,
          "task_vector_l2_distance": -0.9953839182853699,
          "task_vector_dot_product": -1.832664966583252,
          "weight_space_angle": -0.21217532455921173,
          "task_vector_magnitude_ratio": -0.8658031225204468,
          "singular_value_overlap": 0.7611960768699646,
          "subspace_overlap": -0.8659749031066895,
          "right_subspace_overlap": 2.975724458694458,
          "activation_l2_distance": -2.2554304599761963,
          "activation_cosine_similarity": -0.1744387298822403,
          "activation_magnitude_ratio": -0.9056522846221924,
          "activation_dot_product": -3.046515941619873,
          "encoder_gradient_cosine_similarity": -1.2990785837173462,
          "encoder_gradient_l2_distance": 1.9561480283737183,
          "encoder_gradient_dot_product": 0.9673145413398743,
          "input_gradient_cosine_similarity": 1.233271837234497,
          "input_gradient_l2_distance": -2.3193483352661133,
          "input_gradient_dot_product": 0.3733043968677521
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 129.15289385590236,
        "train_r2": -14657.794712449748,
        "train_pearson_r": -0.052074453201239324,
        "val_mse": 69.45558093847903,
        "val_r2": -12694.45703577888,
        "val_pearson_r": -0.10921420468525318,
        "n_iterations": 61,
        "coefficients": {
          "right_subspace_overlap_top_k": -1.5904872417449951,
          "right_subspace_overlap_bottom_k": 11.642648696899414,
          "interaction_matrix_overlap_top_k": 0.29719147086143494,
          "interaction_matrix_overlap_bottom_k": 7.720083713531494,
          "effective_rank": -9.165810585021973,
          "effective_rank_mergeability_score": -5.11166524887085,
          "stable_rank": -1.7710902690887451,
          "spectral_gap": 2.1171836853027344,
          "singular_value_ratio": 10.208305358886719,
          "layerwise_effective_rank": 2.640192747116089,
          "layerwise_effective_rank_mergeability_score": -7.662883281707764,
          "task_vector_cosine_similarity": -8.411931037902832,
          "task_vector_l2_distance": -4.628629207611084,
          "task_vector_dot_product": 1.952284336090088,
          "weight_space_angle": -6.973988056182861,
          "task_vector_magnitude_ratio": -4.80656099319458,
          "singular_value_overlap": 7.0379533767700195,
          "subspace_overlap": -4.175378799438477,
          "right_subspace_overlap": 2.670466899871826,
          "activation_l2_distance": -0.1597590148448944,
          "activation_cosine_similarity": -1.4940816164016724,
          "activation_magnitude_ratio": 4.803842544555664,
          "activation_dot_product": -5.444324016571045,
          "encoder_gradient_cosine_similarity": 7.9018168449401855,
          "encoder_gradient_l2_distance": -0.3589640259742737,
          "encoder_gradient_dot_product": -0.9982295632362366,
          "input_gradient_cosine_similarity": -4.663367748260498,
          "input_gradient_l2_distance": 3.6243600845336914,
          "input_gradient_dot_product": 5.712497711181641
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 2.6690058884898127,
        "train_r2": -320.61083676842634,
        "train_pearson_r": -0.043235400462969475,
        "val_mse": 1.2480185212554264,
        "val_r2": -339.4952784398235,
        "val_pearson_r": -0.25130685826127325,
        "n_iterations": 75,
        "coefficients": {
          "right_subspace_overlap_top_k": -2.50140380859375,
          "right_subspace_overlap_bottom_k": -0.5798665285110474,
          "interaction_matrix_overlap_top_k": -0.6784877777099609,
          "interaction_matrix_overlap_bottom_k": -1.0597987174987793,
          "effective_rank": -0.8104969263076782,
          "effective_rank_mergeability_score": -0.8499479293823242,
          "stable_rank": -2.146829843521118,
          "spectral_gap": -1.9765623807907104,
          "singular_value_ratio": -0.49744713306427,
          "layerwise_effective_rank": 1.4951201677322388,
          "layerwise_effective_rank_mergeability_score": 0.7636597156524658,
          "task_vector_cosine_similarity": 1.5221542119979858,
          "task_vector_l2_distance": 0.8060214519500732,
          "task_vector_dot_product": 2.4713194370269775,
          "weight_space_angle": -1.752139687538147,
          "task_vector_magnitude_ratio": -0.31196603178977966,
          "singular_value_overlap": 3.0649759769439697,
          "subspace_overlap": -0.9722149968147278,
          "right_subspace_overlap": 0.20870515704154968,
          "activation_l2_distance": 1.2712204456329346,
          "activation_cosine_similarity": 1.2236367464065552,
          "activation_magnitude_ratio": 1.1150524616241455,
          "activation_dot_product": 1.9687656164169312,
          "encoder_gradient_cosine_similarity": -1.3617290258407593,
          "encoder_gradient_l2_distance": -1.7881715297698975,
          "encoder_gradient_dot_product": 1.0752928256988525,
          "input_gradient_cosine_similarity": -0.30209001898765564,
          "input_gradient_l2_distance": 1.3840097188949585,
          "input_gradient_dot_product": 0.2064773440361023
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.6282989375073559,
        "train_r2": -70.95024908161945,
        "train_pearson_r": 0.3738622815918228,
        "val_mse": 0.6165485964885452,
        "val_r2": -138.35795872321586,
        "val_pearson_r": 0.31459427908972176,
        "n_iterations": 87,
        "coefficients": {
          "right_subspace_overlap_top_k": -1.315001368522644,
          "right_subspace_overlap_bottom_k": 1.3763978481292725,
          "interaction_matrix_overlap_top_k": 0.8569925427436829,
          "interaction_matrix_overlap_bottom_k": -0.6160089373588562,
          "effective_rank": 1.223780632019043,
          "effective_rank_mergeability_score": -1.5491119623184204,
          "stable_rank": 1.1705701351165771,
          "spectral_gap": 3.326742172241211,
          "singular_value_ratio": 0.9097999334335327,
          "layerwise_effective_rank": -0.8132448792457581,
          "layerwise_effective_rank_mergeability_score": 1.2627577781677246,
          "task_vector_cosine_similarity": -1.3569707870483398,
          "task_vector_l2_distance": -0.6106877326965332,
          "task_vector_dot_product": 0.02832013927400112,
          "weight_space_angle": -0.15663570165634155,
          "task_vector_magnitude_ratio": 0.27344414591789246,
          "singular_value_overlap": -0.12875863909721375,
          "subspace_overlap": 0.472516268491745,
          "right_subspace_overlap": 1.5037988424301147,
          "activation_l2_distance": -2.2344648838043213,
          "activation_cosine_similarity": -1.5965847969055176,
          "activation_magnitude_ratio": -0.954463541507721,
          "activation_dot_product": 0.6061603426933289,
          "encoder_gradient_cosine_similarity": -0.6170859932899475,
          "encoder_gradient_l2_distance": -1.2262178659439087,
          "encoder_gradient_dot_product": 0.9152623414993286,
          "input_gradient_cosine_similarity": 0.16438953578472137,
          "input_gradient_l2_distance": -0.8857584595680237,
          "input_gradient_dot_product": 0.9521542191505432
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.0904091103398261,
        "train_r2": -9.843834619278965,
        "train_pearson_r": 0.14791731507309872,
        "val_mse": 0.14793653035236384,
        "val_r2": -31.832277778690617,
        "val_pearson_r": -0.09117910105308148,
        "n_iterations": 78,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.28447410464286804,
          "right_subspace_overlap_bottom_k": 0.37607190012931824,
          "interaction_matrix_overlap_top_k": 0.6372925043106079,
          "interaction_matrix_overlap_bottom_k": 0.030611146241426468,
          "effective_rank": 0.2973686456680298,
          "effective_rank_mergeability_score": 0.8983745574951172,
          "stable_rank": -0.5122472047805786,
          "spectral_gap": 0.8805619478225708,
          "singular_value_ratio": 1.6252599954605103,
          "layerwise_effective_rank": -0.0736253559589386,
          "layerwise_effective_rank_mergeability_score": -0.29119908809661865,
          "task_vector_cosine_similarity": -1.1193583011627197,
          "task_vector_l2_distance": -0.5041283965110779,
          "task_vector_dot_product": 0.6420590281486511,
          "weight_space_angle": 0.0042143091559410095,
          "task_vector_magnitude_ratio": -0.06180283799767494,
          "singular_value_overlap": 0.04813191667199135,
          "subspace_overlap": -1.1441785097122192,
          "right_subspace_overlap": -0.19800005853176117,
          "activation_l2_distance": 0.050080444663763046,
          "activation_cosine_similarity": 0.11612047255039215,
          "activation_magnitude_ratio": -0.13010187447071075,
          "activation_dot_product": 0.08857373148202896,
          "encoder_gradient_cosine_similarity": -0.2070336490869522,
          "encoder_gradient_l2_distance": -0.2025892436504364,
          "encoder_gradient_dot_product": 0.5173092484474182,
          "input_gradient_cosine_similarity": -0.4406539797782898,
          "input_gradient_l2_distance": -0.32013511657714844,
          "input_gradient_dot_product": -0.2934861481189728
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.04864447994443028,
        "train_r2": -4.4219103428336055,
        "train_pearson_r": 0.23422002307141468,
        "val_mse": 0.037214017359573165,
        "val_r2": -6.515963827523398,
        "val_pearson_r": 0.4043282157661675,
        "n_iterations": 93,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.3816080391407013,
          "right_subspace_overlap_bottom_k": -0.0734051764011383,
          "interaction_matrix_overlap_top_k": -0.19777026772499084,
          "interaction_matrix_overlap_bottom_k": -0.20187021791934967,
          "effective_rank": 0.044559743255376816,
          "effective_rank_mergeability_score": -0.07137752324342728,
          "stable_rank": -0.13622617721557617,
          "spectral_gap": 0.4958967864513397,
          "singular_value_ratio": 0.24550095200538635,
          "layerwise_effective_rank": 0.24445851147174835,
          "layerwise_effective_rank_mergeability_score": 0.250678151845932,
          "task_vector_cosine_similarity": -0.760383665561676,
          "task_vector_l2_distance": -0.010225560516119003,
          "task_vector_dot_product": -0.04633937031030655,
          "weight_space_angle": 0.32240912318229675,
          "task_vector_magnitude_ratio": 0.19124853610992432,
          "singular_value_overlap": -0.07350420206785202,
          "subspace_overlap": 0.3234560787677765,
          "right_subspace_overlap": 0.39245858788490295,
          "activation_l2_distance": 0.07360031455755234,
          "activation_cosine_similarity": 0.04187604784965515,
          "activation_magnitude_ratio": 0.13750821352005005,
          "activation_dot_product": 0.17401988804340363,
          "encoder_gradient_cosine_similarity": 0.24301695823669434,
          "encoder_gradient_l2_distance": -0.7339674830436707,
          "encoder_gradient_dot_product": -0.31068679690361023,
          "input_gradient_cosine_similarity": -0.0035382481291890144,
          "input_gradient_l2_distance": 0.30387449264526367,
          "input_gradient_dot_product": -0.2492884248495102
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.48109693049863156,
        "train_r2": -56.09433643133025,
        "train_pearson_r": 0.09865435633212535,
        "val_mse": 0.19141116876572362,
        "val_r2": -32.39778489517878,
        "val_pearson_r": 0.16249381003485996,
        "n_iterations": 148,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.5058146715164185,
          "right_subspace_overlap_bottom_k": 0.30316370725631714,
          "interaction_matrix_overlap_top_k": -0.6701672077178955,
          "interaction_matrix_overlap_bottom_k": -1.6767505407333374,
          "effective_rank": -1.0418986082077026,
          "effective_rank_mergeability_score": -1.1249085664749146,
          "stable_rank": 1.5329595804214478,
          "spectral_gap": 1.8673521280288696,
          "singular_value_ratio": 0.322973370552063,
          "layerwise_effective_rank": -0.6533414721488953,
          "layerwise_effective_rank_mergeability_score": -0.0036418696399778128,
          "task_vector_cosine_similarity": 0.34141284227371216,
          "task_vector_l2_distance": 0.21577681601047516,
          "task_vector_dot_product": 0.6589002013206482,
          "weight_space_angle": 1.2171396017074585,
          "task_vector_magnitude_ratio": 0.2129986435174942,
          "singular_value_overlap": 0.05986422672867775,
          "subspace_overlap": 0.18912246823310852,
          "right_subspace_overlap": 1.4497933387756348,
          "activation_l2_distance": -1.051953673362732,
          "activation_cosine_similarity": -1.5842688083648682,
          "activation_magnitude_ratio": 0.4754161238670349,
          "activation_dot_product": 1.0739834308624268,
          "encoder_gradient_cosine_similarity": 0.5308530330657959,
          "encoder_gradient_l2_distance": -1.6170066595077515,
          "encoder_gradient_dot_product": -0.5736780762672424,
          "input_gradient_cosine_similarity": 0.31797248125076294,
          "input_gradient_l2_distance": 1.3990367650985718,
          "input_gradient_dot_product": -1.6803231239318848
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_mse": 0.8013472947283955,
        "train_r2": -90.3019340128508,
        "train_pearson_r": 0.3895280779641247,
        "val_mse": 0.3337533483637299,
        "val_r2": -64.03464062085165,
        "val_pearson_r": 0.16367048744319096,
        "n_iterations": 138,
        "coefficients": {
          "right_subspace_overlap_top_k": 1.4834988117218018,
          "right_subspace_overlap_bottom_k": -0.1798345446586609,
          "interaction_matrix_overlap_top_k": 0.9859234094619751,
          "interaction_matrix_overlap_bottom_k": 0.6523208022117615,
          "effective_rank": -0.02228233590722084,
          "effective_rank_mergeability_score": 1.7359191179275513,
          "stable_rank": -0.1487327367067337,
          "spectral_gap": -0.8201059699058533,
          "singular_value_ratio": 2.40718674659729,
          "layerwise_effective_rank": 0.18030652403831482,
          "layerwise_effective_rank_mergeability_score": 0.6149301528930664,
          "task_vector_cosine_similarity": -0.4914792776107788,
          "task_vector_l2_distance": -0.8592410087585449,
          "task_vector_dot_product": -0.576869785785675,
          "weight_space_angle": 0.5715564489364624,
          "task_vector_magnitude_ratio": -1.3886194229125977,
          "singular_value_overlap": -0.05007007718086243,
          "subspace_overlap": -0.41944190859794617,
          "right_subspace_overlap": -0.5467223525047302,
          "activation_l2_distance": 0.8541761040687561,
          "activation_cosine_similarity": 0.31001025438308716,
          "activation_magnitude_ratio": 0.6643768548965454,
          "activation_dot_product": 0.005785558372735977,
          "encoder_gradient_cosine_similarity": -0.17310959100723267,
          "encoder_gradient_l2_distance": 0.10446333885192871,
          "encoder_gradient_dot_product": 0.02450977824628353,
          "input_gradient_cosine_similarity": -1.2171050310134888,
          "input_gradient_l2_distance": -2.0441055297851562,
          "input_gradient_dot_product": -0.6601070165634155
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.012798093226570426,
        "train_r2": -0.44771663799536676,
        "train_pearson_r": 0.3422840943855713,
        "val_mse": 0.01053885515317851,
        "val_r2": -0.8337247473613099,
        "val_pearson_r": 0.22505471364409702,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.10291800647974014,
          "right_subspace_overlap_bottom_k": -0.011196163482964039,
          "interaction_matrix_overlap_top_k": 0.07038921117782593,
          "interaction_matrix_overlap_bottom_k": -0.040953923016786575,
          "effective_rank": 0.37952721118927,
          "effective_rank_mergeability_score": -0.10672205686569214,
          "stable_rank": -0.07791873812675476,
          "spectral_gap": 0.46182337403297424,
          "singular_value_ratio": 0.10448933392763138,
          "layerwise_effective_rank": -0.35045599937438965,
          "layerwise_effective_rank_mergeability_score": -0.020919060334563255,
          "task_vector_cosine_similarity": -0.020466333255171776,
          "task_vector_l2_distance": 0.024946006014943123,
          "task_vector_dot_product": -0.05595295503735542,
          "weight_space_angle": 0.498322993516922,
          "task_vector_magnitude_ratio": 0.2790937125682831,
          "singular_value_overlap": 0.032229043543338776,
          "subspace_overlap": 0.26530277729034424,
          "right_subspace_overlap": 0.018046321347355843,
          "activation_l2_distance": 0.043780580163002014,
          "activation_cosine_similarity": 0.2647574543952942,
          "activation_magnitude_ratio": -0.005755880381911993,
          "activation_dot_product": -0.13662073016166687,
          "encoder_gradient_cosine_similarity": 0.05733524262905121,
          "encoder_gradient_l2_distance": -0.2441592961549759,
          "encoder_gradient_dot_product": 0.0722896009683609,
          "input_gradient_cosine_similarity": -0.16251322627067566,
          "input_gradient_l2_distance": -0.12464579939842224,
          "input_gradient_dot_product": -0.11080383509397507
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.03578682764451973,
        "train_r2": -3.288264610317599,
        "train_pearson_r": 0.02730707226568575,
        "val_mse": 0.1763068972808706,
        "val_r2": -33.55152019505325,
        "val_pearson_r": -0.20714838354291354,
        "n_iterations": 58,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.010690414346754551,
          "right_subspace_overlap_bottom_k": 0.12489054352045059,
          "interaction_matrix_overlap_top_k": -0.5725926160812378,
          "interaction_matrix_overlap_bottom_k": 0.004905520938336849,
          "effective_rank": 0.03826458752155304,
          "effective_rank_mergeability_score": -0.25639525055885315,
          "stable_rank": -0.1418972909450531,
          "spectral_gap": 0.3307674825191498,
          "singular_value_ratio": 0.4345223307609558,
          "layerwise_effective_rank": -0.036205142736434937,
          "layerwise_effective_rank_mergeability_score": 0.5438504815101624,
          "task_vector_cosine_similarity": -0.15018188953399658,
          "task_vector_l2_distance": 0.020171741023659706,
          "task_vector_dot_product": 0.19447161257266998,
          "weight_space_angle": 0.22015704214572906,
          "task_vector_magnitude_ratio": 0.23959892988204956,
          "singular_value_overlap": 0.08571982383728027,
          "subspace_overlap": 0.08948265761137009,
          "right_subspace_overlap": -0.18515732884407043,
          "activation_l2_distance": -0.19809415936470032,
          "activation_cosine_similarity": -0.1276421844959259,
          "activation_magnitude_ratio": 0.19616670906543732,
          "activation_dot_product": 0.21160471439361572,
          "encoder_gradient_cosine_similarity": -0.05482815206050873,
          "encoder_gradient_l2_distance": 0.09522203356027603,
          "encoder_gradient_dot_product": 0.35039326548576355,
          "input_gradient_cosine_similarity": -0.15093985199928284,
          "input_gradient_l2_distance": -0.15505646169185638,
          "input_gradient_dot_product": -0.1407725065946579
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.08283167953641475,
        "train_r2": -13.50497108510949,
        "train_pearson_r": 0.11643061892149215,
        "val_mse": 0.058690768198862445,
        "val_r2": -20.657873303289566,
        "val_pearson_r": 0.22254226743531835,
        "n_iterations": 275,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04627827927470207,
          "right_subspace_overlap_bottom_k": 0.13383996486663818,
          "interaction_matrix_overlap_top_k": 0.3155333399772644,
          "interaction_matrix_overlap_bottom_k": -0.03545962646603584,
          "effective_rank": -1.3818845748901367,
          "effective_rank_mergeability_score": 0.5992591977119446,
          "stable_rank": 0.7977613210678101,
          "spectral_gap": 0.7771854400634766,
          "singular_value_ratio": -0.9074245691299438,
          "layerwise_effective_rank": 1.1886340379714966,
          "layerwise_effective_rank_mergeability_score": -0.37273573875427246,
          "task_vector_cosine_similarity": 0.08239645510911942,
          "task_vector_l2_distance": 0.06364385783672333,
          "task_vector_dot_product": -0.3109329044818878,
          "weight_space_angle": -0.1050109788775444,
          "task_vector_magnitude_ratio": 1.4821373224258423,
          "singular_value_overlap": 0.1903519481420517,
          "subspace_overlap": -0.700501024723053,
          "right_subspace_overlap": -0.48305609822273254,
          "activation_l2_distance": -0.13290195167064667,
          "activation_cosine_similarity": 0.1057942733168602,
          "activation_magnitude_ratio": 0.01746051199734211,
          "activation_dot_product": -0.08742859959602356,
          "encoder_gradient_cosine_similarity": 0.046080220490694046,
          "encoder_gradient_l2_distance": 0.0939038097858429,
          "encoder_gradient_dot_product": -0.14647765457630157,
          "input_gradient_cosine_similarity": -0.2201589196920395,
          "input_gradient_l2_distance": -0.6147937774658203,
          "input_gradient_dot_product": 0.5594912767410278
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.17972445024506042,
        "train_r2": -19.44259636234976,
        "train_pearson_r": 0.11512376183330579,
        "val_mse": 0.15172369582742895,
        "val_r2": -30.499069291999355,
        "val_pearson_r": 0.10937126052866603,
        "n_iterations": 60,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.4076809585094452,
          "right_subspace_overlap_bottom_k": 0.3323339521884918,
          "interaction_matrix_overlap_top_k": 0.5327751636505127,
          "interaction_matrix_overlap_bottom_k": -0.26880088448524475,
          "effective_rank": 0.04236004501581192,
          "effective_rank_mergeability_score": 0.7681547403335571,
          "stable_rank": 0.23454323410987854,
          "spectral_gap": 1.1202551126480103,
          "singular_value_ratio": 0.06692349910736084,
          "layerwise_effective_rank": 0.6882368922233582,
          "layerwise_effective_rank_mergeability_score": -0.9252102375030518,
          "task_vector_cosine_similarity": -0.26449090242385864,
          "task_vector_l2_distance": -0.01246357336640358,
          "task_vector_dot_product": 0.5693683624267578,
          "weight_space_angle": 0.7922592759132385,
          "task_vector_magnitude_ratio": 0.018213743343949318,
          "singular_value_overlap": -0.6248651742935181,
          "subspace_overlap": -0.3018362820148468,
          "right_subspace_overlap": 0.12812311947345734,
          "activation_l2_distance": -0.791545569896698,
          "activation_cosine_similarity": -0.2081284075975418,
          "activation_magnitude_ratio": -0.06427750736474991,
          "activation_dot_product": -0.35151174664497375,
          "encoder_gradient_cosine_similarity": 0.1957361400127411,
          "encoder_gradient_l2_distance": -0.26816436648368835,
          "encoder_gradient_dot_product": -0.005227243062108755,
          "input_gradient_cosine_similarity": -0.2668137848377228,
          "input_gradient_l2_distance": -0.20063166320323944,
          "input_gradient_dot_product": 0.4689571261405945
        }
      }
    ],
    "optimization_params": {
      "objective": "MSE",
      "n_iterations": 1000,
      "learning_rate": 0.01,
      "patience": 50,
      "convergence_threshold": 1e-06
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_mse": 25.369529973883203,
      "train_r2": -7183.166842571682,
      "train_pearson_r": -0.00840698615932825,
      "train_pearson_p": 0.6333434719933269,
      "val_mse": 36.654481386195805,
      "val_r2": -10378.849694729162,
      "val_pearson_r": -0.0029448080897597952,
      "val_pearson_p": 0.9557212942646698
    },
    "per_fold_stats": {
      "train_mse_mean": 25.53688115633603,
      "train_mse_std": 103.57236926618279,
      "val_mse_mean": 34.54967890944381,
      "val_mse_std": 144.46447303261232,
      "train_r_mean": 0.1792491015710598,
      "train_r_std": 0.2829509031001972,
      "val_r_mean": 0.07050800523315728,
      "val_r_std": 0.3108038543721988
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.49118074774742126,
      "right_subspace_overlap_bottom_k": -0.07264728844165802,
      "interaction_matrix_overlap_top_k": -0.2584740221500397,
      "interaction_matrix_overlap_bottom_k": -0.2751474380493164,
      "effective_rank": 0.04194309189915657,
      "effective_rank_mergeability_score": -0.5323687195777893,
      "stable_rank": 0.2875727117061615,
      "spectral_gap": -0.5615673065185547,
      "singular_value_ratio": 0.13742555677890778,
      "layerwise_effective_rank": -0.24619996547698975,
      "layerwise_effective_rank_mergeability_score": -0.33378154039382935,
      "task_vector_cosine_similarity": 0.3877089321613312,
      "task_vector_l2_distance": 0.141163632273674,
      "task_vector_dot_product": 0.4344313144683838,
      "weight_space_angle": 0.5862447023391724,
      "task_vector_magnitude_ratio": 0.11917342990636826,
      "singular_value_overlap": 0.13661114871501923,
      "subspace_overlap": -0.9108210802078247,
      "right_subspace_overlap": -0.4325525760650635,
      "activation_l2_distance": 0.3966771960258484,
      "activation_cosine_similarity": 0.0922483280301094,
      "activation_magnitude_ratio": 0.14647266268730164,
      "activation_dot_product": 0.4417017102241516,
      "encoder_gradient_cosine_similarity": 0.4309094548225403,
      "encoder_gradient_l2_distance": 0.33690136671066284,
      "encoder_gradient_dot_product": -0.5964588522911072,
      "input_gradient_cosine_similarity": 0.37651506066322327,
      "input_gradient_l2_distance": 0.19318506121635437,
      "input_gradient_dot_product": 0.034424297511577606
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 2.212162494659424,
      "right_subspace_overlap_bottom_k": 0.9689323902130127,
      "interaction_matrix_overlap_top_k": 1.8773070573806763,
      "interaction_matrix_overlap_bottom_k": 3.2985281944274902,
      "effective_rank": 1.4739174842834473,
      "effective_rank_mergeability_score": 1.8611639738082886,
      "stable_rank": 2.244232416152954,
      "spectral_gap": 2.880911350250244,
      "singular_value_ratio": 2.7769079208374023,
      "layerwise_effective_rank": 2.0178842544555664,
      "layerwise_effective_rank_mergeability_score": 1.0447567701339722,
      "task_vector_cosine_similarity": 4.206647872924805,
      "task_vector_l2_distance": 1.811143398284912,
      "task_vector_dot_product": 1.7809165716171265,
      "weight_space_angle": 2.673119068145752,
      "task_vector_magnitude_ratio": 0.8952328562736511,
      "singular_value_overlap": 1.5416101217269897,
      "subspace_overlap": 4.117164611816406,
      "right_subspace_overlap": 3.4015040397644043,
      "activation_l2_distance": 1.56473970413208,
      "activation_cosine_similarity": 1.8943023681640625,
      "activation_magnitude_ratio": 0.8496588468551636,
      "activation_dot_product": 2.0479447841644287,
      "encoder_gradient_cosine_similarity": 1.0532304048538208,
      "encoder_gradient_l2_distance": 2.3635878562927246,
      "encoder_gradient_dot_product": 2.1953823566436768,
      "input_gradient_cosine_similarity": 1.9505232572555542,
      "input_gradient_l2_distance": 0.9390873312950134,
      "input_gradient_dot_product": 1.638098955154419
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 2.335065632448343,
        "train_r2": -699.4341433497739,
        "train_pearson_r": -0.10667782378333449,
        "val_mse": 2.3663696248017936,
        "val_r2": -1551.201244029165,
        "val_pearson_r": -0.03771063536156652,
        "n_iterations": 61,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.8046399354934692,
          "right_subspace_overlap_bottom_k": 0.01310704741626978,
          "interaction_matrix_overlap_top_k": 1.4372572898864746,
          "interaction_matrix_overlap_bottom_k": 1.2640669345855713,
          "effective_rank": -2.0103468894958496,
          "effective_rank_mergeability_score": -1.6488672494888306,
          "stable_rank": -0.29944777488708496,
          "spectral_gap": -0.056719981133937836,
          "singular_value_ratio": 0.38229095935821533,
          "layerwise_effective_rank": -0.10535129904747009,
          "layerwise_effective_rank_mergeability_score": -0.41558966040611267,
          "task_vector_cosine_similarity": -0.9740012288093567,
          "task_vector_l2_distance": 2.411975622177124,
          "task_vector_dot_product": -0.8806260228157043,
          "weight_space_angle": 1.4059170484542847,
          "task_vector_magnitude_ratio": -0.43879491090774536,
          "singular_value_overlap": -0.34815680980682373,
          "subspace_overlap": 1.7406615018844604,
          "right_subspace_overlap": 0.06845008581876755,
          "activation_l2_distance": 0.2565516233444214,
          "activation_cosine_similarity": -0.23517026007175446,
          "activation_magnitude_ratio": 0.7604434490203857,
          "activation_dot_product": -0.0794607624411583,
          "encoder_gradient_cosine_similarity": 1.007149577140808,
          "encoder_gradient_l2_distance": -0.6068378686904907,
          "encoder_gradient_dot_product": 0.3245680034160614,
          "input_gradient_cosine_similarity": -0.029024118557572365,
          "input_gradient_l2_distance": 0.4482973515987396,
          "input_gradient_dot_product": -1.6253703832626343
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.4980280091951502,
        "train_r2": -136.56115282844675,
        "train_pearson_r": -0.3242885978209018,
        "val_mse": 0.492406637483008,
        "val_r2": -291.5110784044485,
        "val_pearson_r": -0.2622825839666062,
        "n_iterations": 55,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.32506832480430603,
          "right_subspace_overlap_bottom_k": -0.2530561089515686,
          "interaction_matrix_overlap_top_k": -0.09380067884922028,
          "interaction_matrix_overlap_bottom_k": 0.42403414845466614,
          "effective_rank": -0.9093276858329773,
          "effective_rank_mergeability_score": 0.5760561227798462,
          "stable_rank": 0.240371435880661,
          "spectral_gap": 0.15242400765419006,
          "singular_value_ratio": 0.6690794825553894,
          "layerwise_effective_rank": -0.18650589883327484,
          "layerwise_effective_rank_mergeability_score": -0.5361496210098267,
          "task_vector_cosine_similarity": -0.2007555067539215,
          "task_vector_l2_distance": 0.6217156052589417,
          "task_vector_dot_product": -0.5779979825019836,
          "weight_space_angle": -0.3871016502380371,
          "task_vector_magnitude_ratio": 0.444272518157959,
          "singular_value_overlap": -0.028744805604219437,
          "subspace_overlap": -0.7189441919326782,
          "right_subspace_overlap": -0.771342933177948,
          "activation_l2_distance": -0.10053893178701401,
          "activation_cosine_similarity": -0.10845425724983215,
          "activation_magnitude_ratio": 1.141802191734314,
          "activation_dot_product": -0.1925705075263977,
          "encoder_gradient_cosine_similarity": 0.8066096901893616,
          "encoder_gradient_l2_distance": 1.2067508697509766,
          "encoder_gradient_dot_product": 0.36606064438819885,
          "input_gradient_cosine_similarity": -0.3507368862628937,
          "input_gradient_l2_distance": -0.49010491371154785,
          "input_gradient_dot_product": -0.07402987033128738
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 22.428593858772167,
        "train_r2": -6176.212330071324,
        "train_pearson_r": -0.06403056944861224,
        "val_mse": 20.786403336861085,
        "val_r2": -10318.235809848444,
        "val_pearson_r": -0.11300886962898024,
        "n_iterations": 51,
        "coefficients": {
          "right_subspace_overlap_top_k": -2.4669930934906006,
          "right_subspace_overlap_bottom_k": 3.469865083694458,
          "interaction_matrix_overlap_top_k": 0.5845297574996948,
          "interaction_matrix_overlap_bottom_k": 6.1941237449646,
          "effective_rank": -4.441277503967285,
          "effective_rank_mergeability_score": -1.8942112922668457,
          "stable_rank": 1.5079234838485718,
          "spectral_gap": 3.9129257202148438,
          "singular_value_ratio": -4.806225299835205,
          "layerwise_effective_rank": 3.4819657802581787,
          "layerwise_effective_rank_mergeability_score": -2.151150941848755,
          "task_vector_cosine_similarity": -9.829425811767578,
          "task_vector_l2_distance": -0.759151816368103,
          "task_vector_dot_product": 1.2689749002456665,
          "weight_space_angle": -5.371304035186768,
          "task_vector_magnitude_ratio": 2.098572015762329,
          "singular_value_overlap": 3.0177316665649414,
          "subspace_overlap": -4.763068675994873,
          "right_subspace_overlap": 3.471689462661743,
          "activation_l2_distance": 2.254373550415039,
          "activation_cosine_similarity": 2.8649661540985107,
          "activation_magnitude_ratio": 0.49800026416778564,
          "activation_dot_product": 4.686839580535889,
          "encoder_gradient_cosine_similarity": -0.2743563652038574,
          "encoder_gradient_l2_distance": -2.9759511947631836,
          "encoder_gradient_dot_product": -9.30392074584961,
          "input_gradient_cosine_similarity": 3.96216082572937,
          "input_gradient_l2_distance": 2.3309409618377686,
          "input_gradient_dot_product": 4.4100022315979
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 1.0123356334900682,
        "train_r2": -283.97247629158284,
        "train_pearson_r": -0.12744178913649387,
        "val_mse": 0.7342876896213559,
        "val_r2": -418.85609672198916,
        "val_pearson_r": -0.23808876944796897,
        "n_iterations": 123,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.9413014054298401,
          "right_subspace_overlap_bottom_k": -1.0604901313781738,
          "interaction_matrix_overlap_top_k": -3.641871929168701,
          "interaction_matrix_overlap_bottom_k": 1.5133858919143677,
          "effective_rank": 1.1871129274368286,
          "effective_rank_mergeability_score": 1.2689976692199707,
          "stable_rank": -0.8481199741363525,
          "spectral_gap": -1.755454659461975,
          "singular_value_ratio": 0.21181055903434753,
          "layerwise_effective_rank": 0.4099409580230713,
          "layerwise_effective_rank_mergeability_score": 1.2801849842071533,
          "task_vector_cosine_similarity": 3.2292120456695557,
          "task_vector_l2_distance": 1.299109935760498,
          "task_vector_dot_product": 0.1807389259338379,
          "weight_space_angle": -0.2600492835044861,
          "task_vector_magnitude_ratio": -0.1517050713300705,
          "singular_value_overlap": 0.09215690195560455,
          "subspace_overlap": -1.8515243530273438,
          "right_subspace_overlap": 2.1683874130249023,
          "activation_l2_distance": -0.27276042103767395,
          "activation_cosine_similarity": 1.0673532485961914,
          "activation_magnitude_ratio": -0.3546810746192932,
          "activation_dot_product": -0.8126624822616577,
          "encoder_gradient_cosine_similarity": 0.10368287563323975,
          "encoder_gradient_l2_distance": 1.6842199563980103,
          "encoder_gradient_dot_product": 0.839338481426239,
          "input_gradient_cosine_similarity": -2.7399771213531494,
          "input_gradient_l2_distance": -0.4181748032569885,
          "input_gradient_dot_product": -0.43668434023857117
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.05012060933014964,
        "train_r2": -12.98927364975714,
        "train_pearson_r": 0.1875404646163995,
        "val_mse": 0.043135508793776416,
        "val_r2": -18.004003841075985,
        "val_pearson_r": 0.02560232922128426,
        "n_iterations": 296,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.5259504318237305,
          "right_subspace_overlap_bottom_k": -0.4307129383087158,
          "interaction_matrix_overlap_top_k": 0.42386552691459656,
          "interaction_matrix_overlap_bottom_k": 0.1848170906305313,
          "effective_rank": -0.001318363705649972,
          "effective_rank_mergeability_score": 0.8342218995094299,
          "stable_rank": -0.1504540592432022,
          "spectral_gap": -0.6599244475364685,
          "singular_value_ratio": -0.3269902169704437,
          "layerwise_effective_rank": 0.9106295108795166,
          "layerwise_effective_rank_mergeability_score": -0.1864033043384552,
          "task_vector_cosine_similarity": 0.08535809069871902,
          "task_vector_l2_distance": 0.18835383653640747,
          "task_vector_dot_product": -0.44694745540618896,
          "weight_space_angle": 0.37348031997680664,
          "task_vector_magnitude_ratio": -0.3352809250354767,
          "singular_value_overlap": 0.3788592517375946,
          "subspace_overlap": -0.0718473270535469,
          "right_subspace_overlap": -0.5799144506454468,
          "activation_l2_distance": 0.18240800499916077,
          "activation_cosine_similarity": 0.13785672187805176,
          "activation_magnitude_ratio": 0.028685610741376877,
          "activation_dot_product": 0.14060263335704803,
          "encoder_gradient_cosine_similarity": 0.2887648046016693,
          "encoder_gradient_l2_distance": 0.06229483336210251,
          "encoder_gradient_dot_product": 0.18317361176013947,
          "input_gradient_cosine_similarity": -0.14768750965595245,
          "input_gradient_l2_distance": 0.01591760478913784,
          "input_gradient_dot_product": -0.6101395487785339
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 6.827197209487792,
        "train_r2": -1905.4914882380167,
        "train_pearson_r": -0.11035815380615344,
        "val_mse": 1.4426218877903965,
        "val_r2": -823.1078642698473,
        "val_pearson_r": 0.04695408427247934,
        "n_iterations": 60,
        "coefficients": {
          "right_subspace_overlap_top_k": 2.1095550060272217,
          "right_subspace_overlap_bottom_k": -1.8060457706451416,
          "interaction_matrix_overlap_top_k": -3.588289499282837,
          "interaction_matrix_overlap_bottom_k": -0.9053723216056824,
          "effective_rank": -0.4872592091560364,
          "effective_rank_mergeability_score": -3.946514129638672,
          "stable_rank": -2.2907629013061523,
          "spectral_gap": -1.3679742813110352,
          "singular_value_ratio": -1.9120988845825195,
          "layerwise_effective_rank": -1.76518976688385,
          "layerwise_effective_rank_mergeability_score": -0.06779622286558151,
          "task_vector_cosine_similarity": 0.7049704790115356,
          "task_vector_l2_distance": 4.490325450897217,
          "task_vector_dot_product": -0.29328882694244385,
          "weight_space_angle": 0.140584796667099,
          "task_vector_magnitude_ratio": 1.4452416896820068,
          "singular_value_overlap": 3.127925157546997,
          "subspace_overlap": 2.5143048763275146,
          "right_subspace_overlap": 0.6779171228408813,
          "activation_l2_distance": -2.691465377807617,
          "activation_cosine_similarity": 1.2171456813812256,
          "activation_magnitude_ratio": 2.1358160972595215,
          "activation_dot_product": -2.3482718467712402,
          "encoder_gradient_cosine_similarity": 1.5407594442367554,
          "encoder_gradient_l2_distance": -1.2301616668701172,
          "encoder_gradient_dot_product": -2.8533568382263184,
          "input_gradient_cosine_similarity": 0.9525247812271118,
          "input_gradient_l2_distance": 3.2889063358306885,
          "input_gradient_dot_product": 4.155373573303223
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_mse": 0.008221230631572454,
        "train_r2": -1.3444249776163577,
        "train_pearson_r": 0.39174710945141106,
        "val_mse": 0.06757216360098722,
        "val_r2": -49.05602565720321,
        "val_pearson_r": -0.3731535034946855,
        "n_iterations": 498,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.16957594454288483,
          "right_subspace_overlap_bottom_k": 0.030012689530849457,
          "interaction_matrix_overlap_top_k": -0.11760368198156357,
          "interaction_matrix_overlap_bottom_k": -0.11357004195451736,
          "effective_rank": 0.039740752428770065,
          "effective_rank_mergeability_score": 0.011882560327649117,
          "stable_rank": -0.24854609370231628,
          "spectral_gap": 0.21703346073627472,
          "singular_value_ratio": 0.08003011345863342,
          "layerwise_effective_rank": 0.32903268933296204,
          "layerwise_effective_rank_mergeability_score": 0.002698990050703287,
          "task_vector_cosine_similarity": 0.3125002384185791,
          "task_vector_l2_distance": 0.09372766315937042,
          "task_vector_dot_product": -0.4546149671077728,
          "weight_space_angle": 0.3322305977344513,
          "task_vector_magnitude_ratio": 0.12068261951208115,
          "singular_value_overlap": 0.12021558731794357,
          "subspace_overlap": -0.03953051194548607,
          "right_subspace_overlap": 0.025439472869038582,
          "activation_l2_distance": 0.21233844757080078,
          "activation_cosine_similarity": 0.24785888195037842,
          "activation_magnitude_ratio": 0.056187137961387634,
          "activation_dot_product": -0.01972304843366146,
          "encoder_gradient_cosine_similarity": 0.04635559394955635,
          "encoder_gradient_l2_distance": -0.18165425956249237,
          "encoder_gradient_dot_product": 0.07677225023508072,
          "input_gradient_cosine_similarity": -0.23282453417778015,
          "input_gradient_l2_distance": -0.054235681891441345,
          "input_gradient_dot_product": -0.062378499656915665
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.013601017052557693,
        "train_r2": -3.0580782750281426,
        "train_pearson_r": 0.28273183678852454,
        "val_mse": 0.05006858778932872,
        "val_r2": -26.088317312813146,
        "val_pearson_r": 0.3316140819784963,
        "n_iterations": 113,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.07568168640136719,
          "right_subspace_overlap_bottom_k": -0.06294771283864975,
          "interaction_matrix_overlap_top_k": -0.023612072691321373,
          "interaction_matrix_overlap_bottom_k": 0.006939372513443232,
          "effective_rank": 0.4070219397544861,
          "effective_rank_mergeability_score": 0.15917754173278809,
          "stable_rank": -0.2245718389749527,
          "spectral_gap": 0.22193248569965363,
          "singular_value_ratio": -0.18865567445755005,
          "layerwise_effective_rank": 0.1620994210243225,
          "layerwise_effective_rank_mergeability_score": 0.09978175908327103,
          "task_vector_cosine_similarity": -0.03345513343811035,
          "task_vector_l2_distance": 0.03593230992555618,
          "task_vector_dot_product": 0.13845835626125336,
          "weight_space_angle": 0.2710597515106201,
          "task_vector_magnitude_ratio": 0.3517487645149231,
          "singular_value_overlap": 0.18943169713020325,
          "subspace_overlap": -0.3366999626159668,
          "right_subspace_overlap": 0.1472785770893097,
          "activation_l2_distance": -0.04162700101733208,
          "activation_cosine_similarity": 0.036138057708740234,
          "activation_magnitude_ratio": 0.04009250923991203,
          "activation_dot_product": 0.0469173789024353,
          "encoder_gradient_cosine_similarity": 0.06310989707708359,
          "encoder_gradient_l2_distance": 0.03180878609418869,
          "encoder_gradient_dot_product": 0.18160417675971985,
          "input_gradient_cosine_similarity": -0.24092504382133484,
          "input_gradient_l2_distance": -0.2880406677722931,
          "input_gradient_dot_product": -0.0775517076253891
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 0.0271780178425261,
        "train_r2": -6.569035130795441,
        "train_pearson_r": 0.1230867284338681,
        "val_mse": 0.048402210889112784,
        "val_r2": -16.60688516473354,
        "val_pearson_r": 0.49137100520720844,
        "n_iterations": 112,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011433741077780724,
          "right_subspace_overlap_bottom_k": -0.2635263204574585,
          "interaction_matrix_overlap_top_k": 0.03899678960442543,
          "interaction_matrix_overlap_bottom_k": 0.24006113409996033,
          "effective_rank": 0.055504895746707916,
          "effective_rank_mergeability_score": 0.13837452232837677,
          "stable_rank": 0.11394944787025452,
          "spectral_gap": 0.2577327787876129,
          "singular_value_ratio": 0.006635558325797319,
          "layerwise_effective_rank": 0.27438730001449585,
          "layerwise_effective_rank_mergeability_score": -0.13120393455028534,
          "task_vector_cosine_similarity": -0.04693824425339699,
          "task_vector_l2_distance": 0.08125706762075424,
          "task_vector_dot_product": 0.0641435980796814,
          "weight_space_angle": 0.28702354431152344,
          "task_vector_magnitude_ratio": -0.06771818548440933,
          "singular_value_overlap": 0.1039644181728363,
          "subspace_overlap": 0.05039007589221001,
          "right_subspace_overlap": -0.40174156427383423,
          "activation_l2_distance": 0.02260473370552063,
          "activation_cosine_similarity": 0.23264434933662415,
          "activation_magnitude_ratio": 0.09120301902294159,
          "activation_dot_product": -0.039715275168418884,
          "encoder_gradient_cosine_similarity": 0.09703658521175385,
          "encoder_gradient_l2_distance": -0.3219609558582306,
          "encoder_gradient_dot_product": -0.027163879945874214,
          "input_gradient_cosine_similarity": 0.1427600085735321,
          "input_gradient_l2_distance": -0.047350622713565826,
          "input_gradient_dot_product": 0.03676128014922142
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 476.47721267939517,
        "train_r2": -146478.89400616646,
        "train_pearson_r": -0.0010536826302935814,
        "val_mse": 663.9521788795038,
        "val_r2": -199727.08713760594,
        "val_pearson_r": 0.31508104744104976,
        "n_iterations": 52,
        "coefficients": {
          "right_subspace_overlap_top_k": 9.434085845947266,
          "right_subspace_overlap_bottom_k": -0.7510902285575867,
          "interaction_matrix_overlap_top_k": 5.745115280151367,
          "interaction_matrix_overlap_bottom_k": -13.179398536682129,
          "effective_rank": 3.81300950050354,
          "effective_rank_mergeability_score": -7.065197944641113,
          "stable_rank": 9.489709854125977,
          "spectral_gap": -12.212890625,
          "singular_value_ratio": 11.182500839233398,
          "layerwise_effective_rank": -7.8725996017456055,
          "layerwise_effective_rank_mergeability_score": -3.440272808074951,
          "task_vector_cosine_similarity": 15.668519973754883,
          "task_vector_l2_distance": -6.093760013580322,
          "task_vector_dot_product": 7.775505542755127,
          "weight_space_angle": 10.604693412780762,
          "task_vector_magnitude_ratio": -2.6869091987609863,
          "singular_value_overlap": -5.244704246520996,
          "subspace_overlap": -17.630775451660156,
          "right_subspace_overlap": -14.681940078735352,
          "activation_l2_distance": 6.048007011413574,
          "activation_cosine_similarity": -7.602232456207275,
          "activation_magnitude_ratio": -2.7087066173553467,
          "activation_dot_product": 7.671995162963867,
          "encoder_gradient_cosine_similarity": 4.626860618591309,
          "encoder_gradient_l2_distance": 9.881120681762695,
          "encoder_gradient_dot_product": -2.6708288192749023,
          "input_gradient_cosine_similarity": 7.3700432777404785,
          "input_gradient_l2_distance": -0.9766027331352234,
          "input_gradient_dot_product": -3.5040931701660156
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.008373200191702086,
        "train_r2": -1.8483450247490976,
        "train_pearson_r": 0.538985638019935,
        "val_mse": 0.01717326979521916,
        "val_r2": -11.91012815194397,
        "val_pearson_r": 0.21833783217268507,
        "n_iterations": 232,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.12133743613958359,
          "right_subspace_overlap_bottom_k": -0.09956487268209457,
          "interaction_matrix_overlap_top_k": 0.0644129291176796,
          "interaction_matrix_overlap_bottom_k": -0.0486823134124279,
          "effective_rank": 0.14559583365917206,
          "effective_rank_mergeability_score": -0.16584190726280212,
          "stable_rank": -0.0860387533903122,
          "spectral_gap": 0.5456593632698059,
          "singular_value_ratio": 0.3294062912464142,
          "layerwise_effective_rank": 0.10892347991466522,
          "layerwise_effective_rank_mergeability_score": 0.1896226406097412,
          "task_vector_cosine_similarity": -0.10666650533676147,
          "task_vector_l2_distance": 0.06831710785627365,
          "task_vector_dot_product": 0.0726219192147255,
          "weight_space_angle": 0.17759576439857483,
          "task_vector_magnitude_ratio": 0.09978950023651123,
          "singular_value_overlap": 0.12655088305473328,
          "subspace_overlap": -0.2248317301273346,
          "right_subspace_overlap": 0.20007745921611786,
          "activation_l2_distance": 0.029311101883649826,
          "activation_cosine_similarity": 0.27074968814849854,
          "activation_magnitude_ratio": 0.023828303441405296,
          "activation_dot_product": -0.13085094094276428,
          "encoder_gradient_cosine_similarity": 0.009289327077567577,
          "encoder_gradient_l2_distance": -0.3029657006263733,
          "encoder_gradient_dot_product": 0.09781337529420853,
          "input_gradient_cosine_similarity": -0.11992551386356354,
          "input_gradient_l2_distance": -0.04441666603088379,
          "input_gradient_dot_product": -0.10840389877557755
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.007581749962365281,
        "train_r2": -1.077871830862029,
        "train_pearson_r": 0.5052572794519404,
        "val_mse": 0.007446269749013798,
        "val_r2": -3.361819093305029,
        "val_pearson_r": 0.3670579231039022,
        "n_iterations": 701,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.9120216965675354,
          "right_subspace_overlap_bottom_k": 0.5676639080047607,
          "interaction_matrix_overlap_top_k": 0.08839260041713715,
          "interaction_matrix_overlap_bottom_k": -0.7900233268737793,
          "effective_rank": 0.7804580926895142,
          "effective_rank_mergeability_score": 0.35171589255332947,
          "stable_rank": 0.04817047342658043,
          "spectral_gap": -0.1311623901128769,
          "singular_value_ratio": -0.5143970847129822,
          "layerwise_effective_rank": -0.5232419967651367,
          "layerwise_effective_rank_mergeability_score": -0.16976378858089447,
          "task_vector_cosine_similarity": 0.2563469409942627,
          "task_vector_l2_distance": -0.006178678013384342,
          "task_vector_dot_product": 0.05581904202699661,
          "weight_space_angle": 0.6481209397315979,
          "task_vector_magnitude_ratio": 0.24900779128074646,
          "singular_value_overlap": 0.060692280530929565,
          "subspace_overlap": -0.4858104884624481,
          "right_subspace_overlap": -0.356726735830307,
          "activation_l2_distance": 0.12725643813610077,
          "activation_cosine_similarity": 0.26355043053627014,
          "activation_magnitude_ratio": 0.003717282088473439,
          "activation_dot_product": -0.07980749011039734,
          "encoder_gradient_cosine_similarity": 0.035911232233047485,
          "encoder_gradient_l2_distance": -0.2292715609073639,
          "encoder_gradient_dot_product": 0.0741337388753891,
          "input_gradient_cosine_similarity": -0.10513201355934143,
          "input_gradient_l2_distance": -0.0319729782640934,
          "input_gradient_dot_product": -0.09965645521879196
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.053395387990758415,
        "train_r2": -14.275418292619982,
        "train_pearson_r": -0.027468227909470126,
        "val_mse": 0.14788070727069663,
        "val_r2": -88.39767187142797,
        "val_pearson_r": -0.21589840864048127,
        "n_iterations": 79,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.058340758085250854,
          "right_subspace_overlap_bottom_k": -0.00020018639042973518,
          "interaction_matrix_overlap_top_k": -0.5297384858131409,
          "interaction_matrix_overlap_bottom_k": -0.08637470752000809,
          "effective_rank": 0.7586565017700195,
          "effective_rank_mergeability_score": 0.18906241655349731,
          "stable_rank": 0.44810259342193604,
          "spectral_gap": -0.5072253942489624,
          "singular_value_ratio": -0.5484257936477661,
          "layerwise_effective_rank": -0.08491044491529465,
          "layerwise_effective_rank_mergeability_score": 0.18392841517925262,
          "task_vector_cosine_similarity": 0.597354531288147,
          "task_vector_l2_distance": 0.11620897799730301,
          "task_vector_dot_product": 0.33136287331581116,
          "weight_space_angle": 0.505297064781189,
          "task_vector_magnitude_ratio": -0.49573540687561035,
          "singular_value_overlap": 0.13240502774715424,
          "subspace_overlap": 0.07782711833715439,
          "right_subspace_overlap": -0.13993540406227112,
          "activation_l2_distance": 0.2178342044353485,
          "activation_cosine_similarity": 0.6821919083595276,
          "activation_magnitude_ratio": -0.10370177030563354,
          "activation_dot_product": -0.37101271748542786,
          "encoder_gradient_cosine_similarity": -0.10740114748477936,
          "encoder_gradient_l2_distance": -0.04763941094279289,
          "encoder_gradient_dot_product": 0.011838345788419247,
          "input_gradient_cosine_similarity": 0.0916684940457344,
          "input_gradient_l2_distance": 0.12310396879911423,
          "input_gradient_dot_product": -0.38513442873954773
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.007473485997693824,
        "train_r2": -1.0485066380846662,
        "train_pearson_r": 0.5032514071194463,
        "val_mse": 0.013926526509929142,
        "val_r2": -5.835584725934715,
        "val_pearson_r": 0.07838310425146591,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.21065513789653778,
          "right_subspace_overlap_bottom_k": 0.10578227043151855,
          "interaction_matrix_overlap_top_k": -0.07363462448120117,
          "interaction_matrix_overlap_bottom_k": -0.34568771719932556,
          "effective_rank": 0.5516208410263062,
          "effective_rank_mergeability_score": 0.3274126648902893,
          "stable_rank": 0.025105653330683708,
          "spectral_gap": 0.20078538358211517,
          "singular_value_ratio": -0.4745253324508667,
          "layerwise_effective_rank": -0.07915493100881577,
          "layerwise_effective_rank_mergeability_score": 0.005490483250468969,
          "task_vector_cosine_similarity": 0.009929175488650799,
          "task_vector_l2_distance": 0.10443376749753952,
          "task_vector_dot_product": -0.039466097950935364,
          "weight_space_angle": 0.2573816776275635,
          "task_vector_magnitude_ratio": 0.5552709102630615,
          "singular_value_overlap": 0.11088940501213074,
          "subspace_overlap": -0.0041067106649279594,
          "right_subspace_overlap": -0.09693554043769836,
          "activation_l2_distance": -0.031796377152204514,
          "activation_cosine_similarity": 0.2386624813079834,
          "activation_magnitude_ratio": 0.015147306956350803,
          "activation_dot_product": -0.15803754329681396,
          "encoder_gradient_cosine_similarity": 0.050895288586616516,
          "encoder_gradient_l2_distance": -0.275889128446579,
          "encoder_gradient_dot_product": 0.08285889029502869,
          "input_gradient_cosine_similarity": -0.11010342091321945,
          "input_gradient_l2_distance": -0.0227422583848238,
          "input_gradient_dot_product": -0.1399787962436676
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.3328334906865094,
        "train_r2": -93.91560780611995,
        "train_pearson_r": 0.16585201206816122,
        "val_mse": 0.20684336129828923,
        "val_r2": -75.35868620457529,
        "val_pearson_r": -0.10513814321962589,
        "n_iterations": 138,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.14269594848155975,
          "right_subspace_overlap_bottom_k": -1.080151081085205,
          "interaction_matrix_overlap_top_k": -2.568972110748291,
          "interaction_matrix_overlap_bottom_k": 0.3026536703109741,
          "effective_rank": -0.49502941966056824,
          "effective_rank_mergeability_score": -0.1985287219285965,
          "stable_rank": -1.6893633604049683,
          "spectral_gap": -1.1539297103881836,
          "singular_value_ratio": -0.8403965830802917,
          "layerwise_effective_rank": -1.6171220541000366,
          "layerwise_effective_rank_mergeability_score": -2.2002735137939453,
          "task_vector_cosine_similarity": -0.9578976631164551,
          "task_vector_l2_distance": -0.21606415510177612,
          "task_vector_dot_product": 1.7689549922943115,
          "weight_space_angle": 2.1735482215881348,
          "task_vector_magnitude_ratio": 0.9991854429244995,
          "singular_value_overlap": 0.9020894169807434,
          "subspace_overlap": 2.7647171020507812,
          "right_subspace_overlap": 0.4094597399234772,
          "activation_l2_distance": 1.60055673122406,
          "activation_cosine_similarity": 1.449082612991333,
          "activation_magnitude_ratio": 0.7230449318885803,
          "activation_dot_product": 0.04379895702004433,
          "encoder_gradient_cosine_similarity": -0.22591441869735718,
          "encoder_gradient_l2_distance": 0.7112831473350525,
          "encoder_gradient_dot_product": 0.6067808866500854,
          "input_gradient_cosine_similarity": -0.20730343461036682,
          "input_gradient_l2_distance": -0.2838560938835144,
          "input_gradient_dot_product": 0.12880158424377441
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_mse": 0.006742717899384497,
        "train_r2": -0.8303441850195947,
        "train_pearson_r": 0.5851824788689419,
        "val_mse": 0.020620405557306983,
        "val_r2": -8.939417617518941,
        "val_pearson_r": -0.07289612098670172,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.48031488060951233,
          "right_subspace_overlap_bottom_k": 0.1763298362493515,
          "interaction_matrix_overlap_top_k": -0.2503017485141754,
          "interaction_matrix_overlap_bottom_k": -0.376990407705307,
          "effective_rank": 0.19421450793743134,
          "effective_rank_mergeability_score": -0.08778615295886993,
          "stable_rank": -0.25290027260780334,
          "spectral_gap": 0.12533628940582275,
          "singular_value_ratio": -0.31338149309158325,
          "layerwise_effective_rank": 0.5683045983314514,
          "layerwise_effective_rank_mergeability_score": 0.4503321051597595,
          "task_vector_cosine_similarity": 0.21174515783786774,
          "task_vector_l2_distance": 0.11708679050207138,
          "task_vector_dot_product": -0.4173564314842224,
          "weight_space_angle": 0.07653466612100601,
          "task_vector_magnitude_ratio": 0.3895643651485443,
          "singular_value_overlap": 0.14994554221630096,
          "subspace_overlap": -0.1720498502254486,
          "right_subspace_overlap": 0.012127388268709183,
          "activation_l2_distance": 0.14989987015724182,
          "activation_cosine_similarity": 0.29919442534446716,
          "activation_magnitude_ratio": -0.010861700400710106,
          "activation_dot_product": -0.09592429548501968,
          "encoder_gradient_cosine_similarity": 0.03349417820572853,
          "encoder_gradient_l2_distance": -0.23991864919662476,
          "encoder_gradient_dot_product": 0.07495979964733124,
          "input_gradient_cosine_similarity": -0.12580282986164093,
          "input_gradient_l2_distance": -0.0544871911406517,
          "input_gradient_dot_product": -0.11107978224754333
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.5719975078029667,
        "train_r2": -154.79701182296688,
        "train_pearson_r": -0.23529878646670133,
        "val_mse": 0.36539921906748934,
        "val_r2": -176.63597067916072,
        "val_pearson_r": -0.48099142106763915,
        "n_iterations": 177,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.05816817656159401,
          "right_subspace_overlap_bottom_k": -0.07883394509553909,
          "interaction_matrix_overlap_top_k": -1.506447196006775,
          "interaction_matrix_overlap_bottom_k": 0.9402664303779602,
          "effective_rank": 0.8061920404434204,
          "effective_rank_mergeability_score": -0.02875431627035141,
          "stable_rank": -0.6863300800323486,
          "spectral_gap": 0.19855576753616333,
          "singular_value_ratio": -0.3876039981842041,
          "layerwise_effective_rank": 0.9128277897834778,
          "layerwise_effective_rank_mergeability_score": 0.5148007869720459,
          "task_vector_cosine_similarity": -1.162894606590271,
          "task_vector_l2_distance": 0.250436007976532,
          "task_vector_dot_product": -0.1022343635559082,
          "weight_space_angle": 0.1221405491232872,
          "task_vector_magnitude_ratio": -0.08451054245233536,
          "singular_value_overlap": -0.49561798572540283,
          "subspace_overlap": 0.8088626265525818,
          "right_subspace_overlap": 0.8053515553474426,
          "activation_l2_distance": -0.47530239820480347,
          "activation_cosine_similarity": -0.04056641086935997,
          "activation_magnitude_ratio": 0.25332504510879517,
          "activation_dot_product": 0.6001165509223938,
          "encoder_gradient_cosine_similarity": 0.44516605138778687,
          "encoder_gradient_l2_distance": 0.4055488705635071,
          "encoder_gradient_dot_product": -0.40362226963043213,
          "input_gradient_cosine_similarity": -0.187106654047966,
          "input_gradient_l2_distance": 0.5948416590690613,
          "input_gradient_dot_product": -1.0789297819137573
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.01298895338350799,
        "train_r2": -2.707625741768189,
        "train_pearson_r": 0.3720340981674511,
        "val_mse": 0.020796862023134615,
        "val_r2": -10.330021751836616,
        "val_pearson_r": 0.18815642957415898,
        "n_iterations": 247,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.02001882530748844,
          "right_subspace_overlap_bottom_k": 0.09779561311006546,
          "interaction_matrix_overlap_top_k": 0.09926808625459671,
          "interaction_matrix_overlap_bottom_k": -0.28349563479423523,
          "effective_rank": 0.0965496152639389,
          "effective_rank_mergeability_score": 0.17558255791664124,
          "stable_rank": 0.11570290476083755,
          "spectral_gap": 0.40161654353141785,
          "singular_value_ratio": 0.27622902393341064,
          "layerwise_effective_rank": 0.1105215847492218,
          "layerwise_effective_rank_mergeability_score": 0.005544034298509359,
          "task_vector_cosine_similarity": -0.14170101284980774,
          "task_vector_l2_distance": 0.07225042581558228,
          "task_vector_dot_product": 0.02495776116847992,
          "weight_space_angle": 0.2315635085105896,
          "task_vector_magnitude_ratio": 0.018511135131120682,
          "singular_value_overlap": 0.15082556009292603,
          "subspace_overlap": 0.18094094097614288,
          "right_subspace_overlap": -0.20388935506343842,
          "activation_l2_distance": 0.0058669145219028,
          "activation_cosine_similarity": 0.30286362767219543,
          "activation_magnitude_ratio": 0.013756593689322472,
          "activation_dot_product": -0.2099023312330246,
          "encoder_gradient_cosine_similarity": 0.015475327149033546,
          "encoder_gradient_l2_distance": -0.29493847489356995,
          "encoder_gradient_dot_product": 0.03612484410405159,
          "input_gradient_cosine_similarity": -0.24182912707328796,
          "input_gradient_l2_distance": -0.1142917275428772,
          "input_gradient_dot_product": 0.07877948135137558
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.006700902637991639,
        "train_r2": -0.8433961891311994,
        "train_pearson_r": 0.5600184732766369,
        "val_mse": 0.00549585257262164,
        "val_r2": -2.1848189725234914,
        "val_pearson_r": 0.6648739476486109,
        "n_iterations": 793,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.1370251327753067,
          "right_subspace_overlap_bottom_k": -0.08512023091316223,
          "interaction_matrix_overlap_top_k": -0.4961104393005371,
          "interaction_matrix_overlap_bottom_k": -0.13926613330841064,
          "effective_rank": 0.2783452868461609,
          "effective_rank_mergeability_score": 0.05715831741690636,
          "stable_rank": 0.13494719564914703,
          "spectral_gap": 0.08023453503847122,
          "singular_value_ratio": -0.23481889069080353,
          "layerwise_effective_rank": -0.19735436141490936,
          "layerwise_effective_rank_mergeability_score": 0.03576430305838585,
          "task_vector_cosine_similarity": 0.11269351840019226,
          "task_vector_l2_distance": 0.09038805216550827,
          "task_vector_dot_product": 0.0030702752992510796,
          "weight_space_angle": 0.43810346722602844,
          "task_vector_magnitude_ratio": 0.20131266117095947,
          "singular_value_overlap": 0.10546652227640152,
          "subspace_overlap": 0.0360400527715683,
          "right_subspace_overlap": 0.402768611907959,
          "activation_l2_distance": 0.15989205241203308,
          "activation_cosine_similarity": 0.38017934560775757,
          "activation_magnitude_ratio": 0.005942882504314184,
          "activation_dot_product": -0.1299624741077423,
          "encoder_gradient_cosine_similarity": 0.03855045139789581,
          "encoder_gradient_l2_distance": -0.19841378927230835,
          "encoder_gradient_dot_product": 0.07615713030099869,
          "input_gradient_cosine_similarity": -0.13508984446525574,
          "input_gradient_l2_distance": -0.068963423371315,
          "input_gradient_dot_product": -0.08872000873088837
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.0519818325223104,
        "train_r2": -13.880305702545748,
        "train_pearson_r": 0.36591213616044105,
        "val_mse": 0.2045491878979149,
        "val_r2": -130.67426743916945,
        "val_pearson_r": 0.5818967756060602,
        "n_iterations": 67,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.20462258160114288,
          "right_subspace_overlap_bottom_k": 0.0582372322678566,
          "interaction_matrix_overlap_top_k": -0.7609366178512573,
          "interaction_matrix_overlap_bottom_k": -0.3044355511665344,
          "effective_rank": 0.06939910352230072,
          "effective_rank_mergeability_score": 0.2986840605735779,
          "stable_rank": 0.4040059745311737,
          "spectral_gap": 0.2996985912322998,
          "singular_value_ratio": 0.15804752707481384,
          "layerwise_effective_rank": 0.2387971132993698,
          "layerwise_effective_rank_mergeability_score": -0.14517560601234436,
          "task_vector_cosine_similarity": 0.01928425021469593,
          "task_vector_l2_distance": -0.14309221506118774,
          "task_vector_dot_product": 0.21655063331127167,
          "weight_space_angle": -0.3019258975982666,
          "task_vector_magnitude_ratio": -0.32903674244880676,
          "singular_value_overlap": 0.08029758930206299,
          "subspace_overlap": -0.09097325056791306,
          "right_subspace_overlap": 0.19242805242538452,
          "activation_l2_distance": 0.28013360500335693,
          "activation_cosine_similarity": 0.14095249772071838,
          "activation_magnitude_ratio": 0.31641125679016113,
          "activation_dot_product": 0.3116651773452759,
          "encoder_gradient_cosine_similarity": 0.01674887351691723,
          "encoder_gradient_l2_distance": -0.33939746022224426,
          "encoder_gradient_dot_product": 0.29752951860427856,
          "input_gradient_cosine_similarity": -0.01538790576159954,
          "input_gradient_l2_distance": -0.04306715726852417,
          "input_gradient_dot_product": 0.280918687582016
        }
      }
    ],
    "optimization_params": {
      "objective": "MSE",
      "n_iterations": 1000,
      "learning_rate": 0.01,
      "patience": 50,
      "convergence_threshold": 1e-06
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_mse": 203.33887427833918,
      "train_r2": -14826.024764467677,
      "train_pearson_r": 0.014196215290816992,
      "train_pearson_p": 0.42050645684764265,
      "val_mse": 214.887141243676,
      "val_r2": -15668.09903639886,
      "val_pearson_r": -0.06217753611763909,
      "val_pearson_p": 0.2406051480558673
    },
    "per_fold_stats": {
      "train_mse_mean": 202.21669989124206,
      "train_mse_std": 876.0751191951183,
      "val_mse_mean": 226.17567054949623,
      "val_mse_std": 979.146216814534,
      "train_r_mean": 0.07625783065008787,
      "train_r_std": 0.1323439898779083,
      "val_r_mean": 0.08190730434074647,
      "val_r_std": 0.197799498826537
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.19084852933883667,
      "right_subspace_overlap_bottom_k": -0.7688701748847961,
      "interaction_matrix_overlap_top_k": 0.499372661113739,
      "interaction_matrix_overlap_bottom_k": 0.33530324697494507,
      "effective_rank": -1.8433221578598022,
      "effective_rank_mergeability_score": -0.07229985296726227,
      "stable_rank": -0.17211191356182098,
      "spectral_gap": 1.5110061168670654,
      "singular_value_ratio": 1.2150951623916626,
      "layerwise_effective_rank": 1.17367684841156,
      "layerwise_effective_rank_mergeability_score": 2.855938673019409,
      "task_vector_cosine_similarity": -1.145220160484314,
      "task_vector_l2_distance": -0.6551850438117981,
      "task_vector_dot_product": 0.8074405789375305,
      "weight_space_angle": -0.7864280939102173,
      "task_vector_magnitude_ratio": -0.04690765216946602,
      "singular_value_overlap": -0.14943332970142365,
      "subspace_overlap": -1.166695475578308,
      "right_subspace_overlap": -0.571045994758606,
      "activation_l2_distance": -0.7451198697090149,
      "activation_cosine_similarity": 0.14132744073867798,
      "activation_magnitude_ratio": 0.28263646364212036,
      "activation_dot_product": 0.4128771424293518,
      "encoder_gradient_cosine_similarity": -0.21290525794029236,
      "encoder_gradient_l2_distance": 1.264595866203308,
      "encoder_gradient_dot_product": -0.2422790229320526,
      "input_gradient_cosine_similarity": -0.35566583275794983,
      "input_gradient_l2_distance": 0.21039243042469025,
      "input_gradient_dot_product": -0.9745997190475464
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.5706644654273987,
      "right_subspace_overlap_bottom_k": 2.2825136184692383,
      "interaction_matrix_overlap_top_k": 1.5748592615127563,
      "interaction_matrix_overlap_bottom_k": 1.659278154373169,
      "effective_rank": 6.9234089851379395,
      "effective_rank_mergeability_score": 1.0580519437789917,
      "stable_rank": 1.3540372848510742,
      "spectral_gap": 5.309899806976318,
      "singular_value_ratio": 4.043066024780273,
      "layerwise_effective_rank": 3.838733434677124,
      "layerwise_effective_rank_mergeability_score": 10.955427169799805,
      "task_vector_cosine_similarity": 3.846855401992798,
      "task_vector_l2_distance": 2.9753777980804443,
      "task_vector_dot_product": 3.1980838775634766,
      "weight_space_angle": 3.7270522117614746,
      "task_vector_magnitude_ratio": 1.1358726024627686,
      "singular_value_overlap": 2.348289728164673,
      "subspace_overlap": 4.057639122009277,
      "right_subspace_overlap": 3.2014787197113037,
      "activation_l2_distance": 2.1147308349609375,
      "activation_cosine_similarity": 0.765545129776001,
      "activation_magnitude_ratio": 0.4787321388721466,
      "activation_dot_product": 1.704944372177124,
      "encoder_gradient_cosine_similarity": 2.0359046459198,
      "encoder_gradient_l2_distance": 4.928892612457275,
      "encoder_gradient_dot_product": 2.7708916664123535,
      "input_gradient_cosine_similarity": 1.5144866704940796,
      "input_gradient_l2_distance": 3.4977834224700928,
      "input_gradient_dot_product": 3.626002550125122
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.17302778998278573,
        "train_r2": -11.033790720318438,
        "train_pearson_r": 0.0762345294837552,
        "val_mse": 0.21587778517171965,
        "val_r2": -28.414728537106015,
        "val_pearson_r": 0.3729196769656553,
        "n_iterations": 57,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.2939257323741913,
          "right_subspace_overlap_bottom_k": 0.5545640587806702,
          "interaction_matrix_overlap_top_k": 0.6688445210456848,
          "interaction_matrix_overlap_bottom_k": -0.3108638525009155,
          "effective_rank": 0.10320203006267548,
          "effective_rank_mergeability_score": -0.14188231527805328,
          "stable_rank": -0.9131637811660767,
          "spectral_gap": 0.4181327223777771,
          "singular_value_ratio": 1.358400583267212,
          "layerwise_effective_rank": -0.8420835733413696,
          "layerwise_effective_rank_mergeability_score": -0.30885422229766846,
          "task_vector_cosine_similarity": -0.29910025000572205,
          "task_vector_l2_distance": -0.48896774649620056,
          "task_vector_dot_product": 0.4685319662094116,
          "weight_space_angle": 0.3687526285648346,
          "task_vector_magnitude_ratio": 0.07096366584300995,
          "singular_value_overlap": 0.1078319400548935,
          "subspace_overlap": -1.837984323501587,
          "right_subspace_overlap": 0.9204232692718506,
          "activation_l2_distance": -0.01808871515095234,
          "activation_cosine_similarity": -0.043995533138513565,
          "activation_magnitude_ratio": 0.1367330253124237,
          "activation_dot_product": 0.05976630747318268,
          "encoder_gradient_cosine_similarity": 0.3072780668735504,
          "encoder_gradient_l2_distance": -0.38045379519462585,
          "encoder_gradient_dot_product": 0.9230774641036987,
          "input_gradient_cosine_similarity": 0.07720524817705154,
          "input_gradient_l2_distance": -0.3204299211502075,
          "input_gradient_dot_product": 0.6411697268486023
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 16.48768180647519,
        "train_r2": -1147.1145076834505,
        "train_pearson_r": 0.012147786593088997,
        "val_mse": 22.52061417970381,
        "val_r2": -2890.974232796764,
        "val_pearson_r": 0.228192319295458,
        "n_iterations": 91,
        "coefficients": {
          "right_subspace_overlap_top_k": 1.8906164169311523,
          "right_subspace_overlap_bottom_k": -3.4812355041503906,
          "interaction_matrix_overlap_top_k": 4.8431172370910645,
          "interaction_matrix_overlap_bottom_k": 0.33135494589805603,
          "effective_rank": -4.470944404602051,
          "effective_rank_mergeability_score": -2.4655048847198486,
          "stable_rank": 2.8188796043395996,
          "spectral_gap": 1.7053773403167725,
          "singular_value_ratio": 6.271564483642578,
          "layerwise_effective_rank": 2.7966551780700684,
          "layerwise_effective_rank_mergeability_score": 2.102994441986084,
          "task_vector_cosine_similarity": -1.3490220308303833,
          "task_vector_l2_distance": 0.33005666732788086,
          "task_vector_dot_product": -1.6851727962493896,
          "weight_space_angle": -2.2087483406066895,
          "task_vector_magnitude_ratio": -4.205746173858643,
          "singular_value_overlap": 2.849130630493164,
          "subspace_overlap": -1.2633581161499023,
          "right_subspace_overlap": 1.3914917707443237,
          "activation_l2_distance": -5.836390495300293,
          "activation_cosine_similarity": -1.0099098682403564,
          "activation_magnitude_ratio": 1.1258758306503296,
          "activation_dot_product": 0.41804009675979614,
          "encoder_gradient_cosine_similarity": 1.6536598205566406,
          "encoder_gradient_l2_distance": 8.954771041870117,
          "encoder_gradient_dot_product": 3.2400524616241455,
          "input_gradient_cosine_similarity": -3.7272541522979736,
          "input_gradient_l2_distance": -3.2628724575042725,
          "input_gradient_dot_product": -6.785585403442383
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.9011013882321851,
        "train_r2": -62.0671097409711,
        "train_pearson_r": 0.017415952129969464,
        "val_mse": 0.39788553156669554,
        "val_r2": -51.64392067079144,
        "val_pearson_r": 0.23080680462585268,
        "n_iterations": 85,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.5240185260772705,
          "right_subspace_overlap_bottom_k": -0.08513104170560837,
          "interaction_matrix_overlap_top_k": -1.3955399990081787,
          "interaction_matrix_overlap_bottom_k": -0.7694824934005737,
          "effective_rank": -1.0496501922607422,
          "effective_rank_mergeability_score": -0.41877973079681396,
          "stable_rank": -0.7304440140724182,
          "spectral_gap": -0.9774077534675598,
          "singular_value_ratio": 0.3529066741466522,
          "layerwise_effective_rank": 0.6195008754730225,
          "layerwise_effective_rank_mergeability_score": 1.5947614908218384,
          "task_vector_cosine_similarity": -2.1547181606292725,
          "task_vector_l2_distance": 0.681984007358551,
          "task_vector_dot_product": 0.07943529635667801,
          "weight_space_angle": -0.5609956383705139,
          "task_vector_magnitude_ratio": 0.7067607641220093,
          "singular_value_overlap": 0.5171496272087097,
          "subspace_overlap": 1.8623924255371094,
          "right_subspace_overlap": 1.3910428285598755,
          "activation_l2_distance": 0.6226107478141785,
          "activation_cosine_similarity": 1.4306029081344604,
          "activation_magnitude_ratio": 1.413681983947754,
          "activation_dot_product": -0.20380599796772003,
          "encoder_gradient_cosine_similarity": -0.2554261088371277,
          "encoder_gradient_l2_distance": -0.18495692312717438,
          "encoder_gradient_dot_product": -1.3168702125549316,
          "input_gradient_cosine_similarity": 0.2894432246685028,
          "input_gradient_l2_distance": -0.9730249047279358,
          "input_gradient_dot_product": 1.0243483781814575
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.07776640646730022,
        "train_r2": -4.524027173140446,
        "train_pearson_r": 0.021666049261349934,
        "val_mse": 0.035272618443588755,
        "val_r2": -3.698216331791283,
        "val_pearson_r": -0.20493223660706147,
        "n_iterations": 93,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.04052373766899109,
          "right_subspace_overlap_bottom_k": 0.044705867767333984,
          "interaction_matrix_overlap_top_k": -0.791556715965271,
          "interaction_matrix_overlap_bottom_k": 0.1394132822751999,
          "effective_rank": -0.15931841731071472,
          "effective_rank_mergeability_score": 0.24318835139274597,
          "stable_rank": 0.4027305543422699,
          "spectral_gap": -0.4312356412410736,
          "singular_value_ratio": 0.16221918165683746,
          "layerwise_effective_rank": -0.0882672369480133,
          "layerwise_effective_rank_mergeability_score": -0.14505328238010406,
          "task_vector_cosine_similarity": 0.01231206301599741,
          "task_vector_l2_distance": -0.1264183521270752,
          "task_vector_dot_product": 0.267981618642807,
          "weight_space_angle": 0.38865476846694946,
          "task_vector_magnitude_ratio": -0.7352321743965149,
          "singular_value_overlap": 0.24837738275527954,
          "subspace_overlap": -0.14864054322242737,
          "right_subspace_overlap": 0.23653343319892883,
          "activation_l2_distance": 0.1681593656539917,
          "activation_cosine_similarity": 0.12256532907485962,
          "activation_magnitude_ratio": 0.18066371977329254,
          "activation_dot_product": 0.17003029584884644,
          "encoder_gradient_cosine_similarity": 0.25297102332115173,
          "encoder_gradient_l2_distance": 0.25820547342300415,
          "encoder_gradient_dot_product": 0.29318609833717346,
          "input_gradient_cosine_similarity": 0.34268683195114136,
          "input_gradient_l2_distance": -0.5038148760795593,
          "input_gradient_dot_product": 0.22924640774726868
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.022007930506065386,
        "train_r2": -0.5347321888455399,
        "train_pearson_r": 0.16212267041583137,
        "val_mse": 0.02101953949657413,
        "val_r2": -1.708401933624193,
        "val_pearson_r": 0.07580421530086985,
        "n_iterations": 273,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.2010032832622528,
          "right_subspace_overlap_bottom_k": 0.21644149720668793,
          "interaction_matrix_overlap_top_k": -0.20289652049541473,
          "interaction_matrix_overlap_bottom_k": -0.16857990622520447,
          "effective_rank": 0.25186455249786377,
          "effective_rank_mergeability_score": -0.769839346408844,
          "stable_rank": -0.387478768825531,
          "spectral_gap": 0.7485547661781311,
          "singular_value_ratio": -0.5752421021461487,
          "layerwise_effective_rank": 0.051385197788476944,
          "layerwise_effective_rank_mergeability_score": 0.6748127341270447,
          "task_vector_cosine_similarity": -0.7937504053115845,
          "task_vector_l2_distance": -0.15732939541339874,
          "task_vector_dot_product": 0.5753923654556274,
          "weight_space_angle": 0.44830232858657837,
          "task_vector_magnitude_ratio": 1.2598754167556763,
          "singular_value_overlap": 0.06649716198444366,
          "subspace_overlap": 0.13846705853939056,
          "right_subspace_overlap": -0.0748104527592659,
          "activation_l2_distance": -0.216685950756073,
          "activation_cosine_similarity": -0.10149048268795013,
          "activation_magnitude_ratio": -0.02198087051510811,
          "activation_dot_product": 0.018865231424570084,
          "encoder_gradient_cosine_similarity": 0.03154822438955307,
          "encoder_gradient_l2_distance": 0.019539568573236465,
          "encoder_gradient_dot_product": 0.13049036264419556,
          "input_gradient_cosine_similarity": -0.0896737277507782,
          "input_gradient_l2_distance": -0.17866277694702148,
          "input_gradient_dot_product": -0.09715614467859268
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 0.07566599856537536,
        "train_r2": -4.129556784182318,
        "train_pearson_r": -0.08582047151559989,
        "val_mse": 0.08372529546886703,
        "val_r2": -25.688724585069064,
        "val_pearson_r": -0.4233888720585314,
        "n_iterations": 129,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.2709823250770569,
          "right_subspace_overlap_bottom_k": -0.11834828555583954,
          "interaction_matrix_overlap_top_k": 0.3342590034008026,
          "interaction_matrix_overlap_bottom_k": -0.20566080510616302,
          "effective_rank": -0.4248369336128235,
          "effective_rank_mergeability_score": -0.5747389197349548,
          "stable_rank": 0.4327804744243622,
          "spectral_gap": 0.6802686452865601,
          "singular_value_ratio": -0.151575967669487,
          "layerwise_effective_rank": 0.21569392085075378,
          "layerwise_effective_rank_mergeability_score": 0.15005946159362793,
          "task_vector_cosine_similarity": -0.029348358511924744,
          "task_vector_l2_distance": 0.28623276948928833,
          "task_vector_dot_product": 0.047459255903959274,
          "weight_space_angle": 0.027144838124513626,
          "task_vector_magnitude_ratio": 0.2623170018196106,
          "singular_value_overlap": 0.18974068760871887,
          "subspace_overlap": 0.02200273983180523,
          "right_subspace_overlap": -0.1700102984905243,
          "activation_l2_distance": -0.30003538727760315,
          "activation_cosine_similarity": 0.009352131746709347,
          "activation_magnitude_ratio": 0.14064809679985046,
          "activation_dot_product": -0.32661381363868713,
          "encoder_gradient_cosine_similarity": 0.4007464647293091,
          "encoder_gradient_l2_distance": 0.5473209619522095,
          "encoder_gradient_dot_product": 0.5584323406219482,
          "input_gradient_cosine_similarity": -0.29397088289260864,
          "input_gradient_l2_distance": -0.3661019504070282,
          "input_gradient_dot_product": -0.07928495109081268
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_mse": 0.05732439203951912,
        "train_r2": -3.242368949649726,
        "train_pearson_r": -0.08071871614525698,
        "val_mse": 0.04803586844570328,
        "val_r2": -4.500231258181488,
        "val_pearson_r": -0.10452900722106641,
        "n_iterations": 53,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.36678817868232727,
          "right_subspace_overlap_bottom_k": -0.10240638256072998,
          "interaction_matrix_overlap_top_k": -0.005736851133406162,
          "interaction_matrix_overlap_bottom_k": -0.253375381231308,
          "effective_rank": 0.09633847326040268,
          "effective_rank_mergeability_score": -0.3706459701061249,
          "stable_rank": -0.04588766396045685,
          "spectral_gap": 0.16882406175136566,
          "singular_value_ratio": -0.07623786479234695,
          "layerwise_effective_rank": 0.19505266845226288,
          "layerwise_effective_rank_mergeability_score": 0.3162865936756134,
          "task_vector_cosine_similarity": -0.2525257170200348,
          "task_vector_l2_distance": 0.1552565097808838,
          "task_vector_dot_product": 0.21713915467262268,
          "weight_space_angle": 0.3243441879749298,
          "task_vector_magnitude_ratio": -0.0702962651848793,
          "singular_value_overlap": 0.17593492567539215,
          "subspace_overlap": 0.10246460139751434,
          "right_subspace_overlap": -0.1321127563714981,
          "activation_l2_distance": 0.11989389359951019,
          "activation_cosine_similarity": 0.3046671450138092,
          "activation_magnitude_ratio": -0.0806131586432457,
          "activation_dot_product": 0.08444967120885849,
          "encoder_gradient_cosine_similarity": 0.16440218687057495,
          "encoder_gradient_l2_distance": -0.3414521813392639,
          "encoder_gradient_dot_product": -0.10264937579631805,
          "input_gradient_cosine_similarity": 0.14797484874725342,
          "input_gradient_l2_distance": -0.04715326055884361,
          "input_gradient_dot_product": -0.05475600063800812
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.6171973214986177,
        "train_r2": -45.222475993450466,
        "train_pearson_r": 0.24063188054785734,
        "val_mse": 2.475624301000171,
        "val_r2": -355.18543286337444,
        "val_pearson_r": 0.043371043863279765,
        "n_iterations": 68,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.8156259655952454,
          "right_subspace_overlap_bottom_k": 0.5783103704452515,
          "interaction_matrix_overlap_top_k": -0.04246046766638756,
          "interaction_matrix_overlap_bottom_k": 0.940304160118103,
          "effective_rank": -0.1158786341547966,
          "effective_rank_mergeability_score": 1.0872894525527954,
          "stable_rank": 0.4768866300582886,
          "spectral_gap": -0.3715202808380127,
          "singular_value_ratio": 0.9001718163490295,
          "layerwise_effective_rank": 0.578191339969635,
          "layerwise_effective_rank_mergeability_score": 1.3070114850997925,
          "task_vector_cosine_similarity": 1.5991392135620117,
          "task_vector_l2_distance": -0.25386688113212585,
          "task_vector_dot_product": -1.3137412071228027,
          "weight_space_angle": -0.9332020282745361,
          "task_vector_magnitude_ratio": -0.11599310487508774,
          "singular_value_overlap": -0.4723815619945526,
          "subspace_overlap": -1.681596279144287,
          "right_subspace_overlap": -1.2277145385742188,
          "activation_l2_distance": -0.9375064373016357,
          "activation_cosine_similarity": -0.279215931892395,
          "activation_magnitude_ratio": 0.5944496393203735,
          "activation_dot_product": 0.24791671335697174,
          "encoder_gradient_cosine_similarity": 0.9315415024757385,
          "encoder_gradient_l2_distance": -0.920303225517273,
          "encoder_gradient_dot_product": 0.3550508916378021,
          "input_gradient_cosine_similarity": 0.8104203939437866,
          "input_gradient_l2_distance": -1.8797580003738403,
          "input_gradient_dot_product": 0.3015323579311371
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_mse": 0.01871625914204895,
        "train_r2": -0.3093434369614263,
        "train_pearson_r": 0.27920157957387554,
        "val_mse": 0.021285715760628154,
        "val_r2": -1.7483725510232042,
        "val_pearson_r": 0.27548929689401797,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.06643776595592499,
          "right_subspace_overlap_bottom_k": 0.2323455512523651,
          "interaction_matrix_overlap_top_k": -0.3255864381790161,
          "interaction_matrix_overlap_bottom_k": -0.19660262763500214,
          "effective_rank": 0.6165199279785156,
          "effective_rank_mergeability_score": 0.33310002088546753,
          "stable_rank": 0.19410596787929535,
          "spectral_gap": 0.3054255247116089,
          "singular_value_ratio": -0.0037266691215336323,
          "layerwise_effective_rank": -0.006032327655702829,
          "layerwise_effective_rank_mergeability_score": 0.2340167909860611,
          "task_vector_cosine_similarity": 0.046656910330057144,
          "task_vector_l2_distance": -0.09690306335687637,
          "task_vector_dot_product": 0.3327848017215729,
          "weight_space_angle": 0.49361905455589294,
          "task_vector_magnitude_ratio": 0.022687070071697235,
          "singular_value_overlap": -0.024208806455135345,
          "subspace_overlap": -0.43659162521362305,
          "right_subspace_overlap": 0.4737972915172577,
          "activation_l2_distance": -0.4657137393951416,
          "activation_cosine_similarity": -0.3170008659362793,
          "activation_magnitude_ratio": -0.040928684175014496,
          "activation_dot_product": -0.005997750908136368,
          "encoder_gradient_cosine_similarity": 0.01143110916018486,
          "encoder_gradient_l2_distance": -0.2550084888935089,
          "encoder_gradient_dot_product": 0.2089548408985138,
          "input_gradient_cosine_similarity": -0.13859950006008148,
          "input_gradient_l2_distance": -0.11091472953557968,
          "input_gradient_dot_product": -0.1476345658302307
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.03339524795251623,
        "train_r2": -1.311752446286341,
        "train_pearson_r": -0.07598841825832406,
        "val_mse": 0.15092354830886365,
        "val_r2": -18.99337022550123,
        "val_pearson_r": 0.2423800288798209,
        "n_iterations": 69,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.16700363159179688,
          "right_subspace_overlap_bottom_k": -0.06543021649122238,
          "interaction_matrix_overlap_top_k": -0.05275604873895645,
          "interaction_matrix_overlap_bottom_k": -0.1438804566860199,
          "effective_rank": 0.18223436176776886,
          "effective_rank_mergeability_score": 0.29056480526924133,
          "stable_rank": 0.1692027747631073,
          "spectral_gap": -0.11875621974468231,
          "singular_value_ratio": -0.08984585106372833,
          "layerwise_effective_rank": 0.26404112577438354,
          "layerwise_effective_rank_mergeability_score": 0.04640854522585869,
          "task_vector_cosine_similarity": -0.011000963859260082,
          "task_vector_l2_distance": 0.08656211197376251,
          "task_vector_dot_product": -0.26480233669281006,
          "weight_space_angle": 0.19965898990631104,
          "task_vector_magnitude_ratio": -0.25994378328323364,
          "singular_value_overlap": 0.12307320535182953,
          "subspace_overlap": 0.018332209438085556,
          "right_subspace_overlap": 0.1864997297525406,
          "activation_l2_distance": -0.053501371294260025,
          "activation_cosine_similarity": 0.1524784415960312,
          "activation_magnitude_ratio": -0.04367846995592117,
          "activation_dot_product": 0.060151007026433945,
          "encoder_gradient_cosine_similarity": 0.19461920857429504,
          "encoder_gradient_l2_distance": -0.04324115440249443,
          "encoder_gradient_dot_product": 0.27408209443092346,
          "input_gradient_cosine_similarity": -0.1395675092935562,
          "input_gradient_l2_distance": 0.12733229994773865,
          "input_gradient_dot_product": -0.2544173300266266
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.020655769875513135,
        "train_r2": -0.5138173383543616,
        "train_pearson_r": 0.21881326775680715,
        "val_mse": 0.023187115194873664,
        "val_r2": -2.5942219953725574,
        "val_pearson_r": 0.23623717034598618,
        "n_iterations": 684,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.33562472462654114,
          "right_subspace_overlap_bottom_k": -0.003911852370947599,
          "interaction_matrix_overlap_top_k": 0.21029222011566162,
          "interaction_matrix_overlap_bottom_k": -0.028179533779621124,
          "effective_rank": 0.19199302792549133,
          "effective_rank_mergeability_score": 0.09540669620037079,
          "stable_rank": 0.7631844878196716,
          "spectral_gap": 0.30247727036476135,
          "singular_value_ratio": 0.37575870752334595,
          "layerwise_effective_rank": -0.17946085333824158,
          "layerwise_effective_rank_mergeability_score": 0.48552635312080383,
          "task_vector_cosine_similarity": -0.5758309960365295,
          "task_vector_l2_distance": -0.051148414611816406,
          "task_vector_dot_product": 0.35741519927978516,
          "weight_space_angle": 0.24600638449192047,
          "task_vector_magnitude_ratio": -0.4099389314651489,
          "singular_value_overlap": -0.0181930810213089,
          "subspace_overlap": 0.21531282365322113,
          "right_subspace_overlap": -0.5059317350387573,
          "activation_l2_distance": -0.10997681319713593,
          "activation_cosine_similarity": 0.20472963154315948,
          "activation_magnitude_ratio": -0.02669086493551731,
          "activation_dot_product": -0.2553488314151764,
          "encoder_gradient_cosine_similarity": 0.020084606483578682,
          "encoder_gradient_l2_distance": -0.32940179109573364,
          "encoder_gradient_dot_product": 0.12995518743991852,
          "input_gradient_cosine_similarity": -0.16170059144496918,
          "input_gradient_l2_distance": -0.07728023827075958,
          "input_gradient_dot_product": -0.19977699220180511
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.03121371046677691,
        "train_r2": -1.2228208790714565,
        "train_pearson_r": -0.05760864064165855,
        "val_mse": 0.04158052221190128,
        "val_r2": -4.1535188654614315,
        "val_pearson_r": 0.173490732025642,
        "n_iterations": 88,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.15460322797298431,
          "right_subspace_overlap_bottom_k": 0.007142743095755577,
          "interaction_matrix_overlap_top_k": 0.039927657693624496,
          "interaction_matrix_overlap_bottom_k": -0.2313234508037567,
          "effective_rank": 0.12071073055267334,
          "effective_rank_mergeability_score": -0.04400436207652092,
          "stable_rank": 0.09495391696691513,
          "spectral_gap": 0.028473805636167526,
          "singular_value_ratio": -0.10256113111972809,
          "layerwise_effective_rank": 0.1394275575876236,
          "layerwise_effective_rank_mergeability_score": 0.07845255732536316,
          "task_vector_cosine_similarity": -0.20609503984451294,
          "task_vector_l2_distance": 0.17534027993679047,
          "task_vector_dot_product": 0.03782368078827858,
          "weight_space_angle": 0.20041611790657043,
          "task_vector_magnitude_ratio": -0.14791828393936157,
          "singular_value_overlap": 0.19844083487987518,
          "subspace_overlap": 0.06150832027196884,
          "right_subspace_overlap": -0.11138883978128433,
          "activation_l2_distance": 0.10734984278678894,
          "activation_cosine_similarity": 0.3112514615058899,
          "activation_magnitude_ratio": 0.08714526891708374,
          "activation_dot_product": -0.1637451946735382,
          "encoder_gradient_cosine_similarity": -0.03355364501476288,
          "encoder_gradient_l2_distance": -0.09475056082010269,
          "encoder_gradient_dot_product": 0.2748792767524719,
          "input_gradient_cosine_similarity": 0.030419638380408287,
          "input_gradient_l2_distance": -0.07338276505470276,
          "input_gradient_dot_product": 0.05625540018081665
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.0174633709367742,
        "train_r2": -0.2729599287217308,
        "train_pearson_r": 0.2646041667033699,
        "val_mse": 0.010513649706170265,
        "val_r2": -0.29687930598217815,
        "val_pearson_r": 0.0659451947085101,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.1346723884344101,
          "right_subspace_overlap_bottom_k": 0.1090913787484169,
          "interaction_matrix_overlap_top_k": -0.252265065908432,
          "interaction_matrix_overlap_bottom_k": -0.020532628521323204,
          "effective_rank": 0.07171681523323059,
          "effective_rank_mergeability_score": -0.09120988845825195,
          "stable_rank": 0.11651550233364105,
          "spectral_gap": 0.42119115591049194,
          "singular_value_ratio": -0.26584163308143616,
          "layerwise_effective_rank": 0.09656523168087006,
          "layerwise_effective_rank_mergeability_score": 0.19862698018550873,
          "task_vector_cosine_similarity": -0.028705598786473274,
          "task_vector_l2_distance": 0.005623443517833948,
          "task_vector_dot_product": -0.26417437195777893,
          "weight_space_angle": 0.028597472235560417,
          "task_vector_magnitude_ratio": 0.5168934464454651,
          "singular_value_overlap": -0.023368775844573975,
          "subspace_overlap": -0.02177434228360653,
          "right_subspace_overlap": 0.11406834423542023,
          "activation_l2_distance": 0.33872368931770325,
          "activation_cosine_similarity": 0.4838255047798157,
          "activation_magnitude_ratio": 0.004292149096727371,
          "activation_dot_product": -0.1812146157026291,
          "encoder_gradient_cosine_similarity": 0.022702300921082497,
          "encoder_gradient_l2_distance": -0.21376827359199524,
          "encoder_gradient_dot_product": 0.0880030021071434,
          "input_gradient_cosine_similarity": -0.12476466596126556,
          "input_gradient_l2_distance": -0.13633781671524048,
          "input_gradient_dot_product": -0.12677478790283203
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 4.5222265512025555,
        "train_r2": -313.4317335818656,
        "train_pearson_r": 0.03420793839144419,
        "val_mse": 2.7497627040858363,
        "val_r2": -384.64493594542563,
        "val_pearson_r": 0.068903676741998,
        "n_iterations": 71,
        "coefficients": {
          "right_subspace_overlap_top_k": 1.1167153120040894,
          "right_subspace_overlap_bottom_k": -3.4645447731018066,
          "interaction_matrix_overlap_top_k": 0.6166225671768188,
          "interaction_matrix_overlap_bottom_k": -0.03298034891486168,
          "effective_rank": -1.92387056350708,
          "effective_rank_mergeability_score": -0.9445991516113281,
          "stable_rank": -1.258697748184204,
          "spectral_gap": 1.8363059759140015,
          "singular_value_ratio": -1.3876265287399292,
          "layerwise_effective_rank": 1.3420864343643188,
          "layerwise_effective_rank_mergeability_score": -1.7565510272979736,
          "task_vector_cosine_similarity": -0.37087419629096985,
          "task_vector_l2_distance": -0.40089482069015503,
          "task_vector_dot_product": 2.0431625843048096,
          "weight_space_angle": 0.31637799739837646,
          "task_vector_magnitude_ratio": 2.116156816482544,
          "singular_value_overlap": 1.8940269947052002,
          "subspace_overlap": -1.2902984619140625,
          "right_subspace_overlap": 1.3568426370620728,
          "activation_l2_distance": 0.30084148049354553,
          "activation_cosine_similarity": -1.1440469026565552,
          "activation_magnitude_ratio": 1.2083725929260254,
          "activation_dot_product": 0.15406541526317596,
          "encoder_gradient_cosine_similarity": 0.8183530569076538,
          "encoder_gradient_l2_distance": -1.527817726135254,
          "encoder_gradient_dot_product": 0.7079795598983765,
          "input_gradient_cosine_similarity": 2.059434175491333,
          "input_gradient_l2_distance": -2.5712339878082275,
          "input_gradient_dot_product": 1.1805471181869507
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.018720093649809897,
        "train_r2": -0.3752118280005887,
        "train_pearson_r": 0.2323750168169028,
        "val_mse": 0.011611218029369843,
        "val_r2": -0.5187591532421765,
        "val_pearson_r": 0.30364056797049815,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.5654332041740417,
          "right_subspace_overlap_bottom_k": -0.1163962334394455,
          "interaction_matrix_overlap_top_k": -0.14730985462665558,
          "interaction_matrix_overlap_bottom_k": 0.1384912133216858,
          "effective_rank": 0.22015798091888428,
          "effective_rank_mergeability_score": 0.08371734619140625,
          "stable_rank": 0.21987231075763702,
          "spectral_gap": 0.30916550755500793,
          "singular_value_ratio": -0.10473345965147018,
          "layerwise_effective_rank": 0.16965800523757935,
          "layerwise_effective_rank_mergeability_score": 0.31887540221214294,
          "task_vector_cosine_similarity": 0.13927657902240753,
          "task_vector_l2_distance": 0.06328056752681732,
          "task_vector_dot_product": -0.2795405685901642,
          "weight_space_angle": 0.17517401278018951,
          "task_vector_magnitude_ratio": 0.21433496475219727,
          "singular_value_overlap": -0.01681407541036606,
          "subspace_overlap": -0.1382717788219452,
          "right_subspace_overlap": -0.2927826941013336,
          "activation_l2_distance": -0.004481689538806677,
          "activation_cosine_similarity": 0.19722002744674683,
          "activation_magnitude_ratio": -0.008791325613856316,
          "activation_dot_product": -0.16482175886631012,
          "encoder_gradient_cosine_similarity": 0.022260844707489014,
          "encoder_gradient_l2_distance": -0.24199692904949188,
          "encoder_gradient_dot_product": 0.08983836323022842,
          "input_gradient_cosine_similarity": -0.1563229113817215,
          "input_gradient_l2_distance": -0.1390535980463028,
          "input_gradient_dot_product": -0.11516446620225906
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_mse": 4020.9066875446288,
        "train_r2": -289016.23395019106,
        "train_pearson_r": 0.019461331355954372,
        "val_mse": 4494.122129493438,
        "val_r2": -615857.117881244,
        "val_pearson_r": 0.17487932024029185,
        "n_iterations": 51,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.6118670701980591,
          "right_subspace_overlap_bottom_k": -9.542757987976074,
          "interaction_matrix_overlap_top_k": 5.160565376281738,
          "interaction_matrix_overlap_bottom_k": 7.43651819229126,
          "effective_rank": -31.63255500793457,
          "effective_rank_mergeability_score": 3.453791856765747,
          "stable_rank": -4.904798984527588,
          "spectral_gap": 24.491239547729492,
          "singular_value_ratio": 17.654401779174805,
          "layerwise_effective_rank": 17.627653121948242,
          "layerwise_effective_rank_mergeability_score": 50.496578216552734,
          "task_vector_cosine_similarity": -17.643896102905273,
          "task_vector_l2_distance": -13.577522277832031,
          "task_vector_dot_product": 14.393957138061523,
          "weight_space_angle": -16.7708740234375,
          "task_vector_magnitude_ratio": -0.06452257186174393,
          "singular_value_overlap": -9.896339416503906,
          "subspace_overlap": -18.524438858032227,
          "right_subspace_overlap": -14.225059509277344,
          "activation_l2_distance": -7.954945087432861,
          "activation_cosine_similarity": 2.434908628463745,
          "activation_magnitude_ratio": 0.9264131188392639,
          "activation_dot_product": 7.800567150115967,
          "encoder_gradient_cosine_similarity": -8.885515213012695,
          "encoder_gradient_l2_distance": 20.814794540405273,
          "encoder_gradient_dot_product": -11.83228874206543,
          "input_gradient_cosine_similarity": -5.360095977783203,
          "input_gradient_l2_distance": 14.93886947631836,
          "input_gradient_dot_product": -15.241864204406738
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_mse": 0.02471407815340622,
        "train_r2": -0.7336050287777043,
        "train_pearson_r": 0.21636691737231423,
        "val_mse": 0.014389097418093027,
        "val_r2": -0.8524382261943566,
        "val_pearson_r": 0.18292652362773013,
        "n_iterations": 1000,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.30641865730285645,
          "right_subspace_overlap_bottom_k": -0.10111521929502487,
          "interaction_matrix_overlap_top_k": 0.1300947666168213,
          "interaction_matrix_overlap_bottom_k": 0.0635281354188919,
          "effective_rank": 0.42717236280441284,
          "effective_rank_mergeability_score": -0.19988735020160675,
          "stable_rank": 0.22691205143928528,
          "spectral_gap": 0.4725838899612427,
          "singular_value_ratio": 0.12132862955331802,
          "layerwise_effective_rank": -0.1615477055311203,
          "layerwise_effective_rank_mergeability_score": 0.5550568103790283,
          "task_vector_cosine_similarity": 0.0552908331155777,
          "task_vector_l2_distance": -0.09239697456359863,
          "task_vector_dot_product": 0.6199172735214233,
          "weight_space_angle": 1.290113925933838,
          "task_vector_magnitude_ratio": 0.1004074364900589,
          "singular_value_overlap": -0.004865450784564018,
          "subspace_overlap": -0.0654321163892746,
          "right_subspace_overlap": -0.2641024887561798,
          "activation_l2_distance": -1.0971685647964478,
          "activation_cosine_similarity": -0.8715413212776184,
          "activation_magnitude_ratio": -0.06257279962301254,
          "activation_dot_product": 0.08808605372905731,
          "encoder_gradient_cosine_similarity": 0.04496210813522339,
          "encoder_gradient_l2_distance": -0.29237955808639526,
          "encoder_gradient_dot_product": 0.13424378633499146,
          "input_gradient_cosine_similarity": -0.1885412037372589,
          "input_gradient_l2_distance": -0.0642007514834404,
          "input_gradient_dot_product": -0.1695239096879959
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.13295347021656248,
        "train_r2": -8.578980533957623,
        "train_pearson_r": 0.08248939939052713,
        "val_mse": 0.2496618714417287,
        "val_r2": -26.101062436098022,
        "val_pearson_r": -0.027126628676181076,
        "n_iterations": 62,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007649797480553389,
          "right_subspace_overlap_bottom_k": -0.015060123056173325,
          "interaction_matrix_overlap_top_k": 0.6745287775993347,
          "interaction_matrix_overlap_bottom_k": 0.056865494698286057,
          "effective_rank": 0.4438819885253906,
          "effective_rank_mergeability_score": -0.012405982241034508,
          "stable_rank": -0.45166805386543274,
          "spectral_gap": 0.2886503338813782,
          "singular_value_ratio": -0.18400925397872925,
          "layerwise_effective_rank": 0.4166649281978607,
          "layerwise_effective_rank_mergeability_score": -0.14303714036941528,
          "task_vector_cosine_similarity": -0.5649294853210449,
          "task_vector_l2_distance": 0.110977403819561,
          "task_vector_dot_product": 0.36880454421043396,
          "weight_space_angle": -0.06492877751588821,
          "task_vector_magnitude_ratio": -0.16148369014263153,
          "singular_value_overlap": 0.35136082768440247,
          "subspace_overlap": 0.07513581961393356,
          "right_subspace_overlap": -0.4374106824398041,
          "activation_l2_distance": 0.17816323041915894,
          "activation_cosine_similarity": 0.442600280046463,
          "activation_magnitude_ratio": 0.041053272783756256,
          "activation_dot_product": 0.21676774322986603,
          "encoder_gradient_cosine_similarity": 0.13722525537014008,
          "encoder_gradient_l2_distance": 0.1315709948539734,
          "encoder_gradient_dot_product": 0.248941108584404,
          "input_gradient_cosine_similarity": -0.6000494956970215,
          "input_gradient_l2_distance": -0.20111620426177979,
          "input_gradient_dot_product": -0.3628319799900055
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.08521092452206942,
        "train_r2": -14.567760458289616,
        "train_pearson_r": 0.12596295622833129,
        "val_mse": 0.25694975656363656,
        "val_r2": -98.53307584079761,
        "val_pearson_r": -0.07720969050116017,
        "n_iterations": 59,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.34099695086479187,
          "right_subspace_overlap_bottom_k": 0.08095736056566238,
          "interaction_matrix_overlap_top_k": 0.04169771447777748,
          "interaction_matrix_overlap_bottom_k": 0.10584711283445358,
          "effective_rank": 0.08844999969005585,
          "effective_rank_mergeability_score": -0.9095003604888916,
          "stable_rank": 0.10266386717557907,
          "spectral_gap": 0.26748964190483093,
          "singular_value_ratio": -0.15510404109954834,
          "layerwise_effective_rank": 0.09228667616844177,
          "layerwise_effective_rank_mergeability_score": 0.3784360885620117,
          "task_vector_cosine_similarity": 0.0011536860838532448,
          "task_vector_l2_distance": 0.08357290178537369,
          "task_vector_dot_product": 0.09140007197856903,
          "weight_space_angle": 0.28769850730895996,
          "task_vector_magnitude_ratio": -0.437042236328125,
          "singular_value_overlap": 0.38371920585632324,
          "subspace_overlap": -0.1383332908153534,
          "right_subspace_overlap": 0.1934049427509308,
          "activation_l2_distance": 0.26540184020996094,
          "activation_cosine_similarity": 0.2857900857925415,
          "activation_magnitude_ratio": -0.22965911030769348,
          "activation_dot_product": 0.19003993272781372,
          "encoder_gradient_cosine_similarity": -0.27438148856163025,
          "encoder_gradient_l2_distance": -0.3008715510368347,
          "encoder_gradient_dot_product": 0.41537711024284363,
          "input_gradient_cosine_similarity": 0.2150467336177826,
          "input_gradient_l2_distance": -0.07454285770654678,
          "input_gradient_dot_product": 0.28864869475364685
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_mse": 0.11026777032683543,
        "train_r2": -6.900536548808766,
        "train_pearson_r": -0.17840858245878205,
        "val_mse": 0.06336117846971595,
        "val_r2": -6.650416829560535,
        "val_pearson_r": -0.19965404960668123,
        "n_iterations": 95,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.22930796444416046,
          "right_subspace_overlap_bottom_k": -0.10462449491024017,
          "interaction_matrix_overlap_top_k": 0.4836118817329407,
          "interaction_matrix_overlap_bottom_k": -0.1447957158088684,
          "effective_rank": 0.0963669940829277,
          "effective_rank_mergeability_score": -0.09005729854106903,
          "stable_rank": -0.7687874436378479,
          "spectral_gap": -0.3251200318336487,
          "singular_value_ratio": 0.20165495574474335,
          "layerwise_effective_rank": 0.1460687667131424,
          "layerwise_effective_rank_mergeability_score": 0.5343624949455261,
          "task_vector_cosine_similarity": -0.4784340560436249,
          "task_vector_l2_distance": 0.16285981237888336,
          "task_vector_dot_product": 0.055038921535015106,
          "weight_space_angle": 0.015324750915169716,
          "task_vector_magnitude_ratio": 0.3995676040649414,
          "singular_value_overlap": 0.3622218668460846,
          "subspace_overlap": -0.2828082740306854,
          "right_subspace_overlap": -0.24369873106479645,
          "activation_l2_distance": -0.009047038853168488,
          "activation_cosine_similarity": 0.21375831961631775,
          "activation_magnitude_ratio": 0.30831584334373474,
          "activation_dot_product": 0.05034558102488518,
          "encoder_gradient_cosine_similarity": 0.1769859790802002,
          "encoder_gradient_l2_distance": -0.30788496136665344,
          "encoder_gradient_dot_product": 0.33368295431137085,
          "input_gradient_cosine_similarity": -0.10540717840194702,
          "input_gradient_l2_distance": 0.1215275451540947,
          "input_gradient_dot_product": 0.4210260510444641
        }
      }
    ],
    "optimization_params": {
      "objective": "MSE",
      "n_iterations": 1000,
      "learning_rate": 0.01,
      "patience": 50,
      "convergence_threshold": 1e-06
    }
  }
}