{
  "aggregate_metrics": {
    "train_mse": 65.79623127721104,
    "train_r2": -16117.626068648115,
    "train_pearson_r": 0.07062355252309695,
    "train_pearson_p": 6.0146370816548416e-05,
    "val_mse": 90.3225586423997,
    "val_r2": -22126.03541227111,
    "val_pearson_r": -0.06616280631831493,
    "val_pearson_p": 0.21172002583663055
  },
  "per_fold_stats": {
    "train_mse_mean": 66.0003218085351,
    "train_mse_std": 196.43723756756944,
    "val_mse_mean": 88.44176990727794,
    "val_mse_std": 285.64235820484515,
    "train_r_mean": 0.23314818778393867,
    "train_r_std": 0.22833233962500848,
    "val_r_mean": 0.18687256302310465,
    "val_r_std": 0.35235980022069285
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 1.8058252334594727,
    "right_subspace_overlap_bottom_k": -1.3870881795883179,
    "interaction_matrix_overlap_top_k": 0.8444067239761353,
    "interaction_matrix_overlap_bottom_k": 1.2753050327301025,
    "effective_rank": 1.5006048679351807,
    "effective_rank_mergeability_score": 0.00985858403146267,
    "stable_rank": 1.307286024093628,
    "spectral_gap": -1.4312965869903564,
    "singular_value_ratio": -2.8738560676574707,
    "layerwise_effective_rank": -1.5182852745056152,
    "layerwise_effective_rank_mergeability_score": -0.5700728297233582,
    "task_vector_cosine_similarity": -0.6403070688247681,
    "task_vector_l2_distance": 0.09525584429502487,
    "task_vector_dot_product": 0.39443689584732056,
    "weight_space_angle": -1.3025461435317993,
    "task_vector_magnitude_ratio": 0.3075953423976898,
    "singular_value_overlap": 1.067650556564331,
    "subspace_overlap": 1.3921890258789062,
    "right_subspace_overlap": -1.7947447299957275,
    "activation_l2_distance": -0.5298110246658325,
    "activation_cosine_similarity": 0.8698446154594421,
    "activation_magnitude_ratio": 0.5118957757949829,
    "activation_dot_product": 0.2537786066532135,
    "encoder_gradient_cosine_similarity": 1.532606601715088,
    "encoder_gradient_l2_distance": -0.5751479864120483,
    "encoder_gradient_dot_product": 0.4765914976596832,
    "input_gradient_cosine_similarity": -1.2081639766693115,
    "input_gradient_l2_distance": -0.41626840829849243,
    "input_gradient_dot_product": 1.5912938117980957
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 5.105084419250488,
    "right_subspace_overlap_bottom_k": 7.868483543395996,
    "interaction_matrix_overlap_top_k": 3.99006724357605,
    "interaction_matrix_overlap_bottom_k": 3.1081314086914062,
    "effective_rank": 4.639261245727539,
    "effective_rank_mergeability_score": 1.9102100133895874,
    "stable_rank": 5.668040752410889,
    "spectral_gap": 8.164864540100098,
    "singular_value_ratio": 8.715383529663086,
    "layerwise_effective_rank": 6.2415900230407715,
    "layerwise_effective_rank_mergeability_score": 3.7116498947143555,
    "task_vector_cosine_similarity": 5.086080551147461,
    "task_vector_l2_distance": 1.4514036178588867,
    "task_vector_dot_product": 3.163069725036621,
    "weight_space_angle": 6.166738033294678,
    "task_vector_magnitude_ratio": 5.634439945220947,
    "singular_value_overlap": 4.105656623840332,
    "subspace_overlap": 7.451869487762451,
    "right_subspace_overlap": 5.263078212738037,
    "activation_l2_distance": 3.455319404602051,
    "activation_cosine_similarity": 6.879420757293701,
    "activation_magnitude_ratio": 1.882379174232483,
    "activation_dot_product": 3.6240499019622803,
    "encoder_gradient_cosine_similarity": 5.814236164093018,
    "encoder_gradient_l2_distance": 4.5888872146606445,
    "encoder_gradient_dot_product": 3.2293033599853516,
    "input_gradient_cosine_similarity": 5.052158355712891,
    "input_gradient_l2_distance": 8.169217109680176,
    "input_gradient_dot_product": 4.96410608291626
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.006494030915670673,
      "train_r2": -0.6421228444603617,
      "train_pearson_r": 0.5502301533513804,
      "val_mse": 0.005995544139338355,
      "val_r2": -2.0396282759634987,
      "val_pearson_r": 0.5412642194579437,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5015450716018677,
        "right_subspace_overlap_bottom_k": 0.10363337397575378,
        "interaction_matrix_overlap_top_k": -0.6193697452545166,
        "interaction_matrix_overlap_bottom_k": -0.2125515341758728,
        "effective_rank": 0.22710831463336945,
        "effective_rank_mergeability_score": -0.045060690492391586,
        "stable_rank": 0.04158557951450348,
        "spectral_gap": 0.054597336798906326,
        "singular_value_ratio": -0.3537108898162842,
        "layerwise_effective_rank": 0.060531772673130035,
        "layerwise_effective_rank_mergeability_score": 0.24425353109836578,
        "task_vector_cosine_similarity": -0.06813260912895203,
        "task_vector_l2_distance": 0.048835862427949905,
        "task_vector_dot_product": -0.11705438792705536,
        "weight_space_angle": 0.04085724055767059,
        "task_vector_magnitude_ratio": 0.2987034320831299,
        "singular_value_overlap": 0.040603116154670715,
        "subspace_overlap": 0.04257604479789734,
        "right_subspace_overlap": 0.08585675805807114,
        "activation_l2_distance": 0.5054065585136414,
        "activation_cosine_similarity": 0.7095668315887451,
        "activation_magnitude_ratio": 0.004388925153762102,
        "activation_dot_product": -0.2056703418493271,
        "encoder_gradient_cosine_similarity": 0.028838496655225754,
        "encoder_gradient_l2_distance": -0.1839449405670166,
        "encoder_gradient_dot_product": 0.06832937151193619,
        "input_gradient_cosine_similarity": -0.10361086577177048,
        "input_gradient_l2_distance": -0.11409493535757065,
        "input_gradient_dot_product": -0.08384513854980469
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.017618485366996044,
      "train_r2": -3.230767285701382,
      "train_pearson_r": 0.3611250928545767,
      "val_mse": 0.016266523948033147,
      "val_r2": -7.318835538134424,
      "val_pearson_r": 0.11486767448792917,
      "n_iterations": 60,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.04346197098493576,
        "right_subspace_overlap_bottom_k": -0.028818411752581596,
        "interaction_matrix_overlap_top_k": -0.13633374869823456,
        "interaction_matrix_overlap_bottom_k": -0.04926997423171997,
        "effective_rank": 0.0968763530254364,
        "effective_rank_mergeability_score": 0.21399913728237152,
        "stable_rank": 0.09424205869436264,
        "spectral_gap": 0.1959235817193985,
        "singular_value_ratio": -0.24144825339317322,
        "layerwise_effective_rank": -0.14591005444526672,
        "layerwise_effective_rank_mergeability_score": -0.036461781710386276,
        "task_vector_cosine_similarity": -0.06280477344989777,
        "task_vector_l2_distance": 0.11381185799837112,
        "task_vector_dot_product": -0.5055162906646729,
        "weight_space_angle": -0.06947128474712372,
        "task_vector_magnitude_ratio": 0.600864052772522,
        "singular_value_overlap": 0.1628025770187378,
        "subspace_overlap": 0.16535358130931854,
        "right_subspace_overlap": -0.045025456696748734,
        "activation_l2_distance": 0.2148231565952301,
        "activation_cosine_similarity": 0.3410813808441162,
        "activation_magnitude_ratio": 0.12666359543800354,
        "activation_dot_product": 0.024881675839424133,
        "encoder_gradient_cosine_similarity": 0.0681108832359314,
        "encoder_gradient_l2_distance": -0.28165772557258606,
        "encoder_gradient_dot_product": 0.23950369656085968,
        "input_gradient_cosine_similarity": 0.01158287562429905,
        "input_gradient_l2_distance": -0.11265236884355545,
        "input_gradient_dot_product": 0.08559601753950119
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 12.766052528450437,
      "train_r2": -3008.6953853661917,
      "train_pearson_r": -0.12457106631186576,
      "val_mse": 10.10043942656666,
      "val_r2": -4599.186835708717,
      "val_pearson_r": -0.22364587011934592,
      "n_iterations": 52,
      "coefficients": {
        "right_subspace_overlap_top_k": 8.217000007629395,
        "right_subspace_overlap_bottom_k": 3.439969778060913,
        "interaction_matrix_overlap_top_k": -1.489062786102295,
        "interaction_matrix_overlap_bottom_k": 4.684792995452881,
        "effective_rank": 6.010285377502441,
        "effective_rank_mergeability_score": 4.348766803741455,
        "stable_rank": -2.834906816482544,
        "spectral_gap": -0.9944260716438293,
        "singular_value_ratio": -2.6480660438537598,
        "layerwise_effective_rank": -4.101172924041748,
        "layerwise_effective_rank_mergeability_score": -2.681809663772583,
        "task_vector_cosine_similarity": 3.7345471382141113,
        "task_vector_l2_distance": -3.0967466831207275,
        "task_vector_dot_product": -1.1798949241638184,
        "weight_space_angle": 7.961326599121094,
        "task_vector_magnitude_ratio": 5.037882328033447,
        "singular_value_overlap": -2.5016603469848633,
        "subspace_overlap": -8.176319122314453,
        "right_subspace_overlap": -0.5958988070487976,
        "activation_l2_distance": -5.12571907043457,
        "activation_cosine_similarity": -3.780369520187378,
        "activation_magnitude_ratio": -1.6821027994155884,
        "activation_dot_product": 2.2067089080810547,
        "encoder_gradient_cosine_similarity": -4.560495376586914,
        "encoder_gradient_l2_distance": -3.5891568660736084,
        "encoder_gradient_dot_product": 0.9575493931770325,
        "input_gradient_cosine_similarity": -0.4814671576023102,
        "input_gradient_l2_distance": 2.0050418376922607,
        "input_gradient_dot_product": 1.8827824592590332
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.8359693014179114,
      "train_r2": -203.05431680509224,
      "train_pearson_r": -0.10394448987677578,
      "val_mse": 0.42983159869450355,
      "val_r2": -212.65934671486062,
      "val_pearson_r": -0.36396651198520646,
      "n_iterations": 140,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.5302114486694336,
        "right_subspace_overlap_bottom_k": -0.5816190838813782,
        "interaction_matrix_overlap_top_k": -2.069439649581909,
        "interaction_matrix_overlap_bottom_k": -1.7333592176437378,
        "effective_rank": -1.4569010734558105,
        "effective_rank_mergeability_score": -2.258430242538452,
        "stable_rank": -0.4789849519729614,
        "spectral_gap": 3.926006317138672,
        "singular_value_ratio": 3.3322715759277344,
        "layerwise_effective_rank": 0.9888357520103455,
        "layerwise_effective_rank_mergeability_score": 0.6629985570907593,
        "task_vector_cosine_similarity": -0.696834921836853,
        "task_vector_l2_distance": 2.529909372329712,
        "task_vector_dot_product": -2.3062338829040527,
        "weight_space_angle": -2.8664565086364746,
        "task_vector_magnitude_ratio": 0.45339176058769226,
        "singular_value_overlap": 0.8926398754119873,
        "subspace_overlap": -0.10864519327878952,
        "right_subspace_overlap": 2.247804641723633,
        "activation_l2_distance": -2.3866171836853027,
        "activation_cosine_similarity": -0.4901508390903473,
        "activation_magnitude_ratio": -0.7885288000106812,
        "activation_dot_product": -1.2396271228790283,
        "encoder_gradient_cosine_similarity": 0.3621945083141327,
        "encoder_gradient_l2_distance": 1.1537203788757324,
        "encoder_gradient_dot_product": 2.4894931316375732,
        "input_gradient_cosine_similarity": 0.671427309513092,
        "input_gradient_l2_distance": 0.8815101385116577,
        "input_gradient_dot_product": -1.6711146831512451
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.008709599238155272,
      "train_r2": -1.1134529581463704,
      "train_pearson_r": 0.47406820269825706,
      "val_mse": 0.016556172314183975,
      "val_r2": -5.337283508445506,
      "val_pearson_r": 0.5598055133047942,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.07785766571760178,
        "right_subspace_overlap_bottom_k": -0.1901814043521881,
        "interaction_matrix_overlap_top_k": -0.5809399485588074,
        "interaction_matrix_overlap_bottom_k": 0.0470866933465004,
        "effective_rank": 0.12265483289957047,
        "effective_rank_mergeability_score": -0.06759938597679138,
        "stable_rank": 0.30898961424827576,
        "spectral_gap": 0.274494469165802,
        "singular_value_ratio": -0.17514237761497498,
        "layerwise_effective_rank": 0.04871784895658493,
        "layerwise_effective_rank_mergeability_score": 0.43862536549568176,
        "task_vector_cosine_similarity": -0.6122279167175293,
        "task_vector_l2_distance": 0.07628201693296432,
        "task_vector_dot_product": -0.07129103690385818,
        "weight_space_angle": -0.0798344761133194,
        "task_vector_magnitude_ratio": 0.3191929757595062,
        "singular_value_overlap": 0.0846552699804306,
        "subspace_overlap": 0.7021064758300781,
        "right_subspace_overlap": 0.26953980326652527,
        "activation_l2_distance": 0.25857555866241455,
        "activation_cosine_similarity": 0.4702267348766327,
        "activation_magnitude_ratio": 0.015008204616606236,
        "activation_dot_product": -0.10106448829174042,
        "encoder_gradient_cosine_similarity": 0.05184703320264816,
        "encoder_gradient_l2_distance": -0.21650637686252594,
        "encoder_gradient_dot_product": 0.040335625410079956,
        "input_gradient_cosine_similarity": -0.19937364757061005,
        "input_gradient_l2_distance": -0.08643071353435516,
        "input_gradient_dot_product": -0.06962601840496063
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_mse": 0.22738131496138178,
      "train_r2": -53.899894521297185,
      "train_pearson_r": -0.07884424390987158,
      "val_mse": 0.09477467640436288,
      "val_r2": -42.4756400096251,
      "val_pearson_r": -0.22063925725182637,
      "n_iterations": 160,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.9845483899116516,
        "right_subspace_overlap_bottom_k": -0.007197195664048195,
        "interaction_matrix_overlap_top_k": -0.28488847613334656,
        "interaction_matrix_overlap_bottom_k": -0.2673262655735016,
        "effective_rank": 0.8626580834388733,
        "effective_rank_mergeability_score": -0.8152667284011841,
        "stable_rank": 0.45300164818763733,
        "spectral_gap": 0.9303023219108582,
        "singular_value_ratio": -0.02795748971402645,
        "layerwise_effective_rank": -0.4817885756492615,
        "layerwise_effective_rank_mergeability_score": 0.34374478459358215,
        "task_vector_cosine_similarity": 0.3980044424533844,
        "task_vector_l2_distance": 0.33917030692100525,
        "task_vector_dot_product": 0.15200018882751465,
        "weight_space_angle": 0.3846574127674103,
        "task_vector_magnitude_ratio": -0.2021251916885376,
        "singular_value_overlap": -0.8046612739562988,
        "subspace_overlap": 0.8721202611923218,
        "right_subspace_overlap": 0.3012221157550812,
        "activation_l2_distance": -0.5389862656593323,
        "activation_cosine_similarity": 0.245595782995224,
        "activation_magnitude_ratio": 0.3652581572532654,
        "activation_dot_product": -0.3724941313266754,
        "encoder_gradient_cosine_similarity": -0.000722814816981554,
        "encoder_gradient_l2_distance": -0.14944183826446533,
        "encoder_gradient_dot_product": 0.32912489771842957,
        "input_gradient_cosine_similarity": 0.00222951197065413,
        "input_gradient_l2_distance": 0.06534621864557266,
        "input_gradient_dot_product": -0.1062127947807312
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_mse": 0.07715142973030652,
      "train_r2": -18.350480722785026,
      "train_pearson_r": 0.04258242332034279,
      "val_mse": 0.17407325942701377,
      "val_r2": -95.11120718332711,
      "val_pearson_r": 0.16523711450517764,
      "n_iterations": 62,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.050340160727500916,
        "right_subspace_overlap_bottom_k": -0.11002074182033539,
        "interaction_matrix_overlap_top_k": -0.3335300385951996,
        "interaction_matrix_overlap_bottom_k": 0.13023170828819275,
        "effective_rank": -0.0021546429488807917,
        "effective_rank_mergeability_score": 0.0038985502906143665,
        "stable_rank": 0.5357245206832886,
        "spectral_gap": -0.2187800407409668,
        "singular_value_ratio": 0.015362914651632309,
        "layerwise_effective_rank": -0.16645604372024536,
        "layerwise_effective_rank_mergeability_score": 0.4061454236507416,
        "task_vector_cosine_similarity": 0.21020154654979706,
        "task_vector_l2_distance": 0.263214111328125,
        "task_vector_dot_product": 0.07244568318128586,
        "weight_space_angle": 0.2254849076271057,
        "task_vector_magnitude_ratio": -0.2686350345611572,
        "singular_value_overlap": 0.7414997816085815,
        "subspace_overlap": 0.14183814823627472,
        "right_subspace_overlap": -0.17304667830467224,
        "activation_l2_distance": -0.12136116623878479,
        "activation_cosine_similarity": -0.004341526888310909,
        "activation_magnitude_ratio": 0.16559019684791565,
        "activation_dot_product": 0.007339825853705406,
        "encoder_gradient_cosine_similarity": 0.017921313643455505,
        "encoder_gradient_l2_distance": -0.019042152911424637,
        "encoder_gradient_dot_product": -0.02745748870074749,
        "input_gradient_cosine_similarity": -0.25587528944015503,
        "input_gradient_l2_distance": -0.0316561795771122,
        "input_gradient_dot_product": -0.16206450760364532
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 790.2211886136038,
      "train_r2": -220078.69557729142,
      "train_pearson_r": 0.21821325787578505,
      "val_mse": 1268.7345558885254,
      "val_r2": -663189.3748691857,
      "val_pearson_r": 0.023490154904212746,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.009305715560913,
        "right_subspace_overlap_bottom_k": -34.6861572265625,
        "interaction_matrix_overlap_top_k": 16.970306396484375,
        "interaction_matrix_overlap_bottom_k": 4.202853202819824,
        "effective_rank": 5.205721855163574,
        "effective_rank_mergeability_score": -6.134680271148682,
        "stable_rank": 25.40328598022461,
        "spectral_gap": -36.555938720703125,
        "singular_value_ratio": -33.41578674316406,
        "layerwise_effective_rank": -23.56412124633789,
        "layerwise_effective_rank_mergeability_score": -10.626612663269043,
        "task_vector_cosine_similarity": -2.5167434215545654,
        "task_vector_l2_distance": 4.684350490570068,
        "task_vector_dot_product": 12.558123588562012,
        "weight_space_angle": -9.546321868896484,
        "task_vector_magnitude_ratio": 15.725997924804688,
        "singular_value_overlap": 18.427377700805664,
        "subspace_overlap": 32.693763732910156,
        "right_subspace_overlap": -21.106319427490234,
        "activation_l2_distance": -3.740892171859741,
        "activation_cosine_similarity": 29.25728416442871,
        "activation_magnitude_ratio": 0.6357885003089905,
        "activation_dot_product": -4.809090614318848,
        "encoder_gradient_cosine_similarity": 14.781245231628418,
        "encoder_gradient_l2_distance": -16.753376007080078,
        "encoder_gradient_dot_product": -9.132038116455078,
        "input_gradient_cosine_similarity": -14.364052772521973,
        "input_gradient_l2_distance": 24.429950714111328,
        "input_gradient_dot_product": 20.89995574951172
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_mse": 0.008190921941981911,
      "train_r2": -0.960411718356533,
      "train_pearson_r": 0.4864551354404168,
      "val_mse": 0.007883520365991381,
      "val_r2": -2.295904720193254,
      "val_pearson_r": 0.5740658718205838,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0811174288392067,
        "right_subspace_overlap_bottom_k": 0.1496574729681015,
        "interaction_matrix_overlap_top_k": -0.12665148079395294,
        "interaction_matrix_overlap_bottom_k": -0.31740668416023254,
        "effective_rank": 0.11684655398130417,
        "effective_rank_mergeability_score": -0.017690453678369522,
        "stable_rank": 0.5691369771957397,
        "spectral_gap": 0.15639087557792664,
        "singular_value_ratio": 0.14784710109233856,
        "layerwise_effective_rank": -0.1444728672504425,
        "layerwise_effective_rank_mergeability_score": 0.41319698095321655,
        "task_vector_cosine_similarity": -0.22827987372875214,
        "task_vector_l2_distance": 0.09267397224903107,
        "task_vector_dot_product": -0.1668136864900589,
        "weight_space_angle": 0.11161430925130844,
        "task_vector_magnitude_ratio": -0.18548016250133514,
        "singular_value_overlap": 0.07599227130413055,
        "subspace_overlap": 0.17968812584877014,
        "right_subspace_overlap": 0.32365626096725464,
        "activation_l2_distance": 0.11460516601800919,
        "activation_cosine_similarity": 0.29382216930389404,
        "activation_magnitude_ratio": -0.0013622479746118188,
        "activation_dot_product": -0.07440344989299774,
        "encoder_gradient_cosine_similarity": 0.03336207941174507,
        "encoder_gradient_l2_distance": -0.241509348154068,
        "encoder_gradient_dot_product": 0.11271486431360245,
        "input_gradient_cosine_similarity": -0.13750885426998138,
        "input_gradient_l2_distance": -0.08531773835420609,
        "input_gradient_dot_product": -0.08262838423252106
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 30.480466468112304,
      "train_r2": -7721.196746188418,
      "train_pearson_r": 0.1032860590550282,
      "val_mse": 70.52953206072127,
      "val_r2": -23953.083242817604,
      "val_pearson_r": -0.13505421595863687,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.5628321170806885,
        "right_subspace_overlap_bottom_k": -2.194441556930542,
        "interaction_matrix_overlap_top_k": 3.1257903575897217,
        "interaction_matrix_overlap_bottom_k": 8.487127304077148,
        "effective_rank": -2.8871192932128906,
        "effective_rank_mergeability_score": 0.8939045071601868,
        "stable_rank": 4.099572658538818,
        "spectral_gap": 4.238776683807373,
        "singular_value_ratio": -3.2769062519073486,
        "layerwise_effective_rank": 10.047021865844727,
        "layerwise_effective_rank_mergeability_score": 8.43239688873291,
        "task_vector_cosine_similarity": 6.704230785369873,
        "task_vector_l2_distance": -1.295399785041809,
        "task_vector_dot_product": 4.290590763092041,
        "weight_space_angle": -0.5699487924575806,
        "task_vector_magnitude_ratio": 3.8975348472595215,
        "singular_value_overlap": -0.61711585521698,
        "subspace_overlap": -1.998716950416565,
        "right_subspace_overlap": -4.783637523651123,
        "activation_l2_distance": -10.123641014099121,
        "activation_cosine_similarity": -2.6867570877075195,
        "activation_magnitude_ratio": 1.4996728897094727,
        "activation_dot_product": -5.669218063354492,
        "encoder_gradient_cosine_similarity": -0.8821572065353394,
        "encoder_gradient_l2_distance": -0.5064927935600281,
        "encoder_gradient_dot_product": 2.3351547718048096,
        "input_gradient_cosine_similarity": -16.712331771850586,
        "input_gradient_l2_distance": -6.22330379486084,
        "input_gradient_dot_product": 1.7647422552108765
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.008914298319485066,
      "train_r2": -1.5391685274862281,
      "train_pearson_r": 0.4822302498540507,
      "val_mse": 0.011550898448410458,
      "val_r2": -5.920606845472527,
      "val_pearson_r": 0.4520083941971499,
      "n_iterations": 567,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.18293428421020508,
        "right_subspace_overlap_bottom_k": -0.18692001700401306,
        "interaction_matrix_overlap_top_k": 0.08366822451353073,
        "interaction_matrix_overlap_bottom_k": 0.03771665692329407,
        "effective_rank": 0.2193940281867981,
        "effective_rank_mergeability_score": -0.2656913995742798,
        "stable_rank": -0.10567401349544525,
        "spectral_gap": 0.07903212308883667,
        "singular_value_ratio": -0.0006082195322960615,
        "layerwise_effective_rank": 0.1999851018190384,
        "layerwise_effective_rank_mergeability_score": 0.4826907217502594,
        "task_vector_cosine_similarity": -0.1089906096458435,
        "task_vector_l2_distance": 0.015750987455248833,
        "task_vector_dot_product": 0.2447122484445572,
        "weight_space_angle": 0.42036131024360657,
        "task_vector_magnitude_ratio": -0.028608379885554314,
        "singular_value_overlap": 0.07582012563943863,
        "subspace_overlap": -0.12130072712898254,
        "right_subspace_overlap": -0.09205377101898193,
        "activation_l2_distance": 0.13660269975662231,
        "activation_cosine_similarity": 0.3839362859725952,
        "activation_magnitude_ratio": 0.019505122676491737,
        "activation_dot_product": -0.18729165196418762,
        "encoder_gradient_cosine_similarity": 0.03237801045179367,
        "encoder_gradient_l2_distance": -0.1992858648300171,
        "encoder_gradient_dot_product": 0.14459802210330963,
        "input_gradient_cosine_similarity": -0.15804991126060486,
        "input_gradient_l2_distance": -0.09388505667448044,
        "input_gradient_dot_product": -0.2105865627527237
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.019149383341182054,
      "train_r2": -3.6084033411560297,
      "train_pearson_r": 0.2200561445405937,
      "val_mse": 0.022661796011881376,
      "val_r2": -10.14438253810115,
      "val_pearson_r": 0.08390384455341292,
      "n_iterations": 248,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.27666279673576355,
        "right_subspace_overlap_bottom_k": 0.18792949616909027,
        "interaction_matrix_overlap_top_k": -0.06309544295072556,
        "interaction_matrix_overlap_bottom_k": -0.3646450936794281,
        "effective_rank": 0.3512739837169647,
        "effective_rank_mergeability_score": -0.3554307818412781,
        "stable_rank": 0.3314375579357147,
        "spectral_gap": 0.3314051628112793,
        "singular_value_ratio": -0.4250406324863434,
        "layerwise_effective_rank": -0.2722756862640381,
        "layerwise_effective_rank_mergeability_score": 0.2668405771255493,
        "task_vector_cosine_similarity": 0.3138699233531952,
        "task_vector_l2_distance": 0.08469494432210922,
        "task_vector_dot_product": 0.3001410961151123,
        "weight_space_angle": 0.40639904141426086,
        "task_vector_magnitude_ratio": 0.25414642691612244,
        "singular_value_overlap": 0.1404152810573578,
        "subspace_overlap": -0.17061026394367218,
        "right_subspace_overlap": 0.19634214043617249,
        "activation_l2_distance": -0.08530935645103455,
        "activation_cosine_similarity": 0.21539151668548584,
        "activation_magnitude_ratio": 0.02747342549264431,
        "activation_dot_product": -0.2075960636138916,
        "encoder_gradient_cosine_similarity": 0.023540543392300606,
        "encoder_gradient_l2_distance": -0.22208160161972046,
        "encoder_gradient_dot_product": 0.18840713798999786,
        "input_gradient_cosine_similarity": -0.026091113686561584,
        "input_gradient_l2_distance": -0.047991253435611725,
        "input_gradient_dot_product": -0.10526027530431747
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 483.0389718128666,
      "train_r2": -122779.53724427204,
      "train_pearson_r": 0.1659078141421891,
      "val_mse": 416.53661077233886,
      "val_r2": -206528.25304895968,
      "val_pearson_r": 0.29625609615623205,
      "n_iterations": 52,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.54905128479004,
        "right_subspace_overlap_bottom_k": 7.427090644836426,
        "interaction_matrix_overlap_top_k": 4.97927713394165,
        "interaction_matrix_overlap_bottom_k": 10.497476577758789,
        "effective_rank": 19.934619903564453,
        "effective_rank_mergeability_score": 2.2789947986602783,
        "stable_rank": -2.076051712036133,
        "spectral_gap": -1.25151789188385,
        "singular_value_ratio": -23.099252700805664,
        "layerwise_effective_rank": -12.26413345336914,
        "layerwise_effective_rank_mergeability_score": -9.359789848327637,
        "task_vector_cosine_similarity": -21.369659423828125,
        "task_vector_l2_distance": -1.3216900825500488,
        "task_vector_dot_product": -4.338826656341553,
        "weight_space_angle": -25.0842342376709,
        "task_vector_magnitude_ratio": -18.61222267150879,
        "singular_value_overlap": 3.3477306365966797,
        "subspace_overlap": 2.7042360305786133,
        "right_subspace_overlap": -11.923957824707031,
        "activation_l2_distance": 9.72875690460205,
        "activation_cosine_similarity": -8.923073768615723,
        "activation_magnitude_ratio": 8.25240421295166,
        "activation_dot_product": 14.189093589782715,
        "encoder_gradient_cosine_similarity": 21.836345672607422,
        "encoder_gradient_l2_distance": 11.45976734161377,
        "encoder_gradient_dot_product": 10.793251991271973,
        "input_gradient_cosine_similarity": 7.105270862579346,
        "input_gradient_l2_distance": -26.329198837280273,
        "input_gradient_dot_product": 9.82205581665039
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.25757817469329625,
      "train_r2": -60.17602549828345,
      "train_pearson_r": 0.45944111255731035,
      "val_mse": 0.14413720465806978,
      "val_r2": -56.07052414347014,
      "val_pearson_r": 0.6556563510173351,
      "n_iterations": 77,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.36649617552757263,
        "right_subspace_overlap_bottom_k": -0.2784446179866791,
        "interaction_matrix_overlap_top_k": -0.008806105703115463,
        "interaction_matrix_overlap_bottom_k": -0.05355469882488251,
        "effective_rank": 0.7377135157585144,
        "effective_rank_mergeability_score": 0.46871641278266907,
        "stable_rank": 0.11825310438871384,
        "spectral_gap": -0.09907730668783188,
        "singular_value_ratio": -0.15386778116226196,
        "layerwise_effective_rank": 0.1316457986831665,
        "layerwise_effective_rank_mergeability_score": -0.35481786727905273,
        "task_vector_cosine_similarity": -0.05425296723842621,
        "task_vector_l2_distance": -0.243205264210701,
        "task_vector_dot_product": 0.0139019088819623,
        "weight_space_angle": 0.16105276346206665,
        "task_vector_magnitude_ratio": -0.9024935960769653,
        "singular_value_overlap": -0.030772453173995018,
        "subspace_overlap": 0.463822603225708,
        "right_subspace_overlap": 0.5235461592674255,
        "activation_l2_distance": 0.03128408268094063,
        "activation_cosine_similarity": 0.015114519745111465,
        "activation_magnitude_ratio": 0.15386229753494263,
        "activation_dot_product": 0.22191938757896423,
        "encoder_gradient_cosine_similarity": 0.8542152643203735,
        "encoder_gradient_l2_distance": -0.5381020307540894,
        "encoder_gradient_dot_product": 0.3815673291683197,
        "input_gradient_cosine_similarity": -0.6423994898796082,
        "input_gradient_l2_distance": -0.27435964345932007,
        "input_gradient_dot_product": -0.01728706806898117
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.007088999115769163,
      "train_r2": -0.764666824171816,
      "train_pearson_r": 0.5178070346556815,
      "val_mse": 0.009506088978558659,
      "val_r2": -2.170314911519515,
      "val_pearson_r": 0.36081768240959045,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.08908762782812119,
        "right_subspace_overlap_bottom_k": 0.00542212650179863,
        "interaction_matrix_overlap_top_k": -0.03958059847354889,
        "interaction_matrix_overlap_bottom_k": -0.20513668656349182,
        "effective_rank": 0.144802987575531,
        "effective_rank_mergeability_score": -0.10307519137859344,
        "stable_rank": 0.13496220111846924,
        "spectral_gap": 0.4039575755596161,
        "singular_value_ratio": -0.07327494770288467,
        "layerwise_effective_rank": 0.09514009207487106,
        "layerwise_effective_rank_mergeability_score": 0.3227781355381012,
        "task_vector_cosine_similarity": -0.038999151438474655,
        "task_vector_l2_distance": 0.11154060810804367,
        "task_vector_dot_product": -0.17056122422218323,
        "weight_space_angle": 0.1465829759836197,
        "task_vector_magnitude_ratio": 0.34627026319503784,
        "singular_value_overlap": 0.0713743194937706,
        "subspace_overlap": -0.15693838894367218,
        "right_subspace_overlap": 0.19932085275650024,
        "activation_l2_distance": 0.0032601880375295877,
        "activation_cosine_similarity": 0.21561549603939056,
        "activation_magnitude_ratio": 0.008615673519670963,
        "activation_dot_product": -0.11034021526575089,
        "encoder_gradient_cosine_similarity": 0.04654063656926155,
        "encoder_gradient_l2_distance": -0.2303743213415146,
        "encoder_gradient_dot_product": 0.09122782945632935,
        "input_gradient_cosine_similarity": -0.13327334821224213,
        "input_gradient_l2_distance": -0.07694897055625916,
        "input_gradient_dot_product": -0.097508504986763
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_mse": 0.0385358539900475,
      "train_r2": -8.112332290859714,
      "train_pearson_r": 0.09196075438093838,
      "val_mse": 0.03844176737693187,
      "val_r2": -14.781497799346775,
      "val_pearson_r": -0.595489948189134,
      "n_iterations": 146,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.15562564134597778,
        "right_subspace_overlap_bottom_k": 0.44669678807258606,
        "interaction_matrix_overlap_top_k": -0.6155273914337158,
        "interaction_matrix_overlap_bottom_k": -0.051556333899497986,
        "effective_rank": 0.7715209722518921,
        "effective_rank_mergeability_score": 0.20296114683151245,
        "stable_rank": -0.36917418241500854,
        "spectral_gap": 0.12538568675518036,
        "singular_value_ratio": 0.5030401945114136,
        "layerwise_effective_rank": 0.13848330080509186,
        "layerwise_effective_rank_mergeability_score": 0.27951833605766296,
        "task_vector_cosine_similarity": 0.1103639230132103,
        "task_vector_l2_distance": -0.18866443634033203,
        "task_vector_dot_product": 0.015484495088458061,
        "weight_space_angle": 0.40175676345825195,
        "task_vector_magnitude_ratio": -0.4313904345035553,
        "singular_value_overlap": 0.03406348451972008,
        "subspace_overlap": -0.1950450986623764,
        "right_subspace_overlap": 0.01399340108036995,
        "activation_l2_distance": -0.11147083342075348,
        "activation_cosine_similarity": -0.23570358753204346,
        "activation_magnitude_ratio": -0.04420734569430351,
        "activation_dot_product": 0.41736388206481934,
        "encoder_gradient_cosine_similarity": -0.07659336924552917,
        "encoder_gradient_l2_distance": 0.07627225667238235,
        "encoder_gradient_dot_product": 0.2440914362668991,
        "input_gradient_cosine_similarity": 0.03755611181259155,
        "input_gradient_l2_distance": -0.2676520347595215,
        "input_gradient_dot_product": -0.38554540276527405
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.010228235786176144,
      "train_r2": -1.4053076087720227,
      "train_pearson_r": 0.48577769765098117,
      "val_mse": 0.0074377520816650946,
      "val_r2": -2.1211595646778965,
      "val_pearson_r": 0.5586120664903695,
      "n_iterations": 345,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.13803917169570923,
        "right_subspace_overlap_bottom_k": -0.17891088128089905,
        "interaction_matrix_overlap_top_k": 0.21925729513168335,
        "interaction_matrix_overlap_bottom_k": 0.005509282927960157,
        "effective_rank": 0.30700239539146423,
        "effective_rank_mergeability_score": 0.16402755677700043,
        "stable_rank": 0.11458805948495865,
        "spectral_gap": 0.2638954222202301,
        "singular_value_ratio": 0.21088187396526337,
        "layerwise_effective_rank": -0.07645384967327118,
        "layerwise_effective_rank_mergeability_score": 0.05673651769757271,
        "task_vector_cosine_similarity": -0.16174942255020142,
        "task_vector_l2_distance": 0.07730579376220703,
        "task_vector_dot_product": -0.049913741648197174,
        "weight_space_angle": 0.3033444285392761,
        "task_vector_magnitude_ratio": -0.06537418067455292,
        "singular_value_overlap": 0.1118941605091095,
        "subspace_overlap": -0.051867496222257614,
        "right_subspace_overlap": -0.07735401391983032,
        "activation_l2_distance": 0.03582616522908211,
        "activation_cosine_similarity": 0.23547285795211792,
        "activation_magnitude_ratio": 0.001753176562488079,
        "activation_dot_product": -0.10080750286579132,
        "encoder_gradient_cosine_similarity": 0.06684447079896927,
        "encoder_gradient_l2_distance": -0.23351289331912994,
        "encoder_gradient_dot_product": 0.07952415943145752,
        "input_gradient_cosine_similarity": -0.1651258021593094,
        "input_gradient_l2_distance": -0.08456519991159439,
        "input_gradient_dot_product": -0.1461227983236313
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.04734283898294622,
      "train_r2": -10.893478182173492,
      "train_pearson_r": -0.06250984067793834,
      "val_mse": 0.12189492610290811,
      "val_r2": -49.303750287631026,
      "val_pearson_r": 0.058006786296928126,
      "n_iterations": 90,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.10434316098690033,
        "right_subspace_overlap_bottom_k": -0.02318265475332737,
        "interaction_matrix_overlap_top_k": -0.21814373135566711,
        "interaction_matrix_overlap_bottom_k": 0.18677540123462677,
        "effective_rank": 0.4899005591869354,
        "effective_rank_mergeability_score": 0.025957278907299042,
        "stable_rank": 0.3019057810306549,
        "spectral_gap": 0.16941404342651367,
        "singular_value_ratio": -0.14827415347099304,
        "layerwise_effective_rank": -0.354532390832901,
        "layerwise_effective_rank_mergeability_score": 0.08288277685642242,
        "task_vector_cosine_similarity": 0.12443062663078308,
        "task_vector_l2_distance": 0.057022351771593094,
        "task_vector_dot_product": 0.38631290197372437,
        "weight_space_angle": 0.2655068337917328,
        "task_vector_magnitude_ratio": -0.0991905927658081,
        "singular_value_overlap": 0.3681139349937439,
        "subspace_overlap": -0.2184048295021057,
        "right_subspace_overlap": -0.2936374843120575,
        "activation_l2_distance": 0.1309366226196289,
        "activation_cosine_similarity": -0.09346876293420792,
        "activation_magnitude_ratio": 0.15795373916625977,
        "activation_dot_product": 0.31821408867836,
        "encoder_gradient_cosine_similarity": 0.17174215614795685,
        "encoder_gradient_l2_distance": -0.24789246916770935,
        "encoder_gradient_dot_product": -0.2728075683116913,
        "input_gradient_cosine_similarity": -0.21304456889629364,
        "input_gradient_l2_distance": 0.24864834547042847,
        "input_gradient_dot_product": -0.2029271125793457
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.03720138076406366,
      "train_r2": -7.545245952907997,
      "train_pearson_r": 0.05116232663733686,
      "val_mse": 0.03030174090456845,
      "val_r2": -17.603830586566783,
      "val_pearson_r": 0.2165329673086095,
      "n_iterations": 189,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.3158283233642578,
        "right_subspace_overlap_bottom_k": -0.03691960498690605,
        "interaction_matrix_overlap_top_k": -0.5229999423027039,
        "interaction_matrix_overlap_bottom_k": -0.1604398787021637,
        "effective_rank": 0.13891205191612244,
        "effective_rank_mergeability_score": -0.3434264361858368,
        "stable_rank": 0.2833690941333771,
        "spectral_gap": 0.07643812149763107,
        "singular_value_ratio": 0.23823659121990204,
        "layerwise_effective_rank": -0.01870160549879074,
        "layerwise_effective_rank_mergeability_score": 0.3640023469924927,
        "task_vector_cosine_similarity": -0.026235029101371765,
        "task_vector_l2_distance": 0.28716567158699036,
        "task_vector_dot_product": -0.8751488327980042,
        "weight_space_angle": 0.22091174125671387,
        "task_vector_magnitude_ratio": -0.4583037197589874,
        "singular_value_overlap": 0.2495511919260025,
        "subspace_overlap": 0.4137667417526245,
        "right_subspace_overlap": 0.30703005194664,
        "activation_l2_distance": -0.23015642166137695,
        "activation_cosine_similarity": -0.43491512537002563,
        "activation_magnitude_ratio": 0.027337398380041122,
        "activation_dot_product": 0.5279589295387268,
        "encoder_gradient_cosine_similarity": 0.093532033264637,
        "encoder_gradient_l2_distance": 0.12165442854166031,
        "encoder_gradient_dot_product": 0.30076146125793457,
        "input_gradient_cosine_similarity": 0.11590798944234848,
        "input_gradient_l2_distance": -0.046727411448955536,
        "input_gradient_dot_product": 0.06809061020612717
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 1.8922024991034248,
      "train_r2": -459.6934872519553,
      "train_pearson_r": 0.32252993744035663,
      "val_mse": 1.8029465275504242,
      "val_r2": -885.0359931425609,
      "val_pearson_r": 0.6157223270559734,
      "n_iterations": 73,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.11687815189361572,
        "right_subspace_overlap_bottom_k": -0.9993511438369751,
        "interaction_matrix_overlap_top_k": -1.3817944526672363,
        "interaction_matrix_overlap_bottom_k": 0.6417780518531799,
        "effective_rank": -1.3790174722671509,
        "effective_rank_mergeability_score": 2.0022971630096436,
        "stable_rank": -0.7795419692993164,
        "spectral_gap": -0.7322129607200623,
        "singular_value_ratio": 2.114574670791626,
        "layerwise_effective_rank": -0.486050546169281,
        "layerwise_effective_rank_mergeability_score": -1.1387742757797241,
        "task_vector_cosine_similarity": 1.543121337890625,
        "task_vector_l2_distance": -0.7309049367904663,
        "task_vector_dot_product": -0.36372095346450806,
        "weight_space_angle": 1.1154882907867432,
        "task_vector_magnitude_ratio": 0.4717479646205902,
        "singular_value_overlap": 0.4826827943325043,
        "subspace_overlap": 0.6623576879501343,
        "right_subspace_overlap": -1.272273063659668,
        "activation_l2_distance": 0.7078567743301392,
        "activation_cosine_similarity": 1.6625676155090332,
        "activation_magnitude_ratio": 1.2928431034088135,
        "activation_dot_product": 0.23969514667987823,
        "encoder_gradient_cosine_similarity": -2.2965569496154785,
        "encoder_gradient_l2_distance": -0.7019978165626526,
        "encoder_gradient_dot_product": 0.16849876940250397,
        "input_gradient_cosine_similarity": 1.484951376914978,
        "input_gradient_l2_distance": -2.0810816287994385,
        "input_gradient_dot_product": 0.6433829069137573
      }
    }
  ],
  "optimization_params": {
    "objective": "MSE",
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 1e-06
  }
}