{
  "aggregate_metrics": {
    "train_r": 0.41581203760359914,
    "train_p": 6.26827177401533e-135,
    "val_r": 0.04981601091731226,
    "val_p": 0.3472942834632255
  },
  "per_fold_stats": {
    "train_r_mean": 0.5590102767517646,
    "train_r_std": 0.049449218859214356,
    "val_r_mean": 0.4424779064804386,
    "val_r_std": 0.14324887784596263,
    "n_nonzero_mean": 19.95,
    "n_nonzero_std": 3.761316258971054
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.000771186372730881,
    "right_subspace_overlap_bottom_k": 0.003557309042662382,
    "interaction_matrix_overlap_top_k": -0.0028331605717539787,
    "interaction_matrix_overlap_bottom_k": 0.03447685018181801,
    "effective_rank": -0.0006774563225917518,
    "effective_rank_mergeability_score": 0.0006938888691365719,
    "stable_rank": -0.0005642032483592629,
    "spectral_gap": 0.0002990943903569132,
    "singular_value_ratio": -0.0003529852838255465,
    "layerwise_effective_rank": -0.0008602337911725044,
    "layerwise_effective_rank_mergeability_score": 0.000725827063433826,
    "task_vector_cosine_similarity": -0.00022301636636257172,
    "task_vector_l2_distance": -0.022900372743606567,
    "task_vector_dot_product": -0.0005278041353449225,
    "weight_space_angle": 0.0008843258256092668,
    "task_vector_magnitude_ratio": -0.0058045280165970325,
    "singular_value_overlap": -0.021344900131225586,
    "subspace_overlap": 0.005373373627662659,
    "right_subspace_overlap": 0.00020797635079361498,
    "activation_l2_distance": -0.0001187356174341403,
    "activation_cosine_similarity": 0.0009398626280017197,
    "activation_magnitude_ratio": -0.005558758974075317,
    "activation_dot_product": -0.00347595801576972,
    "encoder_gradient_cosine_similarity": 0.0002979594864882529,
    "encoder_gradient_l2_distance": -0.013393186032772064,
    "encoder_gradient_dot_product": 0.00018637647735886276,
    "input_gradient_cosine_similarity": 0.0015135946450755,
    "input_gradient_l2_distance": -0.023171164095401764,
    "input_gradient_dot_product": -0.006487053819000721
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.004998355638235807,
    "right_subspace_overlap_bottom_k": 0.0055370330810546875,
    "interaction_matrix_overlap_top_k": 0.0031822386663407087,
    "interaction_matrix_overlap_bottom_k": 0.010634368285536766,
    "effective_rank": 0.0008734894217923284,
    "effective_rank_mergeability_score": 0.0008940139086917043,
    "stable_rank": 0.0007777729770168662,
    "spectral_gap": 0.0011336508905515075,
    "singular_value_ratio": 0.0008909093448892236,
    "layerwise_effective_rank": 0.0024193539284169674,
    "layerwise_effective_rank_mergeability_score": 0.0019393087131902575,
    "task_vector_cosine_similarity": 0.0019462124910205603,
    "task_vector_l2_distance": 0.010333985090255737,
    "task_vector_dot_product": 0.00223797676153481,
    "weight_space_angle": 0.0016441672341898084,
    "task_vector_magnitude_ratio": 0.0020388911943882704,
    "singular_value_overlap": 0.007576433941721916,
    "subspace_overlap": 0.004089727532118559,
    "right_subspace_overlap": 0.0021585174836218357,
    "activation_l2_distance": 0.004841342102736235,
    "activation_cosine_similarity": 0.0040938896127045155,
    "activation_magnitude_ratio": 0.0029136950615793467,
    "activation_dot_product": 0.0046693370677530766,
    "encoder_gradient_cosine_similarity": 0.0018286538543179631,
    "encoder_gradient_l2_distance": 0.005508338566869497,
    "encoder_gradient_dot_product": 0.001587862498126924,
    "input_gradient_cosine_similarity": 0.0012973534176126122,
    "input_gradient_l2_distance": 0.008264075964689255,
    "input_gradient_dot_product": 0.003065883880481124
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.45,
    "right_subspace_overlap_bottom_k": 0.9,
    "interaction_matrix_overlap_top_k": 0.7,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 0.4,
    "effective_rank_mergeability_score": 0.4,
    "stable_rank": 0.35,
    "spectral_gap": 0.5,
    "singular_value_ratio": 0.4,
    "layerwise_effective_rank": 0.55,
    "layerwise_effective_rank_mergeability_score": 0.55,
    "task_vector_cosine_similarity": 0.4,
    "task_vector_l2_distance": 0.95,
    "task_vector_dot_product": 0.65,
    "weight_space_angle": 0.5,
    "task_vector_magnitude_ratio": 0.95,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 1.0,
    "right_subspace_overlap": 0.35,
    "activation_l2_distance": 0.75,
    "activation_cosine_similarity": 0.75,
    "activation_magnitude_ratio": 1.0,
    "activation_dot_product": 0.8,
    "encoder_gradient_cosine_similarity": 0.55,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.5,
    "input_gradient_cosine_similarity": 0.65,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 1.0
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5854617798954647,
      "val_r": 0.5964049741628756,
      "n_iterations": 336,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.0027587604708969593,
        "interaction_matrix_overlap_top_k": -0.010969525203108788,
        "interaction_matrix_overlap_bottom_k": 0.027749070897698402,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0010086281690746546,
        "stable_rank": 0.0,
        "spectral_gap": -0.0011178120039403439,
        "singular_value_ratio": 0.0012271103914827108,
        "layerwise_effective_rank": 0.002391842193901539,
        "layerwise_effective_rank_mergeability_score": -0.0028714342042803764,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012460729107260704,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.005719712004065514,
        "singular_value_overlap": -0.012858293019235134,
        "subspace_overlap": 0.011259743943810463,
        "right_subspace_overlap": 0.0010688547044992447,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.003077899571508169,
        "activation_magnitude_ratio": -0.004687635228037834,
        "activation_dot_product": -0.003703347872942686,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.007720253895968199,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010256273671984673,
        "input_gradient_dot_product": -0.0031393738463521004
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5598343160521068,
      "val_r": 0.4802319593241553,
      "n_iterations": 279,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0029595668893307447,
        "interaction_matrix_overlap_top_k": -0.00288494979031384,
        "interaction_matrix_overlap_bottom_k": 0.03384906053543091,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.023483099415898323,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.006840126123279333,
        "singular_value_overlap": -0.018337465822696686,
        "subspace_overlap": 0.0018112375400960445,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0024381298571825027,
        "activation_cosine_similarity": 0.0017118381801992655,
        "activation_magnitude_ratio": -0.004561457317322493,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.0014926593285053968,
        "encoder_gradient_l2_distance": -0.016845522448420525,
        "encoder_gradient_dot_product": 0.001872923457995057,
        "input_gradient_cosine_similarity": 0.0017683302285149693,
        "input_gradient_l2_distance": -0.018842626363039017,
        "input_gradient_dot_product": -0.0027029349002987146
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5509785595039542,
      "val_r": 0.4823206829271176,
      "n_iterations": 247,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.002037945669144392,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.025325004011392593,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.001185643021017313,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.015621689148247242,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004695940297096968,
        "singular_value_overlap": -0.01590060070157051,
        "subspace_overlap": 0.003792770905420184,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.00423771096393466,
        "activation_dot_product": -0.0023560859262943268,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.009173925034701824,
        "encoder_gradient_dot_product": 0.0011871347669512033,
        "input_gradient_cosine_similarity": 0.001575128873810172,
        "input_gradient_l2_distance": -0.01621313765645027,
        "input_gradient_dot_product": -0.0069977943785488605
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5520038409731195,
      "val_r": 0.5049641080599196,
      "n_iterations": 378,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.011175630614161491,
        "interaction_matrix_overlap_top_k": -0.0037786581087857485,
        "interaction_matrix_overlap_bottom_k": 0.04352420195937157,
        "effective_rank": -0.0013932869769632816,
        "effective_rank_mergeability_score": 0.0019557003397494555,
        "stable_rank": -0.0014668668154627085,
        "spectral_gap": 0.0018305128905922174,
        "singular_value_ratio": -0.001493343384936452,
        "layerwise_effective_rank": -0.001542452024295926,
        "layerwise_effective_rank_mergeability_score": 0.0017373127629980445,
        "task_vector_cosine_similarity": -0.0015584758948534727,
        "task_vector_l2_distance": -0.03321041166782379,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.00815115962177515,
        "singular_value_overlap": -0.029935145750641823,
        "subspace_overlap": 0.005895503796637058,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0061234477907419205,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.00944657251238823,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.009805815294384956,
        "encoder_gradient_dot_product": -0.0012849490158259869,
        "input_gradient_cosine_similarity": 0.0037005236372351646,
        "input_gradient_l2_distance": -0.02814554050564766,
        "input_gradient_dot_product": -0.008749538101255894
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5939355863621305,
      "val_r": 0.5782080618901905,
      "n_iterations": 492,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0014651904348284006,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.031933967024087906,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.020801737904548645,
        "task_vector_dot_product": -0.003315472276881337,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0045225354842841625,
        "singular_value_overlap": -0.018129179254174232,
        "subspace_overlap": -0.0012885385658591986,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.001202852581627667,
        "activation_cosine_similarity": -0.0018208229448646307,
        "activation_magnitude_ratio": -0.005765118636190891,
        "activation_dot_product": -0.0012034588726237416,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.007299884222447872,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0025344151072204113,
        "input_gradient_l2_distance": -0.018506305292248726,
        "input_gradient_dot_product": -0.002709774998947978
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5663035228595943,
      "val_r": 0.6179450677284435,
      "n_iterations": 295,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.00376480957493186,
        "interaction_matrix_overlap_top_k": -0.005165766924619675,
        "interaction_matrix_overlap_bottom_k": 0.03284291923046112,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.017333179712295532,
        "task_vector_dot_product": 0.00436348607763648,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.006775065790861845,
        "singular_value_overlap": -0.015592200681567192,
        "subspace_overlap": 0.0016271410277113318,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.004894510842859745,
        "activation_dot_product": -0.0016683286521583796,
        "encoder_gradient_cosine_similarity": 0.001641861512325704,
        "encoder_gradient_l2_distance": -0.008354788646101952,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0011149403871968389,
        "input_gradient_l2_distance": -0.01126454770565033,
        "input_gradient_dot_product": -0.0034182490780949593
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5794153858561251,
      "val_r": 0.2084254564080656,
      "n_iterations": 187,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012568258680403233,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.001206244807690382,
        "interaction_matrix_overlap_bottom_k": 0.0367540642619133,
        "effective_rank": -0.00116757582873106,
        "effective_rank_mergeability_score": 0.0017708060331642628,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.018162347376346588,
        "task_vector_dot_product": -0.006130089983344078,
        "weight_space_angle": 0.002183478558436036,
        "task_vector_magnitude_ratio": -0.006573235150426626,
        "singular_value_overlap": -0.023492464795708656,
        "subspace_overlap": 0.005407592281699181,
        "right_subspace_overlap": 0.002677262993529439,
        "activation_l2_distance": -0.012351015582680702,
        "activation_cosine_similarity": 0.012339349836111069,
        "activation_magnitude_ratio": 0.0034306657034903765,
        "activation_dot_product": -0.020225465297698975,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.021291878074407578,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03108304925262928,
        "input_gradient_dot_product": -0.013210399076342583
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5194443213562621,
      "val_r": 0.3506908512145717,
      "n_iterations": 292,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.009286959655582905,
        "interaction_matrix_overlap_top_k": -0.0024412618950009346,
        "interaction_matrix_overlap_bottom_k": 0.04807247593998909,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.001273138914257288,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010430682450532913,
        "task_vector_l2_distance": -0.03535817563533783,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0018898660782724619,
        "task_vector_magnitude_ratio": -0.007832750678062439,
        "singular_value_overlap": -0.028828782960772514,
        "subspace_overlap": 0.010617786087095737,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0071038659662008286,
        "activation_dot_product": -0.0032159066759049892,
        "encoder_gradient_cosine_similarity": 0.0014660044107586145,
        "encoder_gradient_l2_distance": -0.01344169769436121,
        "encoder_gradient_dot_product": 0.0010356779675930738,
        "input_gradient_cosine_similarity": 0.0015826476737856865,
        "input_gradient_l2_distance": -0.01642231084406376,
        "input_gradient_dot_product": -0.001204141415655613
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.47792095843498517,
      "val_r": 0.1806622521476343,
      "n_iterations": 232,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0016471596900373697,
        "right_subspace_overlap_bottom_k": -0.007955561392009258,
        "interaction_matrix_overlap_top_k": -0.0030426536686718464,
        "interaction_matrix_overlap_bottom_k": 0.034660037606954575,
        "effective_rank": -0.0021067573688924313,
        "effective_rank_mergeability_score": 0.002640481572598219,
        "stable_rank": -0.0017160429852083325,
        "spectral_gap": 0.0011007392313331366,
        "singular_value_ratio": -0.0019082824001088738,
        "layerwise_effective_rank": -0.002126976614817977,
        "layerwise_effective_rank_mergeability_score": 0.0019346732879057527,
        "task_vector_cosine_similarity": -0.0010352255776524544,
        "task_vector_l2_distance": -0.011725984513759613,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.005558381322771311,
        "singular_value_overlap": -0.014069187454879284,
        "subspace_overlap": 0.005278197582811117,
        "right_subspace_overlap": 0.001716629951260984,
        "activation_l2_distance": -0.0032885887194424868,
        "activation_cosine_similarity": 0.002993218833580613,
        "activation_magnitude_ratio": -0.0022105113603174686,
        "activation_dot_product": -0.0032860753126442432,
        "encoder_gradient_cosine_similarity": 0.0033969224896281958,
        "encoder_gradient_l2_distance": -0.008230943232774734,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.014593883417546749,
        "input_gradient_dot_product": -0.007520508952438831
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5630300177778378,
      "val_r": 0.18528250870671006,
      "n_iterations": 305,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0021007212344557047,
        "right_subspace_overlap_bottom_k": 0.011583030223846436,
        "interaction_matrix_overlap_top_k": -0.003537992015480995,
        "interaction_matrix_overlap_bottom_k": 0.04032205417752266,
        "effective_rank": -0.001509809517301619,
        "effective_rank_mergeability_score": 0.0014080627588555217,
        "stable_rank": -0.0017386488616466522,
        "spectral_gap": 0.0021088968496769667,
        "singular_value_ratio": -0.0018575451103970408,
        "layerwise_effective_rank": -0.001365026691928506,
        "layerwise_effective_rank_mergeability_score": 0.001328949467279017,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0327385850250721,
        "task_vector_dot_product": -0.0022230995818972588,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.005216115154325962,
        "singular_value_overlap": -0.03061533533036709,
        "subspace_overlap": 0.010448677465319633,
        "right_subspace_overlap": -0.003004038706421852,
        "activation_l2_distance": -0.004046001471579075,
        "activation_cosine_similarity": -0.0071115377359092236,
        "activation_magnitude_ratio": -0.0062423706986010075,
        "activation_dot_product": -0.007633410859853029,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013650866225361824,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03135497123003006,
        "input_gradient_dot_product": -0.004746966529637575
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5209096407120051,
      "val_r": 0.39523215658126853,
      "n_iterations": 314,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0018224542727693915,
        "right_subspace_overlap_bottom_k": 0.004415964707732201,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.03271207958459854,
        "effective_rank": -0.00110371015034616,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012737065553665161,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0013404299970716238,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.003745407797396183,
        "task_vector_l2_distance": -0.018728584051132202,
        "task_vector_dot_product": -0.0023633763194084167,
        "weight_space_angle": 0.0020382837392389774,
        "task_vector_magnitude_ratio": -0.004438401199877262,
        "singular_value_overlap": -0.019354522228240967,
        "subspace_overlap": 0.004902530927211046,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.007980434224009514,
        "activation_cosine_similarity": -0.0016278389375656843,
        "activation_magnitude_ratio": -0.00763744255527854,
        "activation_dot_product": -0.006729804445058107,
        "encoder_gradient_cosine_similarity": -0.0025677853263914585,
        "encoder_gradient_l2_distance": -0.012332107871770859,
        "encoder_gradient_dot_product": -0.004689664579927921,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.020993636921048164,
        "input_gradient_dot_product": -0.00419513788074255
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5160949003075043,
      "val_r": 0.5273506802926412,
      "n_iterations": 399,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.004249352961778641,
        "interaction_matrix_overlap_bottom_k": 0.029796013608574867,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0010111491428688169,
        "task_vector_cosine_similarity": -0.0026182839646935463,
        "task_vector_l2_distance": -0.012520181015133858,
        "task_vector_dot_product": -0.0015849277842789888,
        "weight_space_angle": 0.0020940802060067654,
        "task_vector_magnitude_ratio": -0.005466807167977095,
        "singular_value_overlap": -0.021036451682448387,
        "subspace_overlap": 0.007442502770572901,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.001765526831150055,
        "activation_magnitude_ratio": -0.005946052260696888,
        "activation_dot_product": -0.006677696947008371,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.01266811415553093,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0023650103248655796,
        "input_gradient_l2_distance": -0.021279286593198776,
        "input_gradient_dot_product": -0.009634512476623058
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5217935230689998,
      "val_r": 0.5170272405408263,
      "n_iterations": 300,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004577931482344866,
        "interaction_matrix_overlap_top_k": -0.0026789435651153326,
        "interaction_matrix_overlap_bottom_k": 0.04542727768421173,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0010594443883746862,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.030055886134505272,
        "task_vector_dot_product": 0.0011247212532907724,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.007549887523055077,
        "singular_value_overlap": -0.025544337928295135,
        "subspace_overlap": 0.003289029933512211,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0087269963696599,
        "activation_cosine_similarity": 0.001342222560197115,
        "activation_magnitude_ratio": -0.005399439018219709,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.014062394388020039,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0018111735116690397,
        "input_gradient_l2_distance": -0.025571368634700775,
        "input_gradient_dot_product": -0.009286168962717056
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5332221363382699,
      "val_r": 0.6599632738980735,
      "n_iterations": 258,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0024103557225316763,
        "right_subspace_overlap_bottom_k": 0.001528751803562045,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.03517743572592735,
        "effective_rank": -0.002174559747800231,
        "effective_rank_mergeability_score": 0.0017752563580870628,
        "stable_rank": -0.0015517068095505238,
        "spectral_gap": 0.001639249618165195,
        "singular_value_ratio": -0.0018940182635560632,
        "layerwise_effective_rank": -0.0015607469249516726,
        "layerwise_effective_rank_mergeability_score": 0.0018041995353996754,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.026725424453616142,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0013782830210402608,
        "task_vector_magnitude_ratio": -0.0054378751665353775,
        "singular_value_overlap": -0.02662530727684498,
        "subspace_overlap": 0.0017707271035760641,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0024774731136858463,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0072867851704359055,
        "activation_dot_product": -0.00521989818662405,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.015968579798936844,
        "encoder_gradient_dot_product": -0.0023279967717826366,
        "input_gradient_cosine_similarity": 0.0018183288630098104,
        "input_gradient_l2_distance": -0.026846542954444885,
        "input_gradient_dot_product": -0.008941066451370716
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5228571942107536,
      "val_r": 0.5773101313477232,
      "n_iterations": 255,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0023172739893198013,
        "right_subspace_overlap_bottom_k": 0.004072110168635845,
        "interaction_matrix_overlap_top_k": -0.00203699991106987,
        "interaction_matrix_overlap_bottom_k": 0.04563574492931366,
        "effective_rank": -0.0018331415485590696,
        "effective_rank_mergeability_score": 0.0015514213591814041,
        "stable_rank": -0.001941874623298645,
        "spectral_gap": 0.002033438766375184,
        "singular_value_ratio": -0.0010074053425341845,
        "layerwise_effective_rank": -0.0014756490709260106,
        "layerwise_effective_rank_mergeability_score": 0.0013806632487103343,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.03796462342143059,
        "task_vector_dot_product": 0.0012804262805730104,
        "weight_space_angle": 0.0029117476660758257,
        "task_vector_magnitude_ratio": -0.00954233855009079,
        "singular_value_overlap": -0.03390505164861679,
        "subspace_overlap": 0.009260897524654865,
        "right_subspace_overlap": -0.0013644634746015072,
        "activation_l2_distance": 0.0012803686549887061,
        "activation_cosine_similarity": -0.0024835695512592793,
        "activation_magnitude_ratio": -0.010037289001047611,
        "activation_dot_product": -0.0044958931393921375,
        "encoder_gradient_cosine_similarity": -0.0017973330104723573,
        "encoder_gradient_l2_distance": -0.015958959236741066,
        "encoder_gradient_dot_product": 0.001788097433745861,
        "input_gradient_cosine_similarity": 0.003128360491245985,
        "input_gradient_l2_distance": -0.037928733974695206,
        "input_gradient_dot_product": -0.007233182899653912
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5667041578943568,
      "val_r": 0.37760187492200314,
      "n_iterations": 323,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0019332119263708591,
        "right_subspace_overlap_bottom_k": 0.0021842382848262787,
        "interaction_matrix_overlap_top_k": -0.0011198152787983418,
        "interaction_matrix_overlap_bottom_k": 0.024706553667783737,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0011168336495757103,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010831381659954786,
        "task_vector_l2_distance": -0.019113318994641304,
        "task_vector_dot_product": 0.0014080355176702142,
        "weight_space_angle": 0.001031993655487895,
        "task_vector_magnitude_ratio": -0.005882286000996828,
        "singular_value_overlap": -0.010165202431380749,
        "subspace_overlap": 0.0012828861363232136,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0017603333108127117,
        "activation_cosine_similarity": 0.0015686014667153358,
        "activation_magnitude_ratio": -0.005540624260902405,
        "activation_dot_product": -0.0036963652819395065,
        "encoder_gradient_cosine_similarity": -0.0019522779621183872,
        "encoder_gradient_l2_distance": -0.010910853743553162,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.015020867809653282,
        "input_gradient_dot_product": -0.0054370141588151455
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5594115615431068,
      "val_r": 0.46562127442574086,
      "n_iterations": 353,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.013511640019714832,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.05064597725868225,
        "effective_rank": -0.0022602854296565056,
        "effective_rank_mergeability_score": 0.0017674207920208573,
        "stable_rank": -0.0015952188987284899,
        "spectral_gap": 0.0022759768180549145,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0012183748185634613,
        "layerwise_effective_rank_mergeability_score": 0.0011823336826637387,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.043577276170253754,
        "task_vector_dot_product": 0.001259493874385953,
        "weight_space_angle": 0.002927586203441024,
        "task_vector_magnitude_ratio": -0.005321447737514973,
        "singular_value_overlap": -0.032079536467790604,
        "subspace_overlap": 0.006219078786671162,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.008866984397172928,
        "activation_cosine_similarity": -0.0017944632563740015,
        "activation_magnitude_ratio": -0.010304315015673637,
        "activation_dot_product": 0.0023681458551436663,
        "encoder_gradient_cosine_similarity": 0.004503736272454262,
        "encoder_gradient_l2_distance": -0.012335010804235935,
        "encoder_gradient_dot_product": 0.0016812224639579654,
        "input_gradient_cosine_similarity": 0.001873350003734231,
        "input_gradient_l2_distance": -0.03787010908126831,
        "input_gradient_dot_product": -0.00998497474938631
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5869140401741506,
      "val_r": 0.2790026856033174,
      "n_iterations": 199,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.007525056134909391,
        "interaction_matrix_overlap_top_k": -0.011347697116434574,
        "interaction_matrix_overlap_bottom_k": 0.03464752435684204,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0027237816248089075,
        "layerwise_effective_rank_mergeability_score": 0.002946848515421152,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.019477298483252525,
        "task_vector_dot_product": 0.0011870136950165033,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.002635451266542077,
        "singular_value_overlap": -0.013696659356355667,
        "subspace_overlap": 0.006757482886314392,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.001933180377818644,
        "activation_cosine_similarity": -0.0031888321973383427,
        "activation_magnitude_ratio": -0.005540188401937485,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.001979042310267687,
        "encoder_gradient_l2_distance": -0.007543045561760664,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0036322367377579212,
        "input_gradient_l2_distance": -0.027478713542222977,
        "input_gradient_dot_product": -0.00415414571762085
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7340428511687523,
      "val_r": 0.5340119188901057,
      "n_iterations": 251,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02126951888203621,
        "right_subspace_overlap_bottom_k": -0.001441311789676547,
        "interaction_matrix_overlap_top_k": -0.002203352050855756,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0016440270701423287,
        "singular_value_ratio": 0.001146916882134974,
        "layerwise_effective_rank": -0.010040774941444397,
        "layerwise_effective_rank_mergeability_score": 0.007177793886512518,
        "task_vector_cosine_similarity": -0.006860989611595869,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0037139735650271177,
        "weight_space_angle": 0.004619083367288113,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.00844587292522192,
        "subspace_overlap": -0.0017687028739601374,
        "right_subspace_overlap": 0.007329538464546204,
        "activation_l2_distance": -0.0015975640853866935,
        "activation_cosine_similarity": 0.009437683038413525,
        "activation_magnitude_ratio": -0.0036213649436831474,
        "activation_dot_product": 0.001053058309480548,
        "encoder_gradient_cosine_similarity": 0.0030680415220558643,
        "encoder_gradient_l2_distance": -0.030028576031327248,
        "encoder_gradient_dot_product": 0.0024264648091048002,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.019093384966254234,
        "input_gradient_dot_product": -0.00916232354938984
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5699272405458133,
      "val_r": 0.33130097053738866,
      "n_iterations": 241,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0056770918890833855,
        "right_subspace_overlap_bottom_k": 0.010742605663836002,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.035755522549152374,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0010936502367258072,
        "task_vector_cosine_similarity": 0.001741033629514277,
        "task_vector_l2_distance": -0.028948934748768806,
        "task_vector_dot_product": -0.001848320011049509,
        "weight_space_angle": -0.0033878860995173454,
        "task_vector_magnitude_ratio": -0.00793104525655508,
        "singular_value_overlap": -0.028286410495638847,
        "subspace_overlap": 0.013460924848914146,
        "right_subspace_overlap": -0.004264256916940212,
        "activation_l2_distance": -0.002965926192700863,
        "activation_cosine_similarity": 0.0025879754684865475,
        "activation_magnitude_ratio": -0.004142588935792446,
        "activation_dot_product": -0.0028286210726946592,
        "encoder_gradient_cosine_similarity": 0.0016717216931283474,
        "encoder_gradient_l2_distance": -0.020240504294633865,
        "encoder_gradient_dot_product": 0.0020386194810271263,
        "input_gradient_cosine_similarity": 0.0033674477599561214,
        "input_gradient_l2_distance": -0.034657951444387436,
        "input_gradient_dot_product": -0.007312857545912266
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.3,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}