{
  "aggregate_metrics": {
    "train_r": 0.20681682351991035,
    "train_p": 1.8337289723875815e-32,
    "val_r": -0.06623537928182745,
    "val_p": 0.21121823215719754
  },
  "per_fold_stats": {
    "train_r_mean": 0.4020602173767463,
    "train_r_std": 0.11988676946900144,
    "val_r_mean": 0.3080382326484644,
    "val_r_std": 0.20502155606750072,
    "n_nonzero_mean": 24.75,
    "n_nonzero_std": 1.920286436967152
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0050026485696434975,
    "right_subspace_overlap_bottom_k": 0.005834916140884161,
    "interaction_matrix_overlap_top_k": 0.0036775744520127773,
    "interaction_matrix_overlap_bottom_k": 0.06419934332370758,
    "effective_rank": 0.026529882103204727,
    "effective_rank_mergeability_score": 0.04969625547528267,
    "stable_rank": 0.014260893687605858,
    "spectral_gap": 0.055154889822006226,
    "singular_value_ratio": 0.02664296329021454,
    "layerwise_effective_rank": 0.03246966376900673,
    "layerwise_effective_rank_mergeability_score": 0.030321979895234108,
    "task_vector_cosine_similarity": 0.033555708825588226,
    "task_vector_l2_distance": -0.004642520099878311,
    "task_vector_dot_product": 0.002283920766785741,
    "weight_space_angle": 0.06355614960193634,
    "task_vector_magnitude_ratio": 0.0023139158729463816,
    "singular_value_overlap": -0.004964123945683241,
    "subspace_overlap": 0.0398387536406517,
    "right_subspace_overlap": 0.005033909343183041,
    "activation_l2_distance": 0.009047386236488819,
    "activation_cosine_similarity": 0.006861566100269556,
    "activation_magnitude_ratio": 0.0006721236277371645,
    "activation_dot_product": 0.005115295294672251,
    "encoder_gradient_cosine_similarity": 0.008529935963451862,
    "encoder_gradient_l2_distance": -0.0012927325442433357,
    "encoder_gradient_dot_product": 0.009031449444591999,
    "input_gradient_cosine_similarity": 0.014061744324862957,
    "input_gradient_l2_distance": -0.006346783135086298,
    "input_gradient_dot_product": 0.0013193546328693628
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.00527644157409668,
    "right_subspace_overlap_bottom_k": 0.005057893227785826,
    "interaction_matrix_overlap_top_k": 0.0046028089709579945,
    "interaction_matrix_overlap_bottom_k": 0.04041263833642006,
    "effective_rank": 0.022992722690105438,
    "effective_rank_mergeability_score": 0.027269862592220306,
    "stable_rank": 0.00974889937788248,
    "spectral_gap": 0.01780964806675911,
    "singular_value_ratio": 0.023738563060760498,
    "layerwise_effective_rank": 0.02656368725001812,
    "layerwise_effective_rank_mergeability_score": 0.026137739419937134,
    "task_vector_cosine_similarity": 0.02867422066628933,
    "task_vector_l2_distance": 0.007369569037109613,
    "task_vector_dot_product": 0.003109127515926957,
    "weight_space_angle": 0.021712666377425194,
    "task_vector_magnitude_ratio": 0.003084976226091385,
    "singular_value_overlap": 0.005290892440825701,
    "subspace_overlap": 0.03355112299323082,
    "right_subspace_overlap": 0.005296109244227409,
    "activation_l2_distance": 0.009097130037844181,
    "activation_cosine_similarity": 0.0054947007447481155,
    "activation_magnitude_ratio": 0.00672015268355608,
    "activation_dot_product": 0.006461990997195244,
    "encoder_gradient_cosine_similarity": 0.009647076949477196,
    "encoder_gradient_l2_distance": 0.0035873805172741413,
    "encoder_gradient_dot_product": 0.00725163659080863,
    "input_gradient_cosine_similarity": 0.011053862050175667,
    "input_gradient_l2_distance": 0.007068573962897062,
    "input_gradient_dot_product": 0.004239276517182589
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.75,
    "right_subspace_overlap_bottom_k": 0.9,
    "interaction_matrix_overlap_top_k": 0.7,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 0.9,
    "effective_rank_mergeability_score": 1.0,
    "stable_rank": 0.95,
    "spectral_gap": 1.0,
    "singular_value_ratio": 1.0,
    "layerwise_effective_rank": 1.0,
    "layerwise_effective_rank_mergeability_score": 1.0,
    "task_vector_cosine_similarity": 1.0,
    "task_vector_l2_distance": 0.7,
    "task_vector_dot_product": 0.6,
    "weight_space_angle": 1.0,
    "task_vector_magnitude_ratio": 0.6,
    "singular_value_overlap": 0.8,
    "subspace_overlap": 1.0,
    "right_subspace_overlap": 0.7,
    "activation_l2_distance": 0.95,
    "activation_cosine_similarity": 0.85,
    "activation_magnitude_ratio": 0.7,
    "activation_dot_product": 0.85,
    "encoder_gradient_cosine_similarity": 0.9,
    "encoder_gradient_l2_distance": 0.7,
    "encoder_gradient_dot_product": 0.95,
    "input_gradient_cosine_similarity": 0.95,
    "input_gradient_l2_distance": 0.7,
    "input_gradient_dot_product": 0.65
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3234348499457338,
      "val_r": 0.2247130145938361,
      "n_iterations": 217,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.012105781584978104,
        "interaction_matrix_overlap_top_k": 0.0030521852895617485,
        "interaction_matrix_overlap_bottom_k": 0.09157423675060272,
        "effective_rank": 0.004457312636077404,
        "effective_rank_mergeability_score": 0.029378267005085945,
        "stable_rank": 0.010411798022687435,
        "spectral_gap": 0.07126694917678833,
        "singular_value_ratio": 0.010321298614144325,
        "layerwise_effective_rank": 0.04660293832421303,
        "layerwise_effective_rank_mergeability_score": 0.002659787191078067,
        "task_vector_cosine_similarity": 0.01698037050664425,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.07417549192905426,
        "task_vector_magnitude_ratio": 0.002828029217198491,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.06728126108646393,
        "right_subspace_overlap": -0.001415751175954938,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.002772153355181217,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0050691100768744946,
        "encoder_gradient_cosine_similarity": 0.0024271132424473763,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.010018312372267246,
        "input_gradient_cosine_similarity": 0.006557122804224491,
        "input_gradient_l2_distance": -0.0038260973524302244,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5063520549915409,
      "val_r": 0.4073152951056832,
      "n_iterations": 374,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.001887317281216383,
        "right_subspace_overlap_bottom_k": 0.0032892944291234016,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.02297503501176834,
        "effective_rank": 0.021457819268107414,
        "effective_rank_mergeability_score": 0.052402276545763016,
        "stable_rank": 0.03325341269373894,
        "spectral_gap": 0.07027751207351685,
        "singular_value_ratio": 0.06031401827931404,
        "layerwise_effective_rank": 0.04964178428053856,
        "layerwise_effective_rank_mergeability_score": 0.046685606241226196,
        "task_vector_cosine_similarity": 0.0724324882030487,
        "task_vector_l2_distance": -0.014132550917565823,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.07597047090530396,
        "task_vector_magnitude_ratio": 0.0012874412350356579,
        "singular_value_overlap": -0.014101849868893623,
        "subspace_overlap": 0.0036467788740992546,
        "right_subspace_overlap": 0.003374922089278698,
        "activation_l2_distance": 0.004970336798578501,
        "activation_cosine_similarity": 0.002776562701910734,
        "activation_magnitude_ratio": -0.001985767390578985,
        "activation_dot_product": -0.0013917190954089165,
        "encoder_gradient_cosine_similarity": 0.0010788694489747286,
        "encoder_gradient_l2_distance": -0.006919016595929861,
        "encoder_gradient_dot_product": 0.00308799184858799,
        "input_gradient_cosine_similarity": 0.005165811628103256,
        "input_gradient_l2_distance": -0.017339300364255905,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3040439584951941,
      "val_r": 0.22745240994297783,
      "n_iterations": 276,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009240318089723587,
        "right_subspace_overlap_bottom_k": 0.009684229269623756,
        "interaction_matrix_overlap_top_k": 0.00604553148150444,
        "interaction_matrix_overlap_bottom_k": 0.05985346809029579,
        "effective_rank": 0.02490375190973282,
        "effective_rank_mergeability_score": 0.03555745258927345,
        "stable_rank": 0.02669820748269558,
        "spectral_gap": 0.062099020928144455,
        "singular_value_ratio": 0.014614586718380451,
        "layerwise_effective_rank": 0.001051372499205172,
        "layerwise_effective_rank_mergeability_score": 0.021604740992188454,
        "task_vector_cosine_similarity": 0.005331520456820726,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.06697136163711548,
        "task_vector_magnitude_ratio": 0.010504861362278461,
        "singular_value_overlap": -0.001542209181934595,
        "subspace_overlap": 0.061107248067855835,
        "right_subspace_overlap": 0.00856365729123354,
        "activation_l2_distance": 0.0023748399689793587,
        "activation_cosine_similarity": 0.0024366218131035566,
        "activation_magnitude_ratio": -0.001734964200295508,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.017473220825195312,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.015604173764586449,
        "input_gradient_cosine_similarity": 0.01966654136776924,
        "input_gradient_l2_distance": -0.004335665609687567,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.31016256464529135,
      "val_r": 0.31765456513106793,
      "n_iterations": 367,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.008971421048045158,
        "right_subspace_overlap_bottom_k": 0.005252446513622999,
        "interaction_matrix_overlap_top_k": 0.004304743837565184,
        "interaction_matrix_overlap_bottom_k": 0.1040075346827507,
        "effective_rank": 0.0045882281847298145,
        "effective_rank_mergeability_score": 0.03175710141658783,
        "stable_rank": 0.019804328680038452,
        "spectral_gap": 0.0499516986310482,
        "singular_value_ratio": 0.004011484328657389,
        "layerwise_effective_rank": 0.013139410875737667,
        "layerwise_effective_rank_mergeability_score": 0.01739640161395073,
        "task_vector_cosine_similarity": 0.01262974925339222,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0012931261444464326,
        "weight_space_angle": 0.048817653208971024,
        "task_vector_magnitude_ratio": 0.005295718554407358,
        "singular_value_overlap": -0.004574656952172518,
        "subspace_overlap": 0.06458920985460281,
        "right_subspace_overlap": 0.009590886533260345,
        "activation_l2_distance": 0.04191824421286583,
        "activation_cosine_similarity": 0.016479773446917534,
        "activation_magnitude_ratio": 0.001886219484731555,
        "activation_dot_product": 0.01124405488371849,
        "encoder_gradient_cosine_similarity": 0.010928524658083916,
        "encoder_gradient_l2_distance": -0.0010634582722559571,
        "encoder_gradient_dot_product": 0.01319578941911459,
        "input_gradient_cosine_similarity": 0.031876157969236374,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5570360965370867,
      "val_r": 0.5838090006701524,
      "n_iterations": 760,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004903800319880247,
        "right_subspace_overlap_bottom_k": 0.0018180327024310827,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.021841906011104584,
        "effective_rank": 0.03679506108164787,
        "effective_rank_mergeability_score": 0.03914790228009224,
        "stable_rank": 0.0025956290774047375,
        "spectral_gap": 0.06471437960863113,
        "singular_value_ratio": 0.05822739377617836,
        "layerwise_effective_rank": 0.04926056042313576,
        "layerwise_effective_rank_mergeability_score": 0.051924027502536774,
        "task_vector_cosine_similarity": 0.09222477674484253,
        "task_vector_l2_distance": -0.015972480177879333,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.09814286977052689,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.013685159385204315,
        "subspace_overlap": 0.0013385923812165856,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.004427280277013779,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002715685870498419,
        "activation_dot_product": -0.0023484486155211926,
        "encoder_gradient_cosine_similarity": -0.0015439426060765982,
        "encoder_gradient_l2_distance": -0.004224705044180155,
        "encoder_gradient_dot_product": 0.0036125383339822292,
        "input_gradient_cosine_similarity": 0.0018076575361192226,
        "input_gradient_l2_distance": -0.013345361687242985,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.2970791307057157,
      "val_r": 0.46116854011954006,
      "n_iterations": 258,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0029942835681140423,
        "right_subspace_overlap_bottom_k": 0.001216050935909152,
        "interaction_matrix_overlap_top_k": 0.0018693564925342798,
        "interaction_matrix_overlap_bottom_k": 0.09757205843925476,
        "effective_rank": 0.007005484774708748,
        "effective_rank_mergeability_score": 0.05895364657044411,
        "stable_rank": 0.011580719612538815,
        "spectral_gap": 0.04870785027742386,
        "singular_value_ratio": 0.005213411524891853,
        "layerwise_effective_rank": 0.03585762530565262,
        "layerwise_effective_rank_mergeability_score": 0.004559795372188091,
        "task_vector_cosine_similarity": 0.02555685304105282,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0010621235705912113,
        "weight_space_angle": 0.05343850329518318,
        "task_vector_magnitude_ratio": 0.006027781404554844,
        "singular_value_overlap": -0.0011435332708060741,
        "subspace_overlap": 0.07622770220041275,
        "right_subspace_overlap": 0.0068550193682312965,
        "activation_l2_distance": 0.006181170232594013,
        "activation_cosine_similarity": 0.00982162356376648,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.002186410129070282,
        "encoder_gradient_cosine_similarity": 0.013340622186660767,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.003602496115490794,
        "input_gradient_cosine_similarity": 0.025860536843538284,
        "input_gradient_l2_distance": -0.003108869306743145,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.36052862462933916,
      "val_r": -0.19047123697990567,
      "n_iterations": 220,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012613439466804266,
        "right_subspace_overlap_bottom_k": 0.019421368837356567,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.10714103281497955,
        "effective_rank": 0.009106048382818699,
        "effective_rank_mergeability_score": 0.04194368049502373,
        "stable_rank": 0.016658129170536995,
        "spectral_gap": 0.03908972069621086,
        "singular_value_ratio": 0.005805380642414093,
        "layerwise_effective_rank": 0.0018089241348206997,
        "layerwise_effective_rank_mergeability_score": 0.011528149247169495,
        "task_vector_cosine_similarity": 0.00225519435480237,
        "task_vector_l2_distance": 0.0034855741541832685,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.08066590130329132,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.06282069534063339,
        "right_subspace_overlap": 0.007096030283719301,
        "activation_l2_distance": 0.0025064614601433277,
        "activation_cosine_similarity": 0.01696012355387211,
        "activation_magnitude_ratio": 0.02895294316112995,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.018304258584976196,
        "encoder_gradient_l2_distance": -0.0011679647723212838,
        "encoder_gradient_dot_product": 0.017576206475496292,
        "input_gradient_cosine_similarity": 0.019100243225693703,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": 0.001853608526289463
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.30495282656937817,
      "val_r": 0.32353188974045227,
      "n_iterations": 220,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011304913088679314,
        "right_subspace_overlap_bottom_k": 0.006661118473857641,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.13470561802387238,
        "effective_rank": 0.01803911291062832,
        "effective_rank_mergeability_score": 0.0012207827530801296,
        "stable_rank": 0.010950927622616291,
        "spectral_gap": 0.10125505179166794,
        "singular_value_ratio": 0.012847991660237312,
        "layerwise_effective_rank": 0.0029990561306476593,
        "layerwise_effective_rank_mergeability_score": 0.014093853533267975,
        "task_vector_cosine_similarity": 0.017038246616721153,
        "task_vector_l2_distance": 0.0022872621193528175,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0025441257748752832,
        "task_vector_magnitude_ratio": 0.0013816911960020661,
        "singular_value_overlap": -0.0018726969137787819,
        "subspace_overlap": 0.05444205179810524,
        "right_subspace_overlap": 0.014401545748114586,
        "activation_l2_distance": 0.015719885006546974,
        "activation_cosine_similarity": 0.009402060881257057,
        "activation_magnitude_ratio": 0.0024967254139482975,
        "activation_dot_product": 0.0010216168593615294,
        "encoder_gradient_cosine_similarity": 0.006988592445850372,
        "encoder_gradient_l2_distance": 0.007570573128759861,
        "encoder_gradient_dot_product": 0.006068970076739788,
        "input_gradient_cosine_similarity": 0.020022297278046608,
        "input_gradient_l2_distance": 0.0033267135731875896,
        "input_gradient_dot_product": 0.015221193432807922
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.2884479421618031,
      "val_r": -0.09709731957269038,
      "n_iterations": 285,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004074038937687874,
        "right_subspace_overlap_bottom_k": 0.007204233668744564,
        "interaction_matrix_overlap_top_k": 0.0028495164588093758,
        "interaction_matrix_overlap_bottom_k": 0.08317329734563828,
        "effective_rank": 0.010575196705758572,
        "effective_rank_mergeability_score": 0.05296779051423073,
        "stable_rank": 0.012971463613212109,
        "spectral_gap": 0.031121253967285156,
        "singular_value_ratio": 0.010335765779018402,
        "layerwise_effective_rank": 0.004155052825808525,
        "layerwise_effective_rank_mergeability_score": 0.018960127606987953,
        "task_vector_cosine_similarity": 0.011944541707634926,
        "task_vector_l2_distance": 0.0010641072876751423,
        "task_vector_dot_product": 0.009092269465327263,
        "weight_space_angle": 0.04467841610312462,
        "task_vector_magnitude_ratio": 0.0017658377764746547,
        "singular_value_overlap": 0.002077947836369276,
        "subspace_overlap": 0.06892240047454834,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.01937124878168106,
        "activation_cosine_similarity": 0.017238397151231766,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.004659892991185188,
        "encoder_gradient_cosine_similarity": 0.03754547983407974,
        "encoder_gradient_l2_distance": 0.0029650405049324036,
        "encoder_gradient_dot_product": 0.02316119149327278,
        "input_gradient_cosine_similarity": 0.025677356868982315,
        "input_gradient_l2_distance": 0.0011133492225781083,
        "input_gradient_dot_product": 0.009266708046197891
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.2906153479455351,
      "val_r": 0.2943712262795681,
      "n_iterations": 271,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010208917781710625,
        "right_subspace_overlap_bottom_k": 0.009297299198806286,
        "interaction_matrix_overlap_top_k": 0.015128380618989468,
        "interaction_matrix_overlap_bottom_k": 0.10255273431539536,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.036444973200559616,
        "stable_rank": 0.013604273088276386,
        "spectral_gap": 0.05436825379729271,
        "singular_value_ratio": 0.012876687571406364,
        "layerwise_effective_rank": 0.014603562653064728,
        "layerwise_effective_rank_mergeability_score": 0.007856684736907482,
        "task_vector_cosine_similarity": 0.0143578564748168,
        "task_vector_l2_distance": 0.001190589857287705,
        "task_vector_dot_product": 0.0055854180827736855,
        "weight_space_angle": 0.06998147815465927,
        "task_vector_magnitude_ratio": -0.0011208293726667762,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.07592980563640594,
        "right_subspace_overlap": 0.009888555854558945,
        "activation_l2_distance": 0.0014745327644050121,
        "activation_cosine_similarity": 0.009045174345374107,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.007947883568704128,
        "encoder_gradient_cosine_similarity": 0.0058761839754879475,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.020907077938318253,
        "input_gradient_cosine_similarity": 0.0022248949389904737,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.32453498490917926,
      "val_r": 0.4312108227310043,
      "n_iterations": 272,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009619316086173058,
        "right_subspace_overlap_bottom_k": 0.014005456119775772,
        "interaction_matrix_overlap_top_k": 0.00934008602052927,
        "interaction_matrix_overlap_bottom_k": 0.0682634636759758,
        "effective_rank": 0.010394608601927757,
        "effective_rank_mergeability_score": 0.10407387465238571,
        "stable_rank": 0.0,
        "spectral_gap": 0.03676209971308708,
        "singular_value_ratio": 0.013880248181521893,
        "layerwise_effective_rank": 0.09846631437540054,
        "layerwise_effective_rank_mergeability_score": 0.004541289061307907,
        "task_vector_cosine_similarity": 0.010602984577417374,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.004629894159734249,
        "weight_space_angle": 0.030661607161164284,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.01466003991663456,
        "right_subspace_overlap": 0.002730089705437422,
        "activation_l2_distance": 0.01087195985019207,
        "activation_cosine_similarity": 0.009480404667556286,
        "activation_magnitude_ratio": -0.0016753474483266473,
        "activation_dot_product": 0.013241962529718876,
        "encoder_gradient_cosine_similarity": 0.0014238925650715828,
        "encoder_gradient_l2_distance": -0.002332544419914484,
        "encoder_gradient_dot_product": 0.00406532222405076,
        "input_gradient_cosine_similarity": 0.03191094100475311,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": 0.0028482505585998297
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.47962457721974694,
      "val_r": 0.41575144882486964,
      "n_iterations": 404,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004349709954112768,
        "interaction_matrix_overlap_top_k": -0.0022377921268343925,
        "interaction_matrix_overlap_bottom_k": 0.02208542451262474,
        "effective_rank": 0.04822773486375809,
        "effective_rank_mergeability_score": 0.09229253232479095,
        "stable_rank": 0.022683437913656235,
        "spectral_gap": 0.051397450268268585,
        "singular_value_ratio": 0.03751422464847565,
        "layerwise_effective_rank": 0.0676909014582634,
        "layerwise_effective_rank_mergeability_score": 0.04627424478530884,
        "task_vector_cosine_similarity": 0.05156388878822327,
        "task_vector_l2_distance": -0.016707027330994606,
        "task_vector_dot_product": 0.0052054282277822495,
        "weight_space_angle": 0.06650687009096146,
        "task_vector_magnitude_ratio": 0.001068370882421732,
        "singular_value_overlap": -0.010322016663849354,
        "subspace_overlap": 0.008317001163959503,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.007107316050678492,
        "activation_cosine_similarity": 0.003972445614635944,
        "activation_magnitude_ratio": -0.0021591882687062025,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0017579493578523397,
        "encoder_gradient_l2_distance": -0.0031789850909262896,
        "encoder_gradient_dot_product": 0.0017002332024276257,
        "input_gradient_cosine_similarity": 0.00276566157117486,
        "input_gradient_l2_distance": -0.01182587817311287,
        "input_gradient_dot_product": -0.002640761900693178
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.49283417502784743,
      "val_r": 0.4724309280549316,
      "n_iterations": 423,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.025070233270525932,
        "effective_rank": 0.060015883296728134,
        "effective_rank_mergeability_score": 0.08279780298471451,
        "stable_rank": 0.03089010901749134,
        "spectral_gap": 0.06342441588640213,
        "singular_value_ratio": 0.05090634152293205,
        "layerwise_effective_rank": 0.03706544265151024,
        "layerwise_effective_rank_mergeability_score": 0.03839727118611336,
        "task_vector_cosine_similarity": 0.06508945673704147,
        "task_vector_l2_distance": -0.01259162649512291,
        "task_vector_dot_product": -0.0010337303392589092,
        "weight_space_angle": 0.06273765116930008,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.012714223936200142,
        "subspace_overlap": 0.0023911839816719294,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0075680967420339584,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003523873398080468,
        "activation_dot_product": 0.0015368795720860362,
        "encoder_gradient_cosine_similarity": 0.0011968198232352734,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.004451029933989048,
        "input_gradient_cosine_similarity": 0.006837334018200636,
        "input_gradient_l2_distance": -0.015475133433938026,
        "input_gradient_dot_product": -0.0016597347566857934
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.26786927253104853,
      "val_r": 0.43831991763755984,
      "n_iterations": 477,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.012373083271086216,
        "right_subspace_overlap_bottom_k": 0.005002265330404043,
        "interaction_matrix_overlap_top_k": 0.011106531135737896,
        "interaction_matrix_overlap_bottom_k": 0.09595635533332825,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.05617320537567139,
        "stable_rank": 0.014119816944003105,
        "spectral_gap": 0.04066113010048866,
        "singular_value_ratio": 0.004337072838097811,
        "layerwise_effective_rank": 0.017435628920793533,
        "layerwise_effective_rank_mergeability_score": 0.003313993336632848,
        "task_vector_cosine_similarity": 0.0017888844013214111,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.05947111174464226,
        "task_vector_magnitude_ratio": 0.007630105130374432,
        "singular_value_overlap": -0.0028392933309078217,
        "subspace_overlap": 0.0802265852689743,
        "right_subspace_overlap": 0.00698067294433713,
        "activation_l2_distance": 0.012537820264697075,
        "activation_cosine_similarity": 0.0026464578695595264,
        "activation_magnitude_ratio": 0.0012226359685882926,
        "activation_dot_product": 0.019216204062104225,
        "encoder_gradient_cosine_similarity": 0.022978490218520164,
        "encoder_gradient_l2_distance": 0.003457120154052973,
        "encoder_gradient_dot_product": 0.014284062199294567,
        "input_gradient_cosine_similarity": 0.01740487478673458,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": 0.005060833878815174
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4751272945059014,
      "val_r": 0.5681104634664744,
      "n_iterations": 681,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0020882892422378063,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.016329409554600716,
        "effective_rank": 0.07474885135889053,
        "effective_rank_mergeability_score": 0.08317190408706665,
        "stable_rank": 0.001452677883207798,
        "spectral_gap": 0.0633162260055542,
        "singular_value_ratio": 0.05823477357625961,
        "layerwise_effective_rank": 0.058033592998981476,
        "layerwise_effective_rank_mergeability_score": 0.05667423829436302,
        "task_vector_cosine_similarity": 0.04676862433552742,
        "task_vector_l2_distance": -0.00981929711997509,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.05577229708433151,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.01072001364082098,
        "subspace_overlap": 0.007792133372277021,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.001711905817501247,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003539605997502804,
        "activation_dot_product": -0.0014568404294550419,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.004066281020641327,
        "encoder_gradient_dot_product": 0.0012040629517287016,
        "input_gradient_cosine_similarity": 0.003284706501290202,
        "input_gradient_l2_distance": -0.013846809044480324,
        "input_gradient_dot_product": -0.0012771805049851537
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5316493955534956,
      "val_r": 0.33571292161242405,
      "n_iterations": 456,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0022839016746729612,
        "interaction_matrix_overlap_top_k": 0.0012188879773020744,
        "interaction_matrix_overlap_bottom_k": 0.02012234553694725,
        "effective_rank": 0.06030718609690666,
        "effective_rank_mergeability_score": 0.07771886885166168,
        "stable_rank": 0.00970469694584608,
        "spectral_gap": 0.05812413617968559,
        "singular_value_ratio": 0.05346459522843361,
        "layerwise_effective_rank": 0.05206706374883652,
        "layerwise_effective_rank_mergeability_score": 0.04200845956802368,
        "task_vector_cosine_similarity": 0.06891856342554092,
        "task_vector_l2_distance": -0.0151622723788023,
        "task_vector_dot_product": 0.0013853204436600208,
        "weight_space_angle": 0.07160083204507828,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.006040120497345924,
        "subspace_overlap": 0.0015570592368021607,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.012850149534642696,
        "activation_cosine_similarity": 0.004282104782760143,
        "activation_magnitude_ratio": -0.0035887539852410555,
        "activation_dot_product": 0.002080171834677458,
        "encoder_gradient_cosine_similarity": 0.0010680537670850754,
        "encoder_gradient_l2_distance": -0.002811357844620943,
        "encoder_gradient_dot_product": 0.001842282246798277,
        "input_gradient_cosine_similarity": 0.003347939345985651,
        "input_gradient_l2_distance": -0.011519668623805046,
        "input_gradient_dot_product": -0.0020763122010976076
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.29248938669788566,
      "val_r": 0.2664098703647227,
      "n_iterations": 417,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014905480667948723,
        "right_subspace_overlap_bottom_k": 0.004391595255583525,
        "interaction_matrix_overlap_top_k": 0.008477793075144291,
        "interaction_matrix_overlap_bottom_k": 0.07864594459533691,
        "effective_rank": 0.0079755038022995,
        "effective_rank_mergeability_score": 0.02370840683579445,
        "stable_rank": 0.011631493456661701,
        "spectral_gap": 0.04520896077156067,
        "singular_value_ratio": 0.005626408848911524,
        "layerwise_effective_rank": 0.003824335290119052,
        "layerwise_effective_rank_mergeability_score": 0.004694455768913031,
        "task_vector_cosine_similarity": 0.0026400000788271427,
        "task_vector_l2_distance": -0.002606102265417576,
        "task_vector_dot_product": 0.002019460080191493,
        "weight_space_angle": 0.08624841272830963,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.003883832599967718,
        "subspace_overlap": 0.0998578816652298,
        "right_subspace_overlap": 0.014890080317854881,
        "activation_l2_distance": 0.0070493086241185665,
        "activation_cosine_similarity": 0.008612453937530518,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.020812060683965683,
        "encoder_gradient_cosine_similarity": 0.013568608090281487,
        "encoder_gradient_l2_distance": -0.0026981139089912176,
        "encoder_gradient_dot_product": 0.019612358883023262,
        "input_gradient_cosine_similarity": 0.01663484424352646,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": 0.002961922436952591
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3845796235521117,
      "val_r": -0.03616753092254377,
      "n_iterations": 249,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0010657534003257751,
        "right_subspace_overlap_bottom_k": 0.007417366374284029,
        "interaction_matrix_overlap_top_k": 0.009852616116404533,
        "interaction_matrix_overlap_bottom_k": 0.11164368689060211,
        "effective_rank": 0.026476822793483734,
        "effective_rank_mergeability_score": 0.004187475424259901,
        "stable_rank": 0.028568902984261513,
        "spectral_gap": 0.03170979022979736,
        "singular_value_ratio": 0.0012004534946754575,
        "layerwise_effective_rank": 0.0035597386304289103,
        "layerwise_effective_rank_mergeability_score": 0.08677110821008682,
        "task_vector_cosine_similarity": 0.017523106187582016,
        "task_vector_l2_distance": 0.0014307107776403427,
        "task_vector_dot_product": 0.002687889849767089,
        "weight_space_angle": 0.04965782165527344,
        "task_vector_magnitude_ratio": 0.005587821360677481,
        "singular_value_overlap": -0.002252239268273115,
        "subspace_overlap": 0.04248855635523796,
        "right_subspace_overlap": 0.007257794961333275,
        "activation_l2_distance": 0.012918264605104923,
        "activation_cosine_similarity": 0.011389434337615967,
        "activation_magnitude_ratio": 0.0011371473083272576,
        "activation_dot_product": 0.006966262124478817,
        "encoder_gradient_cosine_similarity": 0.011662304401397705,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.012739129364490509,
        "input_gradient_cosine_similarity": 0.032900117337703705,
        "input_gradient_l2_distance": -0.004182205535471439,
        "input_gradient_dot_product": 0.001621114439330995
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6911544293523026,
      "val_r": 0.5001974589795519,
      "n_iterations": 359,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011462780646979809,
        "right_subspace_overlap_bottom_k": -0.0018214936135336757,
        "interaction_matrix_overlap_top_k": 0.0014494727365672588,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.05021950602531433,
        "effective_rank_mergeability_score": 0.028694629669189453,
        "stable_rank": 0.00132488994859159,
        "spectral_gap": 0.03445211425423622,
        "singular_value_ratio": 0.03769076243042946,
        "layerwise_effective_rank": 0.05404794216156006,
        "layerwise_effective_rank_mergeability_score": 0.09017971903085709,
        "task_vector_cosine_similarity": 0.06826629489660263,
        "task_vector_l2_distance": 0.001069343532435596,
        "task_vector_dot_product": 0.010312303900718689,
        "weight_space_angle": 0.09711143374443054,
        "task_vector_magnitude_ratio": 0.004021492321044207,
        "singular_value_overlap": -0.0021965072955936193,
        "subspace_overlap": 0.0010810114908963442,
        "right_subspace_overlap": 0.012345829978585243,
        "activation_l2_distance": 0.006153657101094723,
        "activation_cosine_similarity": 0.007873660884797573,
        "activation_magnitude_ratio": -0.0013300133869051933,
        "activation_dot_product": 0.007594991475343704,
        "encoder_gradient_cosine_similarity": 0.004523669369518757,
        "encoder_gradient_l2_distance": -0.009721306152641773,
        "encoder_gradient_dot_product": 0.003895784728229046,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.013196360319852829,
        "input_gradient_dot_product": -0.0030927867628633976
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5586878115587891,
      "val_r": 0.21634096718961132,
      "n_iterations": 254,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.00511967996135354,
        "interaction_matrix_overlap_top_k": 0.0010941813234239817,
        "interaction_matrix_overlap_bottom_k": 0.020473098382353783,
        "effective_rank": 0.05530351772904396,
        "effective_rank_mergeability_score": 0.06133255362510681,
        "stable_rank": 0.006312975659966469,
        "spectral_gap": 0.08518984168767929,
        "singular_value_ratio": 0.07543633133172989,
        "layerwise_effective_rank": 0.038081925362348557,
        "layerwise_effective_rank_mergeability_score": 0.036315616220235825,
        "task_vector_cosine_similarity": 0.06720072776079178,
        "task_vector_l2_distance": -0.016386637464165688,
        "task_vector_dot_product": 0.003438910935074091,
        "weight_space_angle": 0.07596874982118607,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.013472088612616062,
        "subspace_overlap": 0.0020979621913284063,
        "right_subspace_overlap": -0.001881149597465992,
        "activation_l2_distance": 0.0032352495472878218,
        "activation_cosine_similarity": 0.0020418688654899597,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.003925414755940437,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0016636503860354424,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.008189854212105274,
        "input_gradient_l2_distance": -0.019374370574951172,
        "input_gradient_dot_product": -0.0016997616039589047
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}