{
  "aggregate_metrics": {
    "train_r": 0.4229345304529925,
    "train_p": 5.26258186418199e-140,
    "val_r": -0.0880221739229809,
    "val_p": 0.09634002949003403
  },
  "per_fold_stats": {
    "train_r_mean": 0.5446837725027,
    "train_r_std": 0.05272028548641055,
    "val_r_mean": 0.4472012323728304,
    "val_r_std": 0.13467487063992079,
    "n_nonzero_mean": 15.6,
    "n_nonzero_std": 3.352610922848042
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 6.552942795678973e-05,
    "right_subspace_overlap_bottom_k": 0.0022824849002063274,
    "interaction_matrix_overlap_top_k": -0.000125858437968418,
    "interaction_matrix_overlap_bottom_k": 0.018964434042572975,
    "effective_rank": -0.00028956783353351057,
    "effective_rank_mergeability_score": 0.0003153859288431704,
    "stable_rank": -0.0002790758153423667,
    "spectral_gap": 0.0005526760360226035,
    "singular_value_ratio": -0.0003730769385583699,
    "layerwise_effective_rank": -0.00045246435911394656,
    "layerwise_effective_rank_mergeability_score": 0.00032660976285114884,
    "task_vector_cosine_similarity": -1.3625865904032253e-05,
    "task_vector_l2_distance": -0.012670865282416344,
    "task_vector_dot_product": -0.00039465673035010695,
    "weight_space_angle": -0.0004812762199435383,
    "task_vector_magnitude_ratio": -0.0021063191816210747,
    "singular_value_overlap": -0.01109122484922409,
    "subspace_overlap": 0.0008735476294532418,
    "right_subspace_overlap": 0.0007022420759312809,
    "activation_l2_distance": -0.0007255393429659307,
    "activation_cosine_similarity": 0.00013696230598725379,
    "activation_magnitude_ratio": -0.0025946972891688347,
    "activation_dot_product": -0.001993908081203699,
    "encoder_gradient_cosine_similarity": 0.00046810711501166224,
    "encoder_gradient_l2_distance": -0.0072061107493937016,
    "encoder_gradient_dot_product": 0.0002226797805633396,
    "input_gradient_cosine_similarity": 0.0006472301320172846,
    "input_gradient_l2_distance": -0.013994483277201653,
    "input_gradient_dot_product": -0.0025119150523096323
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.0014700625324621797,
    "right_subspace_overlap_bottom_k": 0.0031030243262648582,
    "interaction_matrix_overlap_top_k": 0.0015834998339414597,
    "interaction_matrix_overlap_bottom_k": 0.004994598682969809,
    "effective_rank": 0.0005043584387749434,
    "effective_rank_mergeability_score": 0.0006583528593182564,
    "stable_rank": 0.0005742284120060503,
    "spectral_gap": 0.0007848274544812739,
    "singular_value_ratio": 0.0006799512193538249,
    "layerwise_effective_rank": 0.0008582131122238934,
    "layerwise_effective_rank_mergeability_score": 0.0007383339107036591,
    "task_vector_cosine_similarity": 0.0010622214758768678,
    "task_vector_l2_distance": 0.005000103265047073,
    "task_vector_dot_product": 0.001800523605197668,
    "weight_space_angle": 0.0013269133633002639,
    "task_vector_magnitude_ratio": 0.000998556730337441,
    "singular_value_overlap": 0.002995614428073168,
    "subspace_overlap": 0.0015844128793105483,
    "right_subspace_overlap": 0.0017606657929718494,
    "activation_l2_distance": 0.0032864955719560385,
    "activation_cosine_similarity": 0.0016776449047029018,
    "activation_magnitude_ratio": 0.0010854477295652032,
    "activation_dot_product": 0.002524887677282095,
    "encoder_gradient_cosine_similarity": 0.0009654632303863764,
    "encoder_gradient_l2_distance": 0.005611919332295656,
    "encoder_gradient_dot_product": 0.0013024749932810664,
    "input_gradient_cosine_similarity": 0.0011322472710162401,
    "input_gradient_l2_distance": 0.006393385585397482,
    "input_gradient_dot_product": 0.0022833894472569227
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.45,
    "right_subspace_overlap_bottom_k": 0.75,
    "interaction_matrix_overlap_top_k": 0.45,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.25,
    "effective_rank_mergeability_score": 0.2,
    "stable_rank": 0.2,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.25,
    "layerwise_effective_rank": 0.25,
    "layerwise_effective_rank_mergeability_score": 0.2,
    "task_vector_cosine_similarity": 0.4,
    "task_vector_l2_distance": 0.95,
    "task_vector_dot_product": 0.4,
    "weight_space_angle": 0.4,
    "task_vector_magnitude_ratio": 0.9,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.35,
    "right_subspace_overlap": 0.4,
    "activation_l2_distance": 0.4,
    "activation_cosine_similarity": 0.25,
    "activation_magnitude_ratio": 0.95,
    "activation_dot_product": 0.6,
    "encoder_gradient_cosine_similarity": 0.5,
    "encoder_gradient_l2_distance": 0.95,
    "encoder_gradient_dot_product": 0.35,
    "input_gradient_cosine_similarity": 0.6,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.85
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5984624886034957,
      "val_r": 0.5852707796854559,
      "n_iterations": 229,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0014381272485479712,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.01577678509056568,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0022318800911307335,
        "task_vector_l2_distance": -0.009619096294045448,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0030038238037377596,
        "singular_value_overlap": -0.0115586519241333,
        "subspace_overlap": 0.003089148085564375,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003741474822163582,
        "activation_dot_product": -0.00449453154578805,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0057722777128219604,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.008563513867557049,
        "input_gradient_dot_product": -0.002137810690328479
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5507345099646073,
      "val_r": 0.45167722377696917,
      "n_iterations": 279,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0011070913169533014,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.020043691620230675,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0016062305076047778,
        "stable_rank": 0.0,
        "spectral_gap": 0.0010552393505349755,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010855383239686489,
        "task_vector_dot_product": 0.0012525105848908424,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0030730199068784714,
        "singular_value_overlap": -0.007556232623755932,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0023737361188977957,
        "activation_l2_distance": 0.0010407654335722327,
        "activation_cosine_similarity": 0.0010346666676923633,
        "activation_magnitude_ratio": -0.002030535601079464,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.007805325090885162,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.001657809130847454,
        "input_gradient_l2_distance": -0.010549671947956085,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5350124878764876,
      "val_r": 0.4734727476921665,
      "n_iterations": 234,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0029410962015390396,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.017254849895834923,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0015587566886097193,
        "task_vector_l2_distance": -0.013245494104921818,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0015584651846438646,
        "singular_value_overlap": -0.011879872530698776,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0032596811652183533,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002964272163808346,
        "activation_dot_product": -0.001548245083540678,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.005555889569222927,
        "encoder_gradient_dot_product": -0.001822206424549222,
        "input_gradient_cosine_similarity": 0.0012905977200716734,
        "input_gradient_l2_distance": -0.01207603607326746,
        "input_gradient_dot_product": -0.0019435224821791053
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5523572302846307,
      "val_r": 0.5141149891820217,
      "n_iterations": 318,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.003426416777074337,
        "interaction_matrix_overlap_top_k": 0.0011154416715726256,
        "interaction_matrix_overlap_bottom_k": 0.017352893948554993,
        "effective_rank": -0.0010910083074122667,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0010500943753868341,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0012323603732511401,
        "task_vector_l2_distance": -0.01165380235761404,
        "task_vector_dot_product": 0.0013758381828665733,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001953958533704281,
        "singular_value_overlap": -0.012031862512230873,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0036610602401196957,
        "activation_dot_product": -0.003284701146185398,
        "encoder_gradient_cosine_similarity": -0.0012681677471846342,
        "encoder_gradient_l2_distance": -0.004441739059984684,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.001685662311501801,
        "input_gradient_l2_distance": -0.011261435225605965,
        "input_gradient_dot_product": -0.0033816820941865444
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5708241074038031,
      "val_r": 0.5951013632915878,
      "n_iterations": 243,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012091738171875477,
        "right_subspace_overlap_bottom_k": 0.0030588367953896523,
        "interaction_matrix_overlap_top_k": 0.00194265425670892,
        "interaction_matrix_overlap_bottom_k": 0.02552112750709057,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0014485931023955345,
        "singular_value_ratio": -0.0010427285451442003,
        "layerwise_effective_rank": -0.0010899277403950691,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0013668397441506386,
        "task_vector_l2_distance": -0.020691031590104103,
        "task_vector_dot_product": -0.0032377205789089203,
        "weight_space_angle": -0.0012811279157176614,
        "task_vector_magnitude_ratio": -0.002033067401498556,
        "singular_value_overlap": -0.016274508088827133,
        "subspace_overlap": -0.0010156265925616026,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0020964238792657852,
        "activation_dot_product": -0.004218418151140213,
        "encoder_gradient_cosine_similarity": 0.0012201754143461585,
        "encoder_gradient_l2_distance": -0.004976240452378988,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.016778698191046715,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5257096412068283,
      "val_r": 0.6965171659214692,
      "n_iterations": 301,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.003384063486009836,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.022228214889764786,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0013943712692707777,
        "task_vector_l2_distance": -0.013342232443392277,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0023561534471809864,
        "singular_value_overlap": -0.013659429736435413,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.001089025754481554,
        "activation_l2_distance": -0.002182080876082182,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002557947300374508,
        "activation_dot_product": -0.0031952240969985723,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.006282821297645569,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0021890331991016865,
        "input_gradient_l2_distance": -0.01230686902999878,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5525768067041729,
      "val_r": 0.24657392384193688,
      "n_iterations": 321,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0010649290634319186,
        "right_subspace_overlap_bottom_k": 0.006503187119960785,
        "interaction_matrix_overlap_top_k": -0.0019224865827709436,
        "interaction_matrix_overlap_bottom_k": 0.02238009311258793,
        "effective_rank": -0.0013025305233895779,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0020066520664840937,
        "singular_value_ratio": -0.0020946403965353966,
        "layerwise_effective_rank": -0.002138781826943159,
        "layerwise_effective_rank_mergeability_score": 0.001417043269611895,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.016403021290898323,
        "task_vector_dot_product": -0.005198238417506218,
        "weight_space_angle": 0.0022673048079013824,
        "task_vector_magnitude_ratio": -0.002549689495936036,
        "singular_value_overlap": -0.01655854843556881,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.003445724956691265,
        "activation_cosine_similarity": 0.0014984223525971174,
        "activation_magnitude_ratio": -0.001776242977939546,
        "activation_dot_product": -0.010769030079245567,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.012777618132531643,
        "encoder_gradient_dot_product": 0.00249113654717803,
        "input_gradient_cosine_similarity": -0.0020597197581082582,
        "input_gradient_l2_distance": -0.018921438604593277,
        "input_gradient_dot_product": -0.002296565566211939
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5277414561588265,
      "val_r": 0.3883309783984004,
      "n_iterations": 189,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.001449286355637014,
        "interaction_matrix_overlap_top_k": -0.003372735809534788,
        "interaction_matrix_overlap_bottom_k": 0.023899590596556664,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0013096937909722328,
        "spectral_gap": 0.0015864279121160507,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012329088523983955,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0032918488141149282,
        "singular_value_overlap": -0.01094839908182621,
        "subspace_overlap": 0.0012138914316892624,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003398518543690443,
        "activation_dot_product": -0.0023327942471951246,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.00523685896769166,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0061825113371014595,
        "input_gradient_dot_product": -0.0016045646043494344
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5351060054548051,
      "val_r": 0.39513481755547275,
      "n_iterations": 250,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.0017021982930600643,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.020674221217632294,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0022277701646089554,
        "stable_rank": 0.0,
        "spectral_gap": 0.001089185243472457,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0011633741669356823,
        "task_vector_cosine_similarity": -0.0015672000590711832,
        "task_vector_l2_distance": -0.007976889610290527,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0024591556284576654,
        "task_vector_magnitude_ratio": -0.0012200034689158201,
        "singular_value_overlap": -0.008226889185607433,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0017398596974089742,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.001615991466678679,
        "encoder_gradient_l2_distance": -0.005447461269795895,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.001363264280371368,
        "input_gradient_l2_distance": -0.00952247716486454,
        "input_gradient_dot_product": -0.0027236510068178177
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.56711061846266,
      "val_r": 0.1755846333171502,
      "n_iterations": 328,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0015877539990469813,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.018468273803591728,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012182325590401888,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010098416823893785,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01284770481288433,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0026327483355998993,
        "singular_value_overlap": -0.01206082385033369,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0010976267512887716,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.0018832720816135406,
        "activation_magnitude_ratio": -0.003323041135445237,
        "activation_dot_product": -0.0017477403162047267,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.005412775091826916,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.012251491658389568,
        "input_gradient_dot_product": -0.001264780294150114
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.47720659168573176,
      "val_r": 0.3088082983729836,
      "n_iterations": 433,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004203435964882374,
        "interaction_matrix_overlap_top_k": -0.00110324053093791,
        "interaction_matrix_overlap_bottom_k": 0.015336010605096817,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010317753069102764,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.001397250802256167,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.00807985384017229,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0027410676702857018,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.006698683835566044,
        "encoder_gradient_dot_product": 0.0013536084443330765,
        "input_gradient_cosine_similarity": 0.0017515176441520452,
        "input_gradient_l2_distance": -0.00844768900424242,
        "input_gradient_dot_product": -0.0016930440906435251
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5169677771677631,
      "val_r": 0.5192806448708999,
      "n_iterations": 347,
      "n_nonzero_coefficients": 11,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.020127054303884506,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.011425885371863842,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0016076158499345183,
        "singular_value_overlap": -0.011100009083747864,
        "subspace_overlap": 0.003186162794008851,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0021799455862492323,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0030756695196032524,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.001267787185497582,
        "encoder_gradient_l2_distance": -0.005985839758068323,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.012938723899424076,
        "input_gradient_dot_product": -0.0024285325780510902
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5119461705363894,
      "val_r": 0.5255933366816106,
      "n_iterations": 408,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0011153401574119925,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.01683555729687214,
        "effective_rank": -0.0012644871603697538,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010545613477006555,
        "task_vector_l2_distance": -0.011971622705459595,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.003126151394098997,
        "singular_value_overlap": -0.010248998180031776,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0013522951630875468,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.001529501168988645,
        "encoder_gradient_l2_distance": -0.004374487325549126,
        "encoder_gradient_dot_product": -0.0016332913655787706,
        "input_gradient_cosine_similarity": 0.0015230237040668726,
        "input_gradient_l2_distance": -0.010959535837173462,
        "input_gradient_dot_product": -0.004412577487528324
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4302571207169676,
      "val_r": 0.5237598468849746,
      "n_iterations": 307,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003546022344380617,
        "right_subspace_overlap_bottom_k": 0.0031581528019160032,
        "interaction_matrix_overlap_top_k": 0.001408232725225389,
        "interaction_matrix_overlap_bottom_k": 0.017587922513484955,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0013541547814384103,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0025019075255841017,
        "task_vector_l2_distance": -0.008486184291541576,
        "task_vector_dot_product": 0.002355222124606371,
        "weight_space_angle": -0.0032818333711475134,
        "task_vector_magnitude_ratio": -0.002054717391729355,
        "singular_value_overlap": -0.006253937259316444,
        "subspace_overlap": 0.0025185521226376295,
        "right_subspace_overlap": 0.0024793411139398813,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0013093962334096432,
        "activation_dot_product": -0.0010847561061382294,
        "encoder_gradient_cosine_similarity": 0.0027072099037468433,
        "encoder_gradient_l2_distance": -0.008186860010027885,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0014802315272390842,
        "input_gradient_l2_distance": -0.012508882209658623,
        "input_gradient_dot_product": -0.011143351905047894
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.48810923896126734,
      "val_r": 0.5437359399986808,
      "n_iterations": 368,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.003903299570083618,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.017176367342472076,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.016214832663536072,
        "task_vector_dot_product": -0.004307907074689865,
        "weight_space_angle": -0.0011252772528678179,
        "task_vector_magnitude_ratio": -0.0021495455875992775,
        "singular_value_overlap": -0.01554578822106123,
        "subspace_overlap": 0.004939825274050236,
        "right_subspace_overlap": 0.0027221606578677893,
        "activation_l2_distance": -0.004161341581493616,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002906988374888897,
        "activation_dot_product": -0.0017216817941516638,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.00839540921151638,
        "encoder_gradient_dot_product": -0.001689306227490306,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01679784059524536,
        "input_gradient_dot_product": -0.0027049179188907146
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5508619943793118,
      "val_r": 0.4013676940837619,
      "n_iterations": 384,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.001608472433872521,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.019609127193689346,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.016579635441303253,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.002390575595200062,
        "singular_value_overlap": -0.00858575664460659,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0019923921208828688,
        "activation_l2_distance": -0.0010713416850194335,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.005197542253881693,
        "activation_dot_product": -0.0037386626936495304,
        "encoder_gradient_cosine_similarity": 0.0010521163931116462,
        "encoder_gradient_l2_distance": -0.008018243126571178,
        "encoder_gradient_dot_product": 0.0020141489803791046,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.013926360756158829,
        "input_gradient_dot_product": -0.0033450969494879246
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5517792818319422,
      "val_r": 0.49588252050391185,
      "n_iterations": 353,
      "n_nonzero_coefficients": 11,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0010411972180008888,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.014196068979799747,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0014032311737537384,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009156021289527416,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010920872446149588,
        "task_vector_magnitude_ratio": -0.0013156443601474166,
        "singular_value_overlap": -0.00791970081627369,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002389767440035939,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0038520474918186665,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.007561051286756992,
        "input_gradient_dot_product": -0.0012834734516218305
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5782033234843059,
      "val_r": 0.21701777119502325,
      "n_iterations": 192,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0023376040626317263,
        "right_subspace_overlap_bottom_k": 0.012536398135125637,
        "interaction_matrix_overlap_top_k": -0.0024718933273106813,
        "interaction_matrix_overlap_bottom_k": 0.029811635613441467,
        "effective_rank": -0.001026809448376298,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0019081333884969354,
        "spectral_gap": 0.0018707062117755413,
        "singular_value_ratio": -0.0010904375230893493,
        "layerwise_effective_rank": -0.001846124418079853,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.025020744651556015,
        "task_vector_dot_product": 0.0011320380726829171,
        "weight_space_angle": -0.003440272295847535,
        "task_vector_magnitude_ratio": -0.001680090557783842,
        "singular_value_overlap": -0.0139318173751235,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.005564758088439703,
        "activation_cosine_similarity": -0.003834816161543131,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.0017423788085579872,
        "encoder_gradient_cosine_similarity": 0.001090198871679604,
        "encoder_gradient_l2_distance": 0.0,
        "encoder_gradient_dot_product": 0.003739505773410201,
        "input_gradient_cosine_similarity": 0.0021431788336485624,
        "input_gradient_l2_distance": -0.030311817303299904,
        "input_gradient_dot_product": -0.002100628102198243
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7064033441266103,
      "val_r": 0.5681030280308375,
      "n_iterations": 360,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002624868182465434,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.004048763308674097,
        "interaction_matrix_overlap_bottom_k": 0.00411337660625577,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0010704864980652928,
        "stable_rank": -0.001145456568337977,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002924358006566763,
        "layerwise_effective_rank_mergeability_score": 0.002941936021670699,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.007309289183467627,
        "subspace_overlap": 0.003538999240845442,
        "right_subspace_overlap": 0.00597360311076045,
        "activation_l2_distance": -0.012435766868293285,
        "activation_cosine_similarity": 0.0059242453426122665,
        "activation_magnitude_ratio": -0.0033802823163568974,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0016118725761771202,
        "encoder_gradient_l2_distance": -0.02937040664255619,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0016361558809876442,
        "input_gradient_l2_distance": -0.030590400099754333,
        "input_gradient_dot_product": -0.0025904125068336725
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5663052550433917,
      "val_r": 0.3186969441712954,
      "n_iterations": 275,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0033771039452403784,
        "right_subspace_overlap_bottom_k": 0.0013747295597568154,
        "interaction_matrix_overlap_top_k": -0.002161904703825712,
        "interaction_matrix_overlap_bottom_k": 0.020895833149552345,
        "effective_rank": -0.001106521114706993,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0019967155531048775,
        "singular_value_ratio": -0.001879577524960041,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01528088841587305,
        "task_vector_dot_product": -0.0012648776173591614,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004129265435039997,
        "singular_value_overlap": -0.012094134464859962,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002251556608825922,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0010710316710174084,
        "encoder_gradient_l2_distance": -0.005531218834221363,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0010103760287165642,
        "input_gradient_l2_distance": -0.01743323728442192,
        "input_gradient_dot_product": -0.003183686872944236
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.0,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}