{
  "aggregate_metrics": {
    "train_r": 0.5136176975362746,
    "train_p": 1.9826254112934166e-216,
    "val_r": 0.2806640519184891,
    "val_p": 6.635287004186968e-08
  },
  "per_fold_stats": {
    "train_r_mean": 0.7552994809918221,
    "train_r_std": 0.040983991659465105,
    "val_r_mean": 0.6263238358279405,
    "val_r_std": 0.16764940520451446,
    "n_nonzero_mean": 23.75,
    "n_nonzero_std": 4.085033659592048
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.02614269219338894,
    "right_subspace_overlap_bottom_k": -0.06519121676683426,
    "interaction_matrix_overlap_top_k": 0.0014574499800801277,
    "interaction_matrix_overlap_bottom_k": 0.02519049122929573,
    "effective_rank": -0.001100545865483582,
    "effective_rank_mergeability_score": 0.0010268473997712135,
    "stable_rank": -0.002752876142039895,
    "spectral_gap": 0.0005758834886364639,
    "singular_value_ratio": -0.0005722002242691815,
    "layerwise_effective_rank": -0.005257123149931431,
    "layerwise_effective_rank_mergeability_score": 0.004965951666235924,
    "task_vector_cosine_similarity": -0.0005221606115810573,
    "task_vector_l2_distance": -0.01453630905598402,
    "task_vector_dot_product": -0.0012456985423341393,
    "weight_space_angle": -8.390508446609601e-05,
    "task_vector_magnitude_ratio": -0.002123479964211583,
    "singular_value_overlap": 0.0011224301997572184,
    "subspace_overlap": 0.0027066455222666264,
    "right_subspace_overlap": 0.024000700563192368,
    "activation_l2_distance": -0.0035514694172888994,
    "activation_cosine_similarity": 0.03996554762125015,
    "activation_magnitude_ratio": -0.010531645268201828,
    "activation_dot_product": 0.018158668652176857,
    "encoder_gradient_cosine_similarity": 0.012641352601349354,
    "encoder_gradient_l2_distance": -0.08846522867679596,
    "encoder_gradient_dot_product": 0.005914599634706974,
    "input_gradient_cosine_similarity": 0.004979727324098349,
    "input_gradient_l2_distance": -0.06751187145709991,
    "input_gradient_dot_product": -0.022342301905155182
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.014460334554314613,
    "right_subspace_overlap_bottom_k": 0.02796490490436554,
    "interaction_matrix_overlap_top_k": 0.009935401380062103,
    "interaction_matrix_overlap_bottom_k": 0.028310995548963547,
    "effective_rank": 0.0036985131446272135,
    "effective_rank_mergeability_score": 0.0037176483310759068,
    "stable_rank": 0.00404495419934392,
    "spectral_gap": 0.0031851481180638075,
    "singular_value_ratio": 0.00326457223854959,
    "layerwise_effective_rank": 0.005326064303517342,
    "layerwise_effective_rank_mergeability_score": 0.004898867104202509,
    "task_vector_cosine_similarity": 0.011718063615262508,
    "task_vector_l2_distance": 0.016348131000995636,
    "task_vector_dot_product": 0.008321672677993774,
    "weight_space_angle": 0.01042709406465292,
    "task_vector_magnitude_ratio": 0.0032441476359963417,
    "singular_value_overlap": 0.006059568375349045,
    "subspace_overlap": 0.010242149233818054,
    "right_subspace_overlap": 0.014824566431343555,
    "activation_l2_distance": 0.013335608877241611,
    "activation_cosine_similarity": 0.02013869397342205,
    "activation_magnitude_ratio": 0.010919869877398014,
    "activation_dot_product": 0.040092989802360535,
    "encoder_gradient_cosine_similarity": 0.008577995002269745,
    "encoder_gradient_l2_distance": 0.04789772257208824,
    "encoder_gradient_dot_product": 0.009363388642668724,
    "input_gradient_cosine_similarity": 0.005748338531702757,
    "input_gradient_l2_distance": 0.05199272558093071,
    "input_gradient_dot_product": 0.023557323962450027
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 1.0,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.85,
    "interaction_matrix_overlap_bottom_k": 0.9,
    "effective_rank": 0.6,
    "effective_rank_mergeability_score": 0.6,
    "stable_rank": 0.5,
    "spectral_gap": 0.55,
    "singular_value_ratio": 0.5,
    "layerwise_effective_rank": 0.75,
    "layerwise_effective_rank_mergeability_score": 0.8,
    "task_vector_cosine_similarity": 0.75,
    "task_vector_l2_distance": 0.8,
    "task_vector_dot_product": 1.0,
    "weight_space_angle": 0.85,
    "task_vector_magnitude_ratio": 0.75,
    "singular_value_overlap": 0.65,
    "subspace_overlap": 0.75,
    "right_subspace_overlap": 1.0,
    "activation_l2_distance": 0.8,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.85,
    "activation_dot_product": 0.85,
    "encoder_gradient_cosine_similarity": 1.0,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.75,
    "input_gradient_cosine_similarity": 0.9,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 1.0
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7776065308397994,
      "val_r": 0.6513681151841857,
      "n_iterations": 261,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.016489706933498383,
        "right_subspace_overlap_bottom_k": -0.06836588680744171,
        "interaction_matrix_overlap_top_k": -0.004583640489727259,
        "interaction_matrix_overlap_bottom_k": 0.05946151167154312,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.01049492135643959,
        "weight_space_angle": -0.0027669533155858517,
        "task_vector_magnitude_ratio": -0.003988294396549463,
        "singular_value_overlap": -0.004805846605449915,
        "subspace_overlap": 0.0015705910045653582,
        "right_subspace_overlap": 0.005917066242545843,
        "activation_l2_distance": 0.008604173548519611,
        "activation_cosine_similarity": 0.03376626595854759,
        "activation_magnitude_ratio": -0.0048722452484071255,
        "activation_dot_product": -0.011535524390637875,
        "encoder_gradient_cosine_similarity": 0.0022052840795367956,
        "encoder_gradient_l2_distance": -0.02509288489818573,
        "encoder_gradient_dot_product": 0.0014106581220403314,
        "input_gradient_cosine_similarity": 0.003751227166503668,
        "input_gradient_l2_distance": -0.018698979169130325,
        "input_gradient_dot_product": -0.00694934232160449
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6686818838354203,
      "val_r": 0.7458696271621358,
      "n_iterations": 336,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04709790647029877,
        "right_subspace_overlap_bottom_k": -0.10956456512212753,
        "interaction_matrix_overlap_top_k": 0.027517901733517647,
        "interaction_matrix_overlap_bottom_k": -0.014445317909121513,
        "effective_rank": -0.01046446617692709,
        "effective_rank_mergeability_score": 0.009951958432793617,
        "stable_rank": -0.013221104629337788,
        "spectral_gap": 0.010092781856656075,
        "singular_value_ratio": -0.009768461808562279,
        "layerwise_effective_rank": -0.015757013112306595,
        "layerwise_effective_rank_mergeability_score": 0.015876544639468193,
        "task_vector_cosine_similarity": 0.03309626504778862,
        "task_vector_l2_distance": -0.024327008053660393,
        "task_vector_dot_product": 0.021525129675865173,
        "weight_space_angle": -0.031588997691869736,
        "task_vector_magnitude_ratio": -0.009629888460040092,
        "singular_value_overlap": 0.019199734553694725,
        "subspace_overlap": 0.02502933330833912,
        "right_subspace_overlap": 0.03704699128866196,
        "activation_l2_distance": -0.01593668945133686,
        "activation_cosine_similarity": 0.07916751503944397,
        "activation_magnitude_ratio": -0.043810464441776276,
        "activation_dot_product": 0.1354008913040161,
        "encoder_gradient_cosine_similarity": 0.022565651684999466,
        "encoder_gradient_l2_distance": -0.1477605551481247,
        "encoder_gradient_dot_product": 0.034149304032325745,
        "input_gradient_cosine_similarity": 0.005772619973868132,
        "input_gradient_l2_distance": -0.17483386397361755,
        "input_gradient_dot_product": -0.06669319421052933
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6860644946680847,
      "val_r": 0.657835370044287,
      "n_iterations": 374,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.023817429319024086,
        "right_subspace_overlap_bottom_k": -0.045234791934490204,
        "interaction_matrix_overlap_top_k": 0.008929379284381866,
        "interaction_matrix_overlap_bottom_k": 0.005825758911669254,
        "effective_rank": 0.004269677679985762,
        "effective_rank_mergeability_score": -0.00462503544986248,
        "stable_rank": 0.0,
        "spectral_gap": -0.0023762427736073732,
        "singular_value_ratio": 0.0032932725735008717,
        "layerwise_effective_rank": -0.0028434554114937782,
        "layerwise_effective_rank_mergeability_score": 0.0034552770666778088,
        "task_vector_cosine_similarity": 0.01394062303006649,
        "task_vector_l2_distance": -0.004013349302113056,
        "task_vector_dot_product": 0.013612144626677036,
        "weight_space_angle": -0.012972990050911903,
        "task_vector_magnitude_ratio": 0.0024889425840228796,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.010281329043209553,
        "right_subspace_overlap": 0.027969608083367348,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.027372682467103004,
        "activation_magnitude_ratio": -0.01661415584385395,
        "activation_dot_product": 0.0434751883149147,
        "encoder_gradient_cosine_similarity": 0.01349618099629879,
        "encoder_gradient_l2_distance": -0.06246650218963623,
        "encoder_gradient_dot_product": 0.012020021677017212,
        "input_gradient_cosine_similarity": 0.01848859339952469,
        "input_gradient_l2_distance": -0.06189430505037308,
        "input_gradient_dot_product": -0.04812796786427498
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7103873978474852,
      "val_r": 0.6814323605323063,
      "n_iterations": 340,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04434492066502571,
        "right_subspace_overlap_bottom_k": -0.08083301782608032,
        "interaction_matrix_overlap_top_k": 0.018916094675660133,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": -0.005481152329593897,
        "effective_rank_mergeability_score": 0.005421030800789595,
        "stable_rank": -0.00696607306599617,
        "spectral_gap": 0.0020579963456839323,
        "singular_value_ratio": -0.002464770805090666,
        "layerwise_effective_rank": -0.011320111341774464,
        "layerwise_effective_rank_mergeability_score": 0.012750174850225449,
        "task_vector_cosine_similarity": 0.009755585342645645,
        "task_vector_l2_distance": -0.015235042199492455,
        "task_vector_dot_product": 0.010297924280166626,
        "weight_space_angle": -0.012051456607878208,
        "task_vector_magnitude_ratio": -0.0038579627871513367,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.017986947670578957,
        "right_subspace_overlap": 0.027452990412712097,
        "activation_l2_distance": -0.00910128466784954,
        "activation_cosine_similarity": 0.05067197605967522,
        "activation_magnitude_ratio": -0.032673317939043045,
        "activation_dot_product": 0.07797358930110931,
        "encoder_gradient_cosine_similarity": 0.02918861247599125,
        "encoder_gradient_l2_distance": -0.1115749329328537,
        "encoder_gradient_dot_product": 0.021785562857985497,
        "input_gradient_cosine_similarity": 0.009599638171494007,
        "input_gradient_l2_distance": -0.12424290925264359,
        "input_gradient_dot_product": -0.07996535301208496
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7529060522522868,
      "val_r": 0.7911049472203836,
      "n_iterations": 244,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.024968139827251434,
        "right_subspace_overlap_bottom_k": -0.0724879801273346,
        "interaction_matrix_overlap_top_k": -0.005959411151707172,
        "interaction_matrix_overlap_bottom_k": 0.03750498965382576,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0015629276167601347,
        "singular_value_ratio": -0.0010714249219745398,
        "layerwise_effective_rank": -0.0016230414621531963,
        "layerwise_effective_rank_mergeability_score": 0.0016578033100813627,
        "task_vector_cosine_similarity": -0.003405152354389429,
        "task_vector_l2_distance": -0.020022636279463768,
        "task_vector_dot_product": -0.008236061781644821,
        "weight_space_angle": 0.0034227431751787663,
        "task_vector_magnitude_ratio": -0.0027453883085399866,
        "singular_value_overlap": -0.004708599764853716,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0432722344994545,
        "activation_l2_distance": -0.0048295557498931885,
        "activation_cosine_similarity": 0.055420659482479095,
        "activation_magnitude_ratio": -0.010515935719013214,
        "activation_dot_product": -0.002799175912514329,
        "encoder_gradient_cosine_similarity": 0.013421274721622467,
        "encoder_gradient_l2_distance": -0.11812543123960495,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.009977259673178196,
        "input_gradient_l2_distance": -0.06542235612869263,
        "input_gradient_dot_product": -0.01884566806256771
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7672407833578956,
      "val_r": 0.694737948808521,
      "n_iterations": 344,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010956971906125546,
        "right_subspace_overlap_bottom_k": -0.02134905569255352,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.002760514384135604,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002617676043882966,
        "layerwise_effective_rank_mergeability_score": 0.0033272334840148687,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.011148146353662014,
        "task_vector_dot_product": -0.001641467330045998,
        "weight_space_angle": 0.0011698086746037006,
        "task_vector_magnitude_ratio": -0.007088972255587578,
        "singular_value_overlap": -0.001970464363694191,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.01896452158689499,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.03716270625591278,
        "activation_magnitude_ratio": -0.007629943545907736,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.011657814495265484,
        "encoder_gradient_l2_distance": -0.05849822610616684,
        "encoder_gradient_dot_product": 0.0034789785277098417,
        "input_gradient_cosine_similarity": 0.002341381972655654,
        "input_gradient_l2_distance": -0.022054314613342285,
        "input_gradient_dot_product": -0.015032432042062283
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7593474669132819,
      "val_r": 0.47405652992604125,
      "n_iterations": 199,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02914358675479889,
        "right_subspace_overlap_bottom_k": -0.05130339786410332,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.010534006170928478,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0017954312497749925,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.00896418560296297,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001427006209269166,
        "singular_value_overlap": 0.001791550312191248,
        "subspace_overlap": -0.005111257079988718,
        "right_subspace_overlap": 0.014885197393596172,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.04879432171583176,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.00824789609760046,
        "encoder_gradient_cosine_similarity": 0.013881823979318142,
        "encoder_gradient_l2_distance": -0.08276195079088211,
        "encoder_gradient_dot_product": 0.005944330245256424,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0346544124186039,
        "input_gradient_dot_product": -0.017446722835302353
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7251767441814698,
      "val_r": 0.4007056819283984,
      "n_iterations": 234,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.029717929661273956,
        "right_subspace_overlap_bottom_k": -0.08838153630495071,
        "interaction_matrix_overlap_top_k": -0.0063704028725624084,
        "interaction_matrix_overlap_bottom_k": 0.042205363512039185,
        "effective_rank": 0.0015814263606444001,
        "effective_rank_mergeability_score": -0.0012497330317273736,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.004800121299922466,
        "layerwise_effective_rank_mergeability_score": 0.005284859798848629,
        "task_vector_cosine_similarity": -0.0065510887652635574,
        "task_vector_l2_distance": -0.011463101953268051,
        "task_vector_dot_product": -0.0020668848883360624,
        "weight_space_angle": 0.007008402608335018,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.047519076615571976,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.051950011402368546,
        "activation_magnitude_ratio": -0.0066606467589735985,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.016461005434393883,
        "encoder_gradient_l2_distance": -0.10353877395391464,
        "encoder_gradient_dot_product": 0.001282063196413219,
        "input_gradient_cosine_similarity": 0.008467340841889381,
        "input_gradient_l2_distance": -0.029680021107196808,
        "input_gradient_dot_product": -0.0014702052576467395
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7879999094292558,
      "val_r": 0.4923995881630213,
      "n_iterations": 211,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.026570962741971016,
        "right_subspace_overlap_bottom_k": -0.11350882798433304,
        "interaction_matrix_overlap_top_k": 0.0019522549118846655,
        "interaction_matrix_overlap_bottom_k": 0.0957941859960556,
        "effective_rank": -0.004052397795021534,
        "effective_rank_mergeability_score": 0.0043953764252364635,
        "stable_rank": -0.0018002359429374337,
        "spectral_gap": -0.005578138399869204,
        "singular_value_ratio": 0.005948251113295555,
        "layerwise_effective_rank": -0.011634205467998981,
        "layerwise_effective_rank_mergeability_score": 0.009880997240543365,
        "task_vector_cosine_similarity": -0.01328075211495161,
        "task_vector_l2_distance": -0.009790489450097084,
        "task_vector_dot_product": -0.001175945857539773,
        "weight_space_angle": 0.010075841099023819,
        "task_vector_magnitude_ratio": 0.002683551050722599,
        "singular_value_overlap": -0.004370111506432295,
        "subspace_overlap": 0.005141986068338156,
        "right_subspace_overlap": 0.019164353609085083,
        "activation_l2_distance": -0.008361892774701118,
        "activation_cosine_similarity": 0.036754973232746124,
        "activation_magnitude_ratio": -0.00519710686057806,
        "activation_dot_product": -0.0038482979871332645,
        "encoder_gradient_cosine_similarity": 0.012894492596387863,
        "encoder_gradient_l2_distance": -0.06402753293514252,
        "encoder_gradient_dot_product": -0.00239877519197762,
        "input_gradient_cosine_similarity": -0.004183121956884861,
        "input_gradient_l2_distance": -0.0648917704820633,
        "input_gradient_dot_product": -0.018880339339375496
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7325031427338967,
      "val_r": 0.6722600281588205,
      "n_iterations": 277,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.05298300087451935,
        "right_subspace_overlap_bottom_k": -0.09465579688549042,
        "interaction_matrix_overlap_top_k": 0.013231230899691582,
        "interaction_matrix_overlap_bottom_k": 0.015593448653817177,
        "effective_rank": -0.0023325986694544554,
        "effective_rank_mergeability_score": 0.0018730657175183296,
        "stable_rank": -0.005382461939007044,
        "spectral_gap": -0.0021816191729158163,
        "singular_value_ratio": 0.002254724968224764,
        "layerwise_effective_rank": -0.010796762071549892,
        "layerwise_effective_rank_mergeability_score": 0.007280681282281876,
        "task_vector_cosine_similarity": -0.012961158528923988,
        "task_vector_l2_distance": -0.04852066561579704,
        "task_vector_dot_product": -0.011754799634218216,
        "weight_space_angle": 0.00863021332770586,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.003727172501385212,
        "subspace_overlap": 0.024866655468940735,
        "right_subspace_overlap": 0.043711934238672256,
        "activation_l2_distance": -0.003942635841667652,
        "activation_cosine_similarity": -0.009992583654820919,
        "activation_magnitude_ratio": -0.005194155033677816,
        "activation_dot_product": -0.03511252999305725,
        "encoder_gradient_cosine_similarity": 0.030196048319339752,
        "encoder_gradient_l2_distance": -0.2027202993631363,
        "encoder_gradient_dot_product": 0.002258818596601486,
        "input_gradient_cosine_similarity": 0.001095376443117857,
        "input_gradient_l2_distance": -0.19505415856838226,
        "input_gradient_dot_product": -0.005770937539637089
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7612540281827133,
      "val_r": 0.13155199903587705,
      "n_iterations": 374,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0277336947619915,
        "right_subspace_overlap_bottom_k": -0.03984960913658142,
        "interaction_matrix_overlap_top_k": 0.0015954046975821257,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": -0.004160797689110041,
        "effective_rank_mergeability_score": 0.004156691022217274,
        "stable_rank": -0.006893024779856205,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0048393611796200275,
        "task_vector_l2_distance": -0.029415201395750046,
        "task_vector_dot_product": -0.0014818175695836544,
        "weight_space_angle": 0.0033223829232156277,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.016199974343180656,
        "activation_l2_distance": -0.0424179807305336,
        "activation_cosine_similarity": 0.0840558186173439,
        "activation_magnitude_ratio": -0.017491253092885017,
        "activation_dot_product": 0.015904497355222702,
        "encoder_gradient_cosine_similarity": 0.004408098757266998,
        "encoder_gradient_l2_distance": -0.16423176229000092,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0019170191371813416,
        "input_gradient_l2_distance": -0.08290726691484451,
        "input_gradient_dot_product": -0.0018826590385288
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7699752264749276,
      "val_r": 0.7601111949101101,
      "n_iterations": 308,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.03357455134391785,
        "right_subspace_overlap_bottom_k": -0.04372955858707428,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.013848300091922283,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.018172377720475197,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0010138292564079165,
        "weight_space_angle": 0.013479300774633884,
        "task_vector_magnitude_ratio": -0.002785195829346776,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.01811271905899048,
        "activation_l2_distance": 0.00231162179261446,
        "activation_cosine_similarity": 0.030282320454716682,
        "activation_magnitude_ratio": -0.005398460663855076,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.007077499758452177,
        "encoder_gradient_l2_distance": -0.04971189424395561,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.003309789579361677,
        "input_gradient_l2_distance": -0.027167823165655136,
        "input_gradient_dot_product": -0.011122659780085087
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7773408845704335,
      "val_r": 0.7475871195665628,
      "n_iterations": 343,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01256369985640049,
        "right_subspace_overlap_bottom_k": -0.036225996911525726,
        "interaction_matrix_overlap_top_k": -0.004748607985675335,
        "interaction_matrix_overlap_bottom_k": 0.027687974274158478,
        "effective_rank": 0.003144696820527315,
        "effective_rank_mergeability_score": -0.0032612099312245846,
        "stable_rank": 0.0011162005830556154,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002378955250605941,
        "layerwise_effective_rank_mergeability_score": 0.0028943896759301424,
        "task_vector_cosine_similarity": 0.010298074223101139,
        "task_vector_l2_distance": 0.0010877042077481747,
        "task_vector_dot_product": -0.0010162054095417261,
        "weight_space_angle": -0.007144753821194172,
        "task_vector_magnitude_ratio": -0.0019066762179136276,
        "singular_value_overlap": -0.0011637624120339751,
        "subspace_overlap": -0.014651929028332233,
        "right_subspace_overlap": 0.006183967925608158,
        "activation_l2_distance": 0.014610028825700283,
        "activation_cosine_similarity": 0.027826718986034393,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.005909517407417297,
        "encoder_gradient_cosine_similarity": 0.004299367778003216,
        "encoder_gradient_l2_distance": -0.020214274525642395,
        "encoder_gradient_dot_product": 0.0029658132698386908,
        "input_gradient_cosine_similarity": 0.0022488594986498356,
        "input_gradient_l2_distance": -0.013594177551567554,
        "input_gradient_dot_product": -0.007552890572696924
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7862167675915087,
      "val_r": 0.8354350526542047,
      "n_iterations": 310,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005805536638945341,
        "right_subspace_overlap_bottom_k": -0.08126701414585114,
        "interaction_matrix_overlap_top_k": -0.018590833991765976,
        "interaction_matrix_overlap_bottom_k": 0.06915830820798874,
        "effective_rank": 0.0020484765991568565,
        "effective_rank_mergeability_score": -0.0020280955359339714,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003525514155626297,
        "layerwise_effective_rank_mergeability_score": 0.004164821468293667,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.002479403745383024,
        "task_vector_dot_product": -0.0029035729821771383,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0015731846215203404,
        "singular_value_overlap": -0.0030459295958280563,
        "subspace_overlap": -0.00804264284670353,
        "right_subspace_overlap": 0.02720821090042591,
        "activation_l2_distance": -0.002322496846318245,
        "activation_cosine_similarity": 0.015887344256043434,
        "activation_magnitude_ratio": -0.0013211292680352926,
        "activation_dot_product": -0.001857072813436389,
        "encoder_gradient_cosine_similarity": 0.001944027841091156,
        "encoder_gradient_l2_distance": -0.0246804878115654,
        "encoder_gradient_dot_product": 0.003198331920430064,
        "input_gradient_cosine_similarity": 0.00348869152367115,
        "input_gradient_l2_distance": -0.017448030412197113,
        "input_gradient_dot_product": -0.009021556936204433
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7516788439172457,
      "val_r": 0.7786263782745523,
      "n_iterations": 367,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04413336515426636,
        "right_subspace_overlap_bottom_k": -0.09365377575159073,
        "interaction_matrix_overlap_top_k": 0.002573369536548853,
        "interaction_matrix_overlap_bottom_k": 0.031086774542927742,
        "effective_rank": -0.0014635021798312664,
        "effective_rank_mergeability_score": 0.001291027758270502,
        "stable_rank": -0.006190955173224211,
        "spectral_gap": -0.001305636134929955,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.00346294860355556,
        "layerwise_effective_rank_mergeability_score": 0.003992508165538311,
        "task_vector_cosine_similarity": -0.014368738047778606,
        "task_vector_l2_distance": -0.016118623316287994,
        "task_vector_dot_product": -0.007565611507743597,
        "weight_space_angle": 0.013331414200365543,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0011057580122724175,
        "right_subspace_overlap": 0.042337752878665924,
        "activation_l2_distance": -0.027731886133551598,
        "activation_cosine_similarity": 0.047363393008708954,
        "activation_magnitude_ratio": -0.01226906105875969,
        "activation_dot_product": 0.009786522015929222,
        "encoder_gradient_cosine_similarity": 0.015368395484983921,
        "encoder_gradient_l2_distance": -0.12407097965478897,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.006123395636677742,
        "input_gradient_l2_distance": -0.10038696229457855,
        "input_gradient_dot_product": -0.010163746774196625
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7966764106427189,
      "val_r": 0.5885795273992257,
      "n_iterations": 265,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01703852042555809,
        "right_subspace_overlap_bottom_k": -0.04517157003283501,
        "interaction_matrix_overlap_top_k": -0.0011152776423841715,
        "interaction_matrix_overlap_bottom_k": 0.016794821247458458,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.002666841959580779,
        "spectral_gap": 0.0012498018331825733,
        "singular_value_ratio": -0.0012750059831887484,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.007109799422323704,
        "task_vector_l2_distance": -0.01630881242454052,
        "task_vector_dot_product": -0.0013742026640102267,
        "weight_space_angle": 0.007298558950424194,
        "task_vector_magnitude_ratio": -0.001970083685591817,
        "singular_value_overlap": 0.012371108867228031,
        "subspace_overlap": -0.009248425252735615,
        "right_subspace_overlap": 0.0307697094976902,
        "activation_l2_distance": 0.021070826798677444,
        "activation_cosine_similarity": 0.04413408413529396,
        "activation_magnitude_ratio": -0.00698558334261179,
        "activation_dot_product": -0.00418336596339941,
        "encoder_gradient_cosine_similarity": 0.007104190066456795,
        "encoder_gradient_l2_distance": -0.06706098467111588,
        "encoder_gradient_dot_product": 0.0033569163642823696,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.027307143434882164,
        "input_gradient_dot_product": -0.018552590161561966
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7700989354669148,
      "val_r": 0.7264544118899119,
      "n_iterations": 209,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02951524406671524,
        "right_subspace_overlap_bottom_k": -0.06613843142986298,
        "interaction_matrix_overlap_top_k": -0.0059266285970807076,
        "interaction_matrix_overlap_bottom_k": 0.0376201793551445,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003083884483203292,
        "layerwise_effective_rank_mergeability_score": 0.0024275570176541805,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.013288903050124645,
        "weight_space_angle": 0.00106092169880867,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.002760234521701932,
        "right_subspace_overlap": 0.020111996680498123,
        "activation_l2_distance": 0.0013279297854751348,
        "activation_cosine_similarity": 0.03715701773762703,
        "activation_magnitude_ratio": -0.008242611773312092,
        "activation_dot_product": -0.0051318565383553505,
        "encoder_gradient_cosine_similarity": 0.008660205639898777,
        "encoder_gradient_l2_distance": -0.05860868841409683,
        "encoder_gradient_dot_product": 0.0016630749450996518,
        "input_gradient_cosine_similarity": 0.003591675776988268,
        "input_gradient_l2_distance": -0.03070850670337677,
        "input_gradient_dot_product": -0.012892511673271656
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6887016438909406,
      "val_r": 0.5752578981795348,
      "n_iterations": 311,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.019681889563798904,
        "right_subspace_overlap_bottom_k": -0.06576503813266754,
        "interaction_matrix_overlap_top_k": 0.009929347783327103,
        "interaction_matrix_overlap_bottom_k": -0.010653499513864517,
        "effective_rank": -0.00842874776571989,
        "effective_rank_mergeability_score": 0.008589597418904305,
        "stable_rank": -0.011210188269615173,
        "spectral_gap": 0.006168973632156849,
        "singular_value_ratio": -0.006723667029291391,
        "layerwise_effective_rank": -0.015829946845769882,
        "layerwise_effective_rank_mergeability_score": 0.016456186771392822,
        "task_vector_cosine_similarity": 0.011813743971288204,
        "task_vector_l2_distance": -0.018275419250130653,
        "task_vector_dot_product": 0.0017395932227373123,
        "weight_space_angle": -0.010151093825697899,
        "task_vector_magnitude_ratio": -0.0064336690120399,
        "singular_value_overlap": 0.01000874862074852,
        "subspace_overlap": 0.011342315934598446,
        "right_subspace_overlap": 0.0359213761985302,
        "activation_l2_distance": -0.006908504758030176,
        "activation_cosine_similarity": 0.04818959906697273,
        "activation_magnitude_ratio": -0.020413251593708992,
        "activation_dot_product": 0.07476352900266647,
        "encoder_gradient_cosine_similarity": 0.02718469314277172,
        "encoder_gradient_l2_distance": -0.10277704894542694,
        "encoder_gradient_dot_product": 0.023677153512835503,
        "input_gradient_cosine_similarity": 0.019752154126763344,
        "input_gradient_l2_distance": -0.11616577953100204,
        "input_gradient_dot_product": -0.07384951412677765
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8088315716570929,
      "val_r": 0.4021642617530026,
      "n_iterations": 221,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.034528449177742004,
        "right_subspace_overlap_bottom_k": -0.08009927719831467,
        "interaction_matrix_overlap_top_k": -0.004224625416100025,
        "interaction_matrix_overlap_bottom_k": 0.06077336519956589,
        "effective_rank": 0.0033284667879343033,
        "effective_rank_mergeability_score": -0.003977722488343716,
        "stable_rank": -0.0018428363837301731,
        "spectral_gap": -0.0019571881275624037,
        "singular_value_ratio": 0.002145215170457959,
        "layerwise_effective_rank": -0.012278610840439796,
        "layerwise_effective_rank_mergeability_score": 0.004186834674328566,
        "task_vector_cosine_similarity": -0.010419966652989388,
        "task_vector_l2_distance": -0.007750289980322123,
        "task_vector_dot_product": -0.0010853213025256991,
        "weight_space_angle": 0.006198554299771786,
        "task_vector_magnitude_ratio": 0.0021137166768312454,
        "singular_value_overlap": 0.005771576426923275,
        "subspace_overlap": -0.0030728632118552923,
        "right_subspace_overlap": 0.00801078975200653,
        "activation_l2_distance": 0.0012175976298749447,
        "activation_cosine_similarity": 0.02330736815929413,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.015850931406021118,
        "encoder_gradient_cosine_similarity": 0.007734691258519888,
        "encoder_gradient_l2_distance": -0.0542776845395565,
        "encoder_gradient_dot_product": 0.0034997197799384594,
        "input_gradient_cosine_similarity": 0.0016097044572234154,
        "input_gradient_l2_distance": -0.03743886947631836,
        "input_gradient_dot_product": -0.009202555753290653
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8273009013830684,
      "val_r": 0.7189386757677257,
      "n_iterations": 459,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.007811649702489376,
        "right_subspace_overlap_bottom_k": -0.006239260081201792,
        "interaction_matrix_overlap_top_k": -0.003976557403802872,
        "interaction_matrix_overlap_bottom_k": 0.002259117318317294,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.003784013446420431,
        "singular_value_ratio": -0.0037821370642632246,
        "layerwise_effective_rank": -0.0031902361661195755,
        "layerwise_effective_rank_mergeability_score": 0.0038877439219504595,
        "task_vector_cosine_similarity": 0.001760896178893745,
        "task_vector_l2_distance": -0.06190451979637146,
        "task_vector_dot_product": 0.001974965911358595,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.006349490024149418,
        "singular_value_overlap": -0.0029022283852100372,
        "subspace_overlap": 0.001906869001686573,
        "right_subspace_overlap": -0.010746454820036888,
        "activation_l2_distance": 0.0013813512632623315,
        "activation_cosine_similarity": 0.030038706958293915,
        "activation_magnitude_ratio": -0.005343569442629814,
        "activation_dot_product": 0.0686434656381607,
        "encoder_gradient_cosine_similarity": 0.003077686997130513,
        "encoder_gradient_l2_distance": -0.12710370123386383,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0022429446689784527,
        "input_gradient_l2_distance": -0.1056857705116272,
        "input_gradient_dot_product": -0.013423141092061996
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}