{
  "aggregate_metrics": {
    "train_r": 0.34935367148004187,
    "train_p": 3.905730748119283e-93,
    "val_r": -0.16513198689428094,
    "val_p": 0.001718150848546439
  },
  "per_fold_stats": {
    "train_r_mean": 0.5731441664875355,
    "train_r_std": 0.047458090824185416,
    "val_r_mean": 0.43786942998875755,
    "val_r_std": 0.17716790757147277,
    "n_nonzero_mean": 22.3,
    "n_nonzero_std": 3.5085609585697664
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0028467674273997545,
    "right_subspace_overlap_bottom_k": -0.007373227272182703,
    "interaction_matrix_overlap_top_k": -0.018788643181324005,
    "interaction_matrix_overlap_bottom_k": 0.07127653062343597,
    "effective_rank": -0.0015735769411548972,
    "effective_rank_mergeability_score": 0.0016040944028645754,
    "stable_rank": -0.001054840162396431,
    "spectral_gap": -0.0009712738683447242,
    "singular_value_ratio": 0.0011116729583591223,
    "layerwise_effective_rank": -0.00010908934928011149,
    "layerwise_effective_rank_mergeability_score": 0.0018412142526358366,
    "task_vector_cosine_similarity": -0.0009318022057414055,
    "task_vector_l2_distance": -0.03862891346216202,
    "task_vector_dot_product": 0.0031259481329470873,
    "weight_space_angle": 0.0008440656820312142,
    "task_vector_magnitude_ratio": -0.012088426388800144,
    "singular_value_overlap": -0.035289231687784195,
    "subspace_overlap": 0.012833970598876476,
    "right_subspace_overlap": 0.003698952030390501,
    "activation_l2_distance": -0.001064395997673273,
    "activation_cosine_similarity": -0.0008205717313103378,
    "activation_magnitude_ratio": -0.011298161000013351,
    "activation_dot_product": -0.003238723846152425,
    "encoder_gradient_cosine_similarity": -7.054345769574866e-05,
    "encoder_gradient_l2_distance": -0.026714008301496506,
    "encoder_gradient_dot_product": 0.00027558329747989774,
    "input_gradient_cosine_similarity": 0.0037261992692947388,
    "input_gradient_l2_distance": -0.04199270159006119,
    "input_gradient_dot_product": -0.00988083053380251
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.009971057996153831,
    "right_subspace_overlap_bottom_k": 0.01637353003025055,
    "interaction_matrix_overlap_top_k": 0.011992193758487701,
    "interaction_matrix_overlap_bottom_k": 0.01781393773853779,
    "effective_rank": 0.001756478799507022,
    "effective_rank_mergeability_score": 0.001851018751040101,
    "stable_rank": 0.0018390316981822252,
    "spectral_gap": 0.001787249930202961,
    "singular_value_ratio": 0.0017221757443621755,
    "layerwise_effective_rank": 0.0045245676301419735,
    "layerwise_effective_rank_mergeability_score": 0.007643452845513821,
    "task_vector_cosine_similarity": 0.0033119111321866512,
    "task_vector_l2_distance": 0.020257921889424324,
    "task_vector_dot_product": 0.007256132084876299,
    "weight_space_angle": 0.0027844842988997698,
    "task_vector_magnitude_ratio": 0.005144985392689705,
    "singular_value_overlap": 0.017193889245390892,
    "subspace_overlap": 0.010236210189759731,
    "right_subspace_overlap": 0.01542455144226551,
    "activation_l2_distance": 0.015610015951097012,
    "activation_cosine_similarity": 0.014288390055298805,
    "activation_magnitude_ratio": 0.007485215552151203,
    "activation_dot_product": 0.008264018222689629,
    "encoder_gradient_cosine_similarity": 0.0035880613140761852,
    "encoder_gradient_l2_distance": 0.030657194554805756,
    "encoder_gradient_dot_product": 0.0015485455514863133,
    "input_gradient_cosine_similarity": 0.003013133304193616,
    "input_gradient_l2_distance": 0.03136690333485603,
    "input_gradient_dot_product": 0.005449756048619747
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.55,
    "right_subspace_overlap_bottom_k": 0.85,
    "interaction_matrix_overlap_top_k": 1.0,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.65,
    "effective_rank_mergeability_score": 0.65,
    "stable_rank": 0.4,
    "spectral_gap": 0.6,
    "singular_value_ratio": 0.65,
    "layerwise_effective_rank": 0.45,
    "layerwise_effective_rank_mergeability_score": 0.45,
    "task_vector_cosine_similarity": 0.6,
    "task_vector_l2_distance": 1.0,
    "task_vector_dot_product": 0.9,
    "weight_space_angle": 0.45,
    "task_vector_magnitude_ratio": 1.0,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.95,
    "right_subspace_overlap": 0.55,
    "activation_l2_distance": 0.9,
    "activation_cosine_similarity": 0.7,
    "activation_magnitude_ratio": 0.95,
    "activation_dot_product": 0.85,
    "encoder_gradient_cosine_similarity": 0.8,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.55,
    "input_gradient_cosine_similarity": 0.85,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 1.0
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6255586729867049,
      "val_r": 0.6256389376397659,
      "n_iterations": 273,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0011197396088391542,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.029617790132761,
        "interaction_matrix_overlap_bottom_k": 0.08136450499296188,
        "effective_rank": -0.006125051062554121,
        "effective_rank_mergeability_score": 0.004592671524733305,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.013955133967101574,
        "layerwise_effective_rank_mergeability_score": -0.0033990393858402967,
        "task_vector_cosine_similarity": -0.0010508573614060879,
        "task_vector_l2_distance": -0.046745192259550095,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0041350931860506535,
        "task_vector_magnitude_ratio": -0.017776118591427803,
        "singular_value_overlap": -0.04778338223695755,
        "subspace_overlap": 0.031976912170648575,
        "right_subspace_overlap": -0.0015936257550492883,
        "activation_l2_distance": -0.0019406070932745934,
        "activation_cosine_similarity": 0.0027469205670058727,
        "activation_magnitude_ratio": -0.017085690051317215,
        "activation_dot_product": -0.011752725578844547,
        "encoder_gradient_cosine_similarity": -0.0018932900857180357,
        "encoder_gradient_l2_distance": -0.026199432089924812,
        "encoder_gradient_dot_product": -0.0010890900157392025,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03522311896085739,
        "input_gradient_dot_product": -0.013803277164697647
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5612883016896778,
      "val_r": 0.5273116402627289,
      "n_iterations": 268,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.025829274207353592,
        "interaction_matrix_overlap_top_k": -0.0193647388368845,
        "interaction_matrix_overlap_bottom_k": 0.058085646480321884,
        "effective_rank": -0.0028045184444636106,
        "effective_rank_mergeability_score": 0.0024331100285053253,
        "stable_rank": 0.0,
        "spectral_gap": -0.0026932337787002325,
        "singular_value_ratio": 0.002807005075737834,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.019888781011104584,
        "task_vector_dot_product": 0.006304477341473103,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.01254183892160654,
        "singular_value_overlap": -0.016040891408920288,
        "subspace_overlap": 0.007496842183172703,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0021718237549066544,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.00371296308003366,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.0014601859729737043,
        "encoder_gradient_l2_distance": -0.013875262811779976,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002950392896309495,
        "input_gradient_l2_distance": -0.015399781055748463,
        "input_gradient_dot_product": -0.0022225661668926477
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5619096551714909,
      "val_r": 0.5030198907963286,
      "n_iterations": 488,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005420292727649212,
        "right_subspace_overlap_bottom_k": 0.011228227987885475,
        "interaction_matrix_overlap_top_k": -0.016886094585061073,
        "interaction_matrix_overlap_bottom_k": 0.07604966312646866,
        "effective_rank": -0.0013556280173361301,
        "effective_rank_mergeability_score": 0.0015844120644032955,
        "stable_rank": -0.0019754325039684772,
        "spectral_gap": 0.0028395378030836582,
        "singular_value_ratio": -0.002676052041351795,
        "layerwise_effective_rank": -0.0014810952125117183,
        "layerwise_effective_rank_mergeability_score": 0.0016190186142921448,
        "task_vector_cosine_similarity": 0.0018673641607165337,
        "task_vector_l2_distance": -0.052410684525966644,
        "task_vector_dot_product": -0.002026286209002137,
        "weight_space_angle": -0.003761597676202655,
        "task_vector_magnitude_ratio": -0.01584424264729023,
        "singular_value_overlap": -0.05500537529587746,
        "subspace_overlap": 0.016758238896727562,
        "right_subspace_overlap": 0.0038490211591124535,
        "activation_l2_distance": -0.008232520893216133,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.022359605878591537,
        "activation_dot_product": -0.021655157208442688,
        "encoder_gradient_cosine_similarity": -0.005110464990139008,
        "encoder_gradient_l2_distance": -0.03379429876804352,
        "encoder_gradient_dot_product": 0.0024900278076529503,
        "input_gradient_cosine_similarity": 0.006360665895044804,
        "input_gradient_l2_distance": -0.05899108946323395,
        "input_gradient_dot_product": -0.0067664859816432
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5689916913981444,
      "val_r": 0.5001631978869142,
      "n_iterations": 271,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.016680926084518433,
        "interaction_matrix_overlap_top_k": -0.020077720284461975,
        "interaction_matrix_overlap_bottom_k": 0.07024780660867691,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0018916982226073742,
        "singular_value_ratio": 0.0018571591936051846,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02982645109295845,
        "task_vector_dot_product": 0.008462797850370407,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.013546925969421864,
        "singular_value_overlap": -0.028316587209701538,
        "subspace_overlap": 0.01239179540425539,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.005345283076167107,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.007961384952068329,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011832715943455696,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.006126976106315851,
        "input_gradient_l2_distance": -0.025978470221161842,
        "input_gradient_dot_product": -0.009050117805600166
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5694373890413572,
      "val_r": 0.5315823854504689,
      "n_iterations": 348,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005495178047567606,
        "right_subspace_overlap_bottom_k": -0.0041592977941036224,
        "interaction_matrix_overlap_top_k": -0.009363223798573017,
        "interaction_matrix_overlap_bottom_k": 0.0750681608915329,
        "effective_rank": 0.0012569944374263287,
        "effective_rank_mergeability_score": -0.001123833004385233,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.002137171570211649,
        "layerwise_effective_rank_mergeability_score": -0.002802950795739889,
        "task_vector_cosine_similarity": 0.00445648655295372,
        "task_vector_l2_distance": -0.039706408977508545,
        "task_vector_dot_product": -0.010614139959216118,
        "weight_space_angle": -0.002517667831853032,
        "task_vector_magnitude_ratio": -0.008012635633349419,
        "singular_value_overlap": -0.04127219319343567,
        "subspace_overlap": 0.003067324636504054,
        "right_subspace_overlap": 0.005926131270825863,
        "activation_l2_distance": -0.003046406665816903,
        "activation_cosine_similarity": -0.0015429217601194978,
        "activation_magnitude_ratio": -0.01480564009398222,
        "activation_dot_product": -0.01452111080288887,
        "encoder_gradient_cosine_similarity": 0.0021464484743773937,
        "encoder_gradient_l2_distance": -0.02119043469429016,
        "encoder_gradient_dot_product": 0.0021445397287607193,
        "input_gradient_cosine_similarity": 0.004573083017021418,
        "input_gradient_l2_distance": -0.04267091304063797,
        "input_gradient_dot_product": -0.007735861465334892
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.48019930432722635,
      "val_r": 0.6067683544856307,
      "n_iterations": 276,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025415755808353424,
        "right_subspace_overlap_bottom_k": -0.017836228013038635,
        "interaction_matrix_overlap_top_k": -0.03603383153676987,
        "interaction_matrix_overlap_bottom_k": 0.056785698980093,
        "effective_rank": -0.0015570134855806828,
        "effective_rank_mergeability_score": 0.0013564948458224535,
        "stable_rank": 0.001385294832289219,
        "spectral_gap": -0.003456415608525276,
        "singular_value_ratio": 0.003947386518120766,
        "layerwise_effective_rank": 0.00137956696562469,
        "layerwise_effective_rank_mergeability_score": -0.0023973151110112667,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.021011266857385635,
        "task_vector_dot_product": 0.01753825694322586,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.008276602253317833,
        "singular_value_overlap": -0.01601158268749714,
        "subspace_overlap": 0.015312003903090954,
        "right_subspace_overlap": 0.0034634023904800415,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003846700768917799,
        "activation_dot_product": -0.0014486403670161963,
        "encoder_gradient_cosine_similarity": 0.0011374785099178553,
        "encoder_gradient_l2_distance": -0.011527678929269314,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0019836067222058773,
        "input_gradient_l2_distance": -0.014651713892817497,
        "input_gradient_dot_product": -0.0061260368674993515
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.601847446737762,
      "val_r": 0.2458894398245468,
      "n_iterations": 378,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.024499457329511642,
        "interaction_matrix_overlap_top_k": -0.007916242815554142,
        "interaction_matrix_overlap_bottom_k": 0.0603896789252758,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.003974339459091425,
        "singular_value_ratio": 0.004247634671628475,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0016376024577766657,
        "task_vector_l2_distance": -0.016483504325151443,
        "task_vector_dot_product": -0.0019057451281696558,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.014725234359502792,
        "singular_value_overlap": -0.018958861008286476,
        "subspace_overlap": 0.0017908659065142274,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.006233659572899342,
        "activation_cosine_similarity": 0.00449030427262187,
        "activation_magnitude_ratio": 0.0014438487123697996,
        "activation_dot_product": -0.01319898758083582,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.017958123236894608,
        "encoder_gradient_dot_product": 0.0010157173965126276,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.021159715950489044,
        "input_gradient_dot_product": -0.00808529183268547
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5443382323522757,
      "val_r": 0.3906726557842953,
      "n_iterations": 560,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.01012424286454916,
        "interaction_matrix_overlap_top_k": -0.03552098944783211,
        "interaction_matrix_overlap_bottom_k": 0.07402512431144714,
        "effective_rank": -0.0015761838294565678,
        "effective_rank_mergeability_score": 0.001646128366701305,
        "stable_rank": 0.0,
        "spectral_gap": -0.0017016936326399446,
        "singular_value_ratio": 0.0019676517695188522,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.04136209189891815,
        "task_vector_dot_product": 0.004723283462226391,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.013990985229611397,
        "singular_value_overlap": -0.028902215883135796,
        "subspace_overlap": 0.024580955505371094,
        "right_subspace_overlap": 0.0012585371732711792,
        "activation_l2_distance": 0.009475401602685452,
        "activation_cosine_similarity": 0.002730149310082197,
        "activation_magnitude_ratio": -0.007629234343767166,
        "activation_dot_product": -0.0030232821591198444,
        "encoder_gradient_cosine_similarity": 0.0019486534874886274,
        "encoder_gradient_l2_distance": -0.018145764246582985,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0057212659157812595,
        "input_gradient_l2_distance": -0.015000421553850174,
        "input_gradient_dot_product": -0.0023741708137094975
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.560860529705465,
      "val_r": 0.4830425539446077,
      "n_iterations": 341,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.001172429881989956,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.020153222605586052,
        "interaction_matrix_overlap_bottom_k": 0.09863678365945816,
        "effective_rank": -0.002831331454217434,
        "effective_rank_mergeability_score": 0.0033253240399062634,
        "stable_rank": -0.002708843909204006,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0036113669630140066,
        "task_vector_l2_distance": -0.060933686792850494,
        "task_vector_dot_product": 0.0037024898920208216,
        "weight_space_angle": 0.0012501501478254795,
        "task_vector_magnitude_ratio": -0.010644536465406418,
        "singular_value_overlap": -0.054059796035289764,
        "subspace_overlap": 0.0163523368537426,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0034941297490149736,
        "activation_cosine_similarity": -0.0014468784211203456,
        "activation_magnitude_ratio": -0.017956044524908066,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0023742467164993286,
        "encoder_gradient_l2_distance": -0.024305429309606552,
        "encoder_gradient_dot_product": 0.00112737319432199,
        "input_gradient_cosine_similarity": 0.0020897360518574715,
        "input_gradient_l2_distance": -0.06262420117855072,
        "input_gradient_dot_product": -0.018027057871222496
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5698148547093072,
      "val_r": -0.15651963427983903,
      "n_iterations": 322,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004495238419622183,
        "right_subspace_overlap_bottom_k": -0.022598838433623314,
        "interaction_matrix_overlap_top_k": -0.03489469364285469,
        "interaction_matrix_overlap_bottom_k": 0.054812878370285034,
        "effective_rank": -0.0035971631295979023,
        "effective_rank_mergeability_score": 0.003158506704494357,
        "stable_rank": -0.0015583516797050834,
        "spectral_gap": -0.003341522067785263,
        "singular_value_ratio": 0.0030176499858498573,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.003040853887796402,
        "task_vector_l2_distance": -0.018123222514986992,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0024781632237136364,
        "task_vector_magnitude_ratio": -0.010984078049659729,
        "singular_value_overlap": -0.02688700333237648,
        "subspace_overlap": 0.023764370009303093,
        "right_subspace_overlap": 0.004769457504153252,
        "activation_l2_distance": -0.06137600913643837,
        "activation_cosine_similarity": -0.05201835557818413,
        "activation_magnitude_ratio": -0.01168079860508442,
        "activation_dot_product": -0.004220425151288509,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.014994951896369457,
        "encoder_gradient_dot_product": 0.003242204198613763,
        "input_gradient_cosine_similarity": -0.003010892542079091,
        "input_gradient_l2_distance": -0.027319829910993576,
        "input_gradient_dot_product": -0.010323846712708473
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5338343706211505,
      "val_r": 0.3924115347553345,
      "n_iterations": 300,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.005601656623184681,
        "right_subspace_overlap_bottom_k": 0.03422198444604874,
        "interaction_matrix_overlap_top_k": -0.007416240405291319,
        "interaction_matrix_overlap_bottom_k": 0.0919426679611206,
        "effective_rank": -0.004143994301557541,
        "effective_rank_mergeability_score": 0.006654117256402969,
        "stable_rank": -0.0038023977540433407,
        "spectral_gap": 0.0023328769020736217,
        "singular_value_ratio": -0.001492504496127367,
        "layerwise_effective_rank": -0.0018948349170386791,
        "layerwise_effective_rank_mergeability_score": 0.0012986346846446395,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.07247309386730194,
        "task_vector_dot_product": 0.0012977754231542349,
        "weight_space_angle": 0.002060847356915474,
        "task_vector_magnitude_ratio": -0.014556784182786942,
        "singular_value_overlap": -0.06091949716210365,
        "subspace_overlap": 0.009175625629723072,
        "right_subspace_overlap": -0.006376564968377352,
        "activation_l2_distance": -0.002607855014503002,
        "activation_cosine_similarity": -0.0032008595298975706,
        "activation_magnitude_ratio": -0.01975644752383232,
        "activation_dot_product": -0.0017425562255084515,
        "encoder_gradient_cosine_similarity": -0.0045659891329705715,
        "encoder_gradient_l2_distance": -0.03769215568900108,
        "encoder_gradient_dot_product": -0.0027130485977977514,
        "input_gradient_cosine_similarity": 0.006017148960381746,
        "input_gradient_l2_distance": -0.05641360953450203,
        "input_gradient_dot_product": -0.005250285379588604
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5603775540916572,
      "val_r": 0.5243612769101097,
      "n_iterations": 361,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.02335813082754612,
        "interaction_matrix_overlap_top_k": -0.019770510494709015,
        "interaction_matrix_overlap_bottom_k": 0.0604156032204628,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0030614743009209633,
        "singular_value_ratio": 0.0029872253071516752,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02037574164569378,
        "task_vector_dot_product": 0.007314157672226429,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.013457708060741425,
        "singular_value_overlap": -0.018356043845415115,
        "subspace_overlap": 0.01109781302511692,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.005412072408944368,
        "activation_dot_product": -0.0033145826309919357,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.012029756791889668,
        "encoder_gradient_dot_product": -0.002436983399093151,
        "input_gradient_cosine_similarity": 0.001642234856262803,
        "input_gradient_l2_distance": -0.01930541917681694,
        "input_gradient_dot_product": -0.005523913539946079
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.538277035236556,
      "val_r": 0.5148377224298938,
      "n_iterations": 362,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.012912079691886902,
        "interaction_matrix_overlap_top_k": -0.021276652812957764,
        "interaction_matrix_overlap_bottom_k": 0.0838783010840416,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0020964927971363068,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.003338051028549671,
        "task_vector_l2_distance": -0.0418686717748642,
        "task_vector_dot_product": 0.013093501329421997,
        "weight_space_angle": -0.001526283915154636,
        "task_vector_magnitude_ratio": -0.019746968522667885,
        "singular_value_overlap": -0.03617256507277489,
        "subspace_overlap": 0.005073348991572857,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.008634447120130062,
        "activation_cosine_similarity": 0.003632613457739353,
        "activation_magnitude_ratio": -0.008076703175902367,
        "activation_dot_product": -0.0029380307532846928,
        "encoder_gradient_cosine_similarity": -0.001985362498089671,
        "encoder_gradient_l2_distance": -0.02006898634135723,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.007133388426154852,
        "input_gradient_l2_distance": -0.03431306406855583,
        "input_gradient_dot_product": -0.013245704583823681
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5662442548309677,
      "val_r": 0.6081022858582936,
      "n_iterations": 452,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.0384383350610733,
        "interaction_matrix_overlap_top_k": -0.006906608585268259,
        "interaction_matrix_overlap_bottom_k": 0.07198836654424667,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0014330613194033504,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.023289304226636887,
        "task_vector_dot_product": 0.008540005423128605,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.007984270341694355,
        "singular_value_overlap": -0.023831019178032875,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0010038637556135654,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.004160567652434111,
        "activation_dot_product": -0.0036833295598626137,
        "encoder_gradient_cosine_similarity": -0.0013295038370415568,
        "encoder_gradient_l2_distance": -0.012620532885193825,
        "encoder_gradient_dot_product": -0.0020476169884204865,
        "input_gradient_cosine_similarity": 0.0049763754941523075,
        "input_gradient_l2_distance": -0.02180342935025692,
        "input_gradient_dot_product": -0.007581039797514677
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5330857690154672,
      "val_r": 0.563156544002997,
      "n_iterations": 372,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.004007193725556135,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.017933500930666924,
        "interaction_matrix_overlap_bottom_k": 0.10593242943286896,
        "effective_rank": -0.002405580598860979,
        "effective_rank_mergeability_score": 0.001732036704197526,
        "stable_rank": -0.0027170788962394,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0017577074468135834,
        "layerwise_effective_rank_mergeability_score": 0.0014367799740284681,
        "task_vector_cosine_similarity": -0.0014221478486433625,
        "task_vector_l2_distance": -0.07802008092403412,
        "task_vector_dot_product": 0.004202019423246384,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.020999528467655182,
        "singular_value_overlap": -0.0700092539191246,
        "subspace_overlap": 0.035130392760038376,
        "right_subspace_overlap": -0.0029063732363283634,
        "activation_l2_distance": -0.001990999560803175,
        "activation_cosine_similarity": -0.0029073385521769524,
        "activation_magnitude_ratio": -0.021183086559176445,
        "activation_dot_product": -0.01132587157189846,
        "encoder_gradient_cosine_similarity": -0.0018166393274441361,
        "encoder_gradient_l2_distance": -0.03652312979102135,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.004806915298104286,
        "input_gradient_l2_distance": -0.07962023466825485,
        "input_gradient_dot_product": -0.01830741949379444
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5756436150691993,
      "val_r": 0.3678858525625006,
      "n_iterations": 252,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0064362590201199055,
        "interaction_matrix_overlap_top_k": -0.001240458688698709,
        "interaction_matrix_overlap_bottom_k": 0.052260659635066986,
        "effective_rank": -0.0017205426702275872,
        "effective_rank_mergeability_score": 0.0013457490131258965,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0012391243362799287,
        "layerwise_effective_rank": 0.0015510983066633344,
        "layerwise_effective_rank_mergeability_score": -0.001335010165348649,
        "task_vector_cosine_similarity": -0.0013965535908937454,
        "task_vector_l2_distance": -0.04379516839981079,
        "task_vector_dot_product": 0.0029778270982205868,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.014786962419748306,
        "singular_value_overlap": -0.02276633121073246,
        "subspace_overlap": 0.0027379202656447887,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.017096105962991714,
        "activation_cosine_similarity": 0.006078317295759916,
        "activation_magnitude_ratio": -0.013904618099331856,
        "activation_dot_product": -0.007607273291796446,
        "encoder_gradient_cosine_similarity": -0.0034560482017695904,
        "encoder_gradient_l2_distance": -0.023877358064055443,
        "encoder_gradient_dot_product": 0.002044013701379299,
        "input_gradient_cosine_similarity": 0.0022081814240664244,
        "input_gradient_l2_distance": -0.033499717712402344,
        "input_gradient_dot_product": -0.013317348435521126
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5633588878193307,
      "val_r": 0.46120094210869417,
      "n_iterations": 345,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.007311064749956131,
        "interaction_matrix_overlap_top_k": -0.0041586123406887054,
        "interaction_matrix_overlap_bottom_k": 0.10044475644826889,
        "effective_rank": -0.002377826254814863,
        "effective_rank_mergeability_score": 0.002497876761481166,
        "stable_rank": -0.0032433720771223307,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0019963502418249846,
        "task_vector_l2_distance": -0.07589387148618698,
        "task_vector_dot_product": 0.00208712974563241,
        "weight_space_angle": 0.005322104319930077,
        "task_vector_magnitude_ratio": -0.012950848788022995,
        "singular_value_overlap": -0.06091611832380295,
        "subspace_overlap": 0.01334764901548624,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0152795584872365,
        "activation_cosine_similarity": -0.0022916540037840605,
        "activation_magnitude_ratio": -0.019225720316171646,
        "activation_dot_product": 0.006342749111354351,
        "encoder_gradient_cosine_similarity": 0.0045432355254888535,
        "encoder_gradient_l2_distance": -0.024264222010970116,
        "encoder_gradient_dot_product": 0.0017345290398225188,
        "input_gradient_cosine_similarity": 0.009884772822260857,
        "input_gradient_l2_distance": -0.06181155517697334,
        "input_gradient_dot_product": -0.017452050000429153
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6104428027031141,
      "val_r": 0.23751745926376067,
      "n_iterations": 288,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0088077113032341,
        "right_subspace_overlap_bottom_k": 0.005039295181632042,
        "interaction_matrix_overlap_top_k": -0.043715715408325195,
        "interaction_matrix_overlap_bottom_k": 0.06350643932819366,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0022030731197446585,
        "layerwise_effective_rank_mergeability_score": 0.00887567549943924,
        "task_vector_cosine_similarity": -0.0012308945879340172,
        "task_vector_l2_distance": -0.0364132821559906,
        "task_vector_dot_product": 0.001228060806170106,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004152111709117889,
        "singular_value_overlap": -0.019131336361169815,
        "subspace_overlap": 0.013255040161311626,
        "right_subspace_overlap": 0.011902139522135258,
        "activation_l2_distance": 0.006089456379413605,
        "activation_cosine_similarity": -0.006350652780383825,
        "activation_magnitude_ratio": -0.006353247445076704,
        "activation_dot_product": 0.009057938121259212,
        "encoder_gradient_cosine_similarity": -0.0024995650164783,
        "encoder_gradient_l2_distance": -0.008575733751058578,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.005258273798972368,
        "input_gradient_l2_distance": -0.03862564265727997,
        "input_gradient_dot_product": -0.006234833970665932
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7287692838131573,
      "val_r": 0.5528217105455469,
      "n_iterations": 291,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0438171811401844,
        "right_subspace_overlap_bottom_k": -0.018380558118224144,
        "interaction_matrix_overlap_top_k": -0.0020874382462352514,
        "interaction_matrix_overlap_bottom_k": 0.05198632553219795,
        "effective_rank": -0.002233702689409256,
        "effective_rank_mergeability_score": 0.0028792941011488438,
        "stable_rank": -0.006476621143519878,
        "spectral_gap": -0.0012580958427861333,
        "singular_value_ratio": 0.001485816785134375,
        "layerwise_effective_rank": -0.01386804599314928,
        "layerwise_effective_rank_mergeability_score": 0.033528491854667664,
        "task_vector_cosine_similarity": -0.012911317870020866,
        "task_vector_l2_distance": -0.007979756221175194,
        "task_vector_dot_product": -0.015076518058776855,
        "weight_space_angle": 0.009440504014492035,
        "task_vector_magnitude_ratio": 0.0016337028937414289,
        "singular_value_overlap": -0.04442860931158066,
        "subspace_overlap": -0.0050471932627260685,
        "right_subspace_overlap": 0.06753294914960861,
        "activation_l2_distance": -0.012595253996551037,
        "activation_cosine_similarity": 0.03513559699058533,
        "activation_magnitude_ratio": -0.022296549752354622,
        "activation_dot_product": 0.008602997288107872,
        "encoder_gradient_cosine_similarity": 0.011835791170597076,
        "encoder_gradient_l2_distance": -0.15515413880348206,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.1531587839126587,
        "input_gradient_dot_product": -0.021268241107463837
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6086036784306991,
      "val_r": 0.2775238495425718,
      "n_iterations": 434,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.00408566789701581,
        "right_subspace_overlap_bottom_k": 0.0031159999780356884,
        "interaction_matrix_overlap_top_k": -0.021438604220747948,
        "interaction_matrix_overlap_bottom_k": 0.037709012627601624,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0011229265946894884,
        "singular_value_ratio": 0.0014123020227998495,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.025977976620197296,
        "task_vector_dot_product": 0.010669861920177937,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.00842384621500969,
        "singular_value_overlap": -0.016015945002436638,
        "subspace_overlap": 0.018417129293084145,
        "right_subspace_overlap": -0.01384603139013052,
        "activation_l2_distance": 0.008145319297909737,
        "activation_cosine_similarity": -0.001466677407734096,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.01165381632745266,
        "encoder_gradient_cosine_similarity": -0.001279671909287572,
        "encoder_gradient_l2_distance": -0.009650119580328465,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.005801853258162737,
        "input_gradient_l2_distance": -0.022283313795924187,
        "input_gradient_dot_product": -0.004921041429042816
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}