{
  "weight_avg": {
    "aggregate_metrics": {
      "train_r": 0.5136176975362746,
      "train_p": 1.9826254112934166e-216,
      "val_r": 0.2806640519184891,
      "val_p": 6.635287004186968e-08
    },
    "per_fold_stats": {
      "train_r_mean": 0.7552994809918221,
      "train_r_std": 0.040983991659465105,
      "val_r_mean": 0.6263238358279405,
      "val_r_std": 0.16764940520451446,
      "n_nonzero_mean": 23.75,
      "n_nonzero_std": 4.085033659592048
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.02614269219338894,
      "right_subspace_overlap_bottom_k": -0.06519121676683426,
      "interaction_matrix_overlap_top_k": 0.0014574499800801277,
      "interaction_matrix_overlap_bottom_k": 0.02519049122929573,
      "effective_rank": -0.001100545865483582,
      "effective_rank_mergeability_score": 0.0010268473997712135,
      "stable_rank": -0.002752876142039895,
      "spectral_gap": 0.0005758834886364639,
      "singular_value_ratio": -0.0005722002242691815,
      "layerwise_effective_rank": -0.005257123149931431,
      "layerwise_effective_rank_mergeability_score": 0.004965951666235924,
      "task_vector_cosine_similarity": -0.0005221606115810573,
      "task_vector_l2_distance": -0.01453630905598402,
      "task_vector_dot_product": -0.0012456985423341393,
      "weight_space_angle": -8.390508446609601e-05,
      "task_vector_magnitude_ratio": -0.002123479964211583,
      "singular_value_overlap": 0.0011224301997572184,
      "subspace_overlap": 0.0027066455222666264,
      "right_subspace_overlap": 0.024000700563192368,
      "activation_l2_distance": -0.0035514694172888994,
      "activation_cosine_similarity": 0.03996554762125015,
      "activation_magnitude_ratio": -0.010531645268201828,
      "activation_dot_product": 0.018158668652176857,
      "encoder_gradient_cosine_similarity": 0.012641352601349354,
      "encoder_gradient_l2_distance": -0.08846522867679596,
      "encoder_gradient_dot_product": 0.005914599634706974,
      "input_gradient_cosine_similarity": 0.004979727324098349,
      "input_gradient_l2_distance": -0.06751187145709991,
      "input_gradient_dot_product": -0.022342301905155182
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.014460334554314613,
      "right_subspace_overlap_bottom_k": 0.02796490490436554,
      "interaction_matrix_overlap_top_k": 0.009935401380062103,
      "interaction_matrix_overlap_bottom_k": 0.028310995548963547,
      "effective_rank": 0.0036985131446272135,
      "effective_rank_mergeability_score": 0.0037176483310759068,
      "stable_rank": 0.00404495419934392,
      "spectral_gap": 0.0031851481180638075,
      "singular_value_ratio": 0.00326457223854959,
      "layerwise_effective_rank": 0.005326064303517342,
      "layerwise_effective_rank_mergeability_score": 0.004898867104202509,
      "task_vector_cosine_similarity": 0.011718063615262508,
      "task_vector_l2_distance": 0.016348131000995636,
      "task_vector_dot_product": 0.008321672677993774,
      "weight_space_angle": 0.01042709406465292,
      "task_vector_magnitude_ratio": 0.0032441476359963417,
      "singular_value_overlap": 0.006059568375349045,
      "subspace_overlap": 0.010242149233818054,
      "right_subspace_overlap": 0.014824566431343555,
      "activation_l2_distance": 0.013335608877241611,
      "activation_cosine_similarity": 0.02013869397342205,
      "activation_magnitude_ratio": 0.010919869877398014,
      "activation_dot_product": 0.040092989802360535,
      "encoder_gradient_cosine_similarity": 0.008577995002269745,
      "encoder_gradient_l2_distance": 0.04789772257208824,
      "encoder_gradient_dot_product": 0.009363388642668724,
      "input_gradient_cosine_similarity": 0.005748338531702757,
      "input_gradient_l2_distance": 0.05199272558093071,
      "input_gradient_dot_product": 0.023557323962450027
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 1.0,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.85,
      "interaction_matrix_overlap_bottom_k": 0.9,
      "effective_rank": 0.6,
      "effective_rank_mergeability_score": 0.6,
      "stable_rank": 0.5,
      "spectral_gap": 0.55,
      "singular_value_ratio": 0.5,
      "layerwise_effective_rank": 0.75,
      "layerwise_effective_rank_mergeability_score": 0.8,
      "task_vector_cosine_similarity": 0.75,
      "task_vector_l2_distance": 0.8,
      "task_vector_dot_product": 1.0,
      "weight_space_angle": 0.85,
      "task_vector_magnitude_ratio": 0.75,
      "singular_value_overlap": 0.65,
      "subspace_overlap": 0.75,
      "right_subspace_overlap": 1.0,
      "activation_l2_distance": 0.8,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.85,
      "activation_dot_product": 0.85,
      "encoder_gradient_cosine_similarity": 1.0,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.75,
      "input_gradient_cosine_similarity": 0.9,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 1.0
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7776065308397994,
        "val_r": 0.6513681151841857,
        "n_iterations": 261,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.016489706933498383,
          "right_subspace_overlap_bottom_k": -0.06836588680744171,
          "interaction_matrix_overlap_top_k": -0.004583640489727259,
          "interaction_matrix_overlap_bottom_k": 0.05946151167154312,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.01049492135643959,
          "weight_space_angle": -0.0027669533155858517,
          "task_vector_magnitude_ratio": -0.003988294396549463,
          "singular_value_overlap": -0.004805846605449915,
          "subspace_overlap": 0.0015705910045653582,
          "right_subspace_overlap": 0.005917066242545843,
          "activation_l2_distance": 0.008604173548519611,
          "activation_cosine_similarity": 0.03376626595854759,
          "activation_magnitude_ratio": -0.0048722452484071255,
          "activation_dot_product": -0.011535524390637875,
          "encoder_gradient_cosine_similarity": 0.0022052840795367956,
          "encoder_gradient_l2_distance": -0.02509288489818573,
          "encoder_gradient_dot_product": 0.0014106581220403314,
          "input_gradient_cosine_similarity": 0.003751227166503668,
          "input_gradient_l2_distance": -0.018698979169130325,
          "input_gradient_dot_product": -0.00694934232160449
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6686818838354203,
        "val_r": 0.7458696271621358,
        "n_iterations": 336,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04709790647029877,
          "right_subspace_overlap_bottom_k": -0.10956456512212753,
          "interaction_matrix_overlap_top_k": 0.027517901733517647,
          "interaction_matrix_overlap_bottom_k": -0.014445317909121513,
          "effective_rank": -0.01046446617692709,
          "effective_rank_mergeability_score": 0.009951958432793617,
          "stable_rank": -0.013221104629337788,
          "spectral_gap": 0.010092781856656075,
          "singular_value_ratio": -0.009768461808562279,
          "layerwise_effective_rank": -0.015757013112306595,
          "layerwise_effective_rank_mergeability_score": 0.015876544639468193,
          "task_vector_cosine_similarity": 0.03309626504778862,
          "task_vector_l2_distance": -0.024327008053660393,
          "task_vector_dot_product": 0.021525129675865173,
          "weight_space_angle": -0.031588997691869736,
          "task_vector_magnitude_ratio": -0.009629888460040092,
          "singular_value_overlap": 0.019199734553694725,
          "subspace_overlap": 0.02502933330833912,
          "right_subspace_overlap": 0.03704699128866196,
          "activation_l2_distance": -0.01593668945133686,
          "activation_cosine_similarity": 0.07916751503944397,
          "activation_magnitude_ratio": -0.043810464441776276,
          "activation_dot_product": 0.1354008913040161,
          "encoder_gradient_cosine_similarity": 0.022565651684999466,
          "encoder_gradient_l2_distance": -0.1477605551481247,
          "encoder_gradient_dot_product": 0.034149304032325745,
          "input_gradient_cosine_similarity": 0.005772619973868132,
          "input_gradient_l2_distance": -0.17483386397361755,
          "input_gradient_dot_product": -0.06669319421052933
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6860644946680847,
        "val_r": 0.657835370044287,
        "n_iterations": 374,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.023817429319024086,
          "right_subspace_overlap_bottom_k": -0.045234791934490204,
          "interaction_matrix_overlap_top_k": 0.008929379284381866,
          "interaction_matrix_overlap_bottom_k": 0.005825758911669254,
          "effective_rank": 0.004269677679985762,
          "effective_rank_mergeability_score": -0.00462503544986248,
          "stable_rank": 0.0,
          "spectral_gap": -0.0023762427736073732,
          "singular_value_ratio": 0.0032932725735008717,
          "layerwise_effective_rank": -0.0028434554114937782,
          "layerwise_effective_rank_mergeability_score": 0.0034552770666778088,
          "task_vector_cosine_similarity": 0.01394062303006649,
          "task_vector_l2_distance": -0.004013349302113056,
          "task_vector_dot_product": 0.013612144626677036,
          "weight_space_angle": -0.012972990050911903,
          "task_vector_magnitude_ratio": 0.0024889425840228796,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.010281329043209553,
          "right_subspace_overlap": 0.027969608083367348,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.027372682467103004,
          "activation_magnitude_ratio": -0.01661415584385395,
          "activation_dot_product": 0.0434751883149147,
          "encoder_gradient_cosine_similarity": 0.01349618099629879,
          "encoder_gradient_l2_distance": -0.06246650218963623,
          "encoder_gradient_dot_product": 0.012020021677017212,
          "input_gradient_cosine_similarity": 0.01848859339952469,
          "input_gradient_l2_distance": -0.06189430505037308,
          "input_gradient_dot_product": -0.04812796786427498
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7103873978474852,
        "val_r": 0.6814323605323063,
        "n_iterations": 340,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04434492066502571,
          "right_subspace_overlap_bottom_k": -0.08083301782608032,
          "interaction_matrix_overlap_top_k": 0.018916094675660133,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": -0.005481152329593897,
          "effective_rank_mergeability_score": 0.005421030800789595,
          "stable_rank": -0.00696607306599617,
          "spectral_gap": 0.0020579963456839323,
          "singular_value_ratio": -0.002464770805090666,
          "layerwise_effective_rank": -0.011320111341774464,
          "layerwise_effective_rank_mergeability_score": 0.012750174850225449,
          "task_vector_cosine_similarity": 0.009755585342645645,
          "task_vector_l2_distance": -0.015235042199492455,
          "task_vector_dot_product": 0.010297924280166626,
          "weight_space_angle": -0.012051456607878208,
          "task_vector_magnitude_ratio": -0.0038579627871513367,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.017986947670578957,
          "right_subspace_overlap": 0.027452990412712097,
          "activation_l2_distance": -0.00910128466784954,
          "activation_cosine_similarity": 0.05067197605967522,
          "activation_magnitude_ratio": -0.032673317939043045,
          "activation_dot_product": 0.07797358930110931,
          "encoder_gradient_cosine_similarity": 0.02918861247599125,
          "encoder_gradient_l2_distance": -0.1115749329328537,
          "encoder_gradient_dot_product": 0.021785562857985497,
          "input_gradient_cosine_similarity": 0.009599638171494007,
          "input_gradient_l2_distance": -0.12424290925264359,
          "input_gradient_dot_product": -0.07996535301208496
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7529060522522868,
        "val_r": 0.7911049472203836,
        "n_iterations": 244,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.024968139827251434,
          "right_subspace_overlap_bottom_k": -0.0724879801273346,
          "interaction_matrix_overlap_top_k": -0.005959411151707172,
          "interaction_matrix_overlap_bottom_k": 0.03750498965382576,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0015629276167601347,
          "singular_value_ratio": -0.0010714249219745398,
          "layerwise_effective_rank": -0.0016230414621531963,
          "layerwise_effective_rank_mergeability_score": 0.0016578033100813627,
          "task_vector_cosine_similarity": -0.003405152354389429,
          "task_vector_l2_distance": -0.020022636279463768,
          "task_vector_dot_product": -0.008236061781644821,
          "weight_space_angle": 0.0034227431751787663,
          "task_vector_magnitude_ratio": -0.0027453883085399866,
          "singular_value_overlap": -0.004708599764853716,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0432722344994545,
          "activation_l2_distance": -0.0048295557498931885,
          "activation_cosine_similarity": 0.055420659482479095,
          "activation_magnitude_ratio": -0.010515935719013214,
          "activation_dot_product": -0.002799175912514329,
          "encoder_gradient_cosine_similarity": 0.013421274721622467,
          "encoder_gradient_l2_distance": -0.11812543123960495,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.009977259673178196,
          "input_gradient_l2_distance": -0.06542235612869263,
          "input_gradient_dot_product": -0.01884566806256771
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7672407833578956,
        "val_r": 0.694737948808521,
        "n_iterations": 344,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010956971906125546,
          "right_subspace_overlap_bottom_k": -0.02134905569255352,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.002760514384135604,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002617676043882966,
          "layerwise_effective_rank_mergeability_score": 0.0033272334840148687,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.011148146353662014,
          "task_vector_dot_product": -0.001641467330045998,
          "weight_space_angle": 0.0011698086746037006,
          "task_vector_magnitude_ratio": -0.007088972255587578,
          "singular_value_overlap": -0.001970464363694191,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01896452158689499,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.03716270625591278,
          "activation_magnitude_ratio": -0.007629943545907736,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.011657814495265484,
          "encoder_gradient_l2_distance": -0.05849822610616684,
          "encoder_gradient_dot_product": 0.0034789785277098417,
          "input_gradient_cosine_similarity": 0.002341381972655654,
          "input_gradient_l2_distance": -0.022054314613342285,
          "input_gradient_dot_product": -0.015032432042062283
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7593474669132819,
        "val_r": 0.47405652992604125,
        "n_iterations": 199,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02914358675479889,
          "right_subspace_overlap_bottom_k": -0.05130339786410332,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.010534006170928478,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0017954312497749925,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.00896418560296297,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001427006209269166,
          "singular_value_overlap": 0.001791550312191248,
          "subspace_overlap": -0.005111257079988718,
          "right_subspace_overlap": 0.014885197393596172,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.04879432171583176,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.00824789609760046,
          "encoder_gradient_cosine_similarity": 0.013881823979318142,
          "encoder_gradient_l2_distance": -0.08276195079088211,
          "encoder_gradient_dot_product": 0.005944330245256424,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0346544124186039,
          "input_gradient_dot_product": -0.017446722835302353
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7251767441814698,
        "val_r": 0.4007056819283984,
        "n_iterations": 234,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.029717929661273956,
          "right_subspace_overlap_bottom_k": -0.08838153630495071,
          "interaction_matrix_overlap_top_k": -0.0063704028725624084,
          "interaction_matrix_overlap_bottom_k": 0.042205363512039185,
          "effective_rank": 0.0015814263606444001,
          "effective_rank_mergeability_score": -0.0012497330317273736,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.004800121299922466,
          "layerwise_effective_rank_mergeability_score": 0.005284859798848629,
          "task_vector_cosine_similarity": -0.0065510887652635574,
          "task_vector_l2_distance": -0.011463101953268051,
          "task_vector_dot_product": -0.0020668848883360624,
          "weight_space_angle": 0.007008402608335018,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.047519076615571976,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.051950011402368546,
          "activation_magnitude_ratio": -0.0066606467589735985,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.016461005434393883,
          "encoder_gradient_l2_distance": -0.10353877395391464,
          "encoder_gradient_dot_product": 0.001282063196413219,
          "input_gradient_cosine_similarity": 0.008467340841889381,
          "input_gradient_l2_distance": -0.029680021107196808,
          "input_gradient_dot_product": -0.0014702052576467395
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7879999094292558,
        "val_r": 0.4923995881630213,
        "n_iterations": 211,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.026570962741971016,
          "right_subspace_overlap_bottom_k": -0.11350882798433304,
          "interaction_matrix_overlap_top_k": 0.0019522549118846655,
          "interaction_matrix_overlap_bottom_k": 0.0957941859960556,
          "effective_rank": -0.004052397795021534,
          "effective_rank_mergeability_score": 0.0043953764252364635,
          "stable_rank": -0.0018002359429374337,
          "spectral_gap": -0.005578138399869204,
          "singular_value_ratio": 0.005948251113295555,
          "layerwise_effective_rank": -0.011634205467998981,
          "layerwise_effective_rank_mergeability_score": 0.009880997240543365,
          "task_vector_cosine_similarity": -0.01328075211495161,
          "task_vector_l2_distance": -0.009790489450097084,
          "task_vector_dot_product": -0.001175945857539773,
          "weight_space_angle": 0.010075841099023819,
          "task_vector_magnitude_ratio": 0.002683551050722599,
          "singular_value_overlap": -0.004370111506432295,
          "subspace_overlap": 0.005141986068338156,
          "right_subspace_overlap": 0.019164353609085083,
          "activation_l2_distance": -0.008361892774701118,
          "activation_cosine_similarity": 0.036754973232746124,
          "activation_magnitude_ratio": -0.00519710686057806,
          "activation_dot_product": -0.0038482979871332645,
          "encoder_gradient_cosine_similarity": 0.012894492596387863,
          "encoder_gradient_l2_distance": -0.06402753293514252,
          "encoder_gradient_dot_product": -0.00239877519197762,
          "input_gradient_cosine_similarity": -0.004183121956884861,
          "input_gradient_l2_distance": -0.0648917704820633,
          "input_gradient_dot_product": -0.018880339339375496
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7325031427338967,
        "val_r": 0.6722600281588205,
        "n_iterations": 277,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.05298300087451935,
          "right_subspace_overlap_bottom_k": -0.09465579688549042,
          "interaction_matrix_overlap_top_k": 0.013231230899691582,
          "interaction_matrix_overlap_bottom_k": 0.015593448653817177,
          "effective_rank": -0.0023325986694544554,
          "effective_rank_mergeability_score": 0.0018730657175183296,
          "stable_rank": -0.005382461939007044,
          "spectral_gap": -0.0021816191729158163,
          "singular_value_ratio": 0.002254724968224764,
          "layerwise_effective_rank": -0.010796762071549892,
          "layerwise_effective_rank_mergeability_score": 0.007280681282281876,
          "task_vector_cosine_similarity": -0.012961158528923988,
          "task_vector_l2_distance": -0.04852066561579704,
          "task_vector_dot_product": -0.011754799634218216,
          "weight_space_angle": 0.00863021332770586,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.003727172501385212,
          "subspace_overlap": 0.024866655468940735,
          "right_subspace_overlap": 0.043711934238672256,
          "activation_l2_distance": -0.003942635841667652,
          "activation_cosine_similarity": -0.009992583654820919,
          "activation_magnitude_ratio": -0.005194155033677816,
          "activation_dot_product": -0.03511252999305725,
          "encoder_gradient_cosine_similarity": 0.030196048319339752,
          "encoder_gradient_l2_distance": -0.2027202993631363,
          "encoder_gradient_dot_product": 0.002258818596601486,
          "input_gradient_cosine_similarity": 0.001095376443117857,
          "input_gradient_l2_distance": -0.19505415856838226,
          "input_gradient_dot_product": -0.005770937539637089
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7612540281827133,
        "val_r": 0.13155199903587705,
        "n_iterations": 374,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0277336947619915,
          "right_subspace_overlap_bottom_k": -0.03984960913658142,
          "interaction_matrix_overlap_top_k": 0.0015954046975821257,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": -0.004160797689110041,
          "effective_rank_mergeability_score": 0.004156691022217274,
          "stable_rank": -0.006893024779856205,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0048393611796200275,
          "task_vector_l2_distance": -0.029415201395750046,
          "task_vector_dot_product": -0.0014818175695836544,
          "weight_space_angle": 0.0033223829232156277,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.016199974343180656,
          "activation_l2_distance": -0.0424179807305336,
          "activation_cosine_similarity": 0.0840558186173439,
          "activation_magnitude_ratio": -0.017491253092885017,
          "activation_dot_product": 0.015904497355222702,
          "encoder_gradient_cosine_similarity": 0.004408098757266998,
          "encoder_gradient_l2_distance": -0.16423176229000092,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0019170191371813416,
          "input_gradient_l2_distance": -0.08290726691484451,
          "input_gradient_dot_product": -0.0018826590385288
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7699752264749276,
        "val_r": 0.7601111949101101,
        "n_iterations": 308,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.03357455134391785,
          "right_subspace_overlap_bottom_k": -0.04372955858707428,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.013848300091922283,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.018172377720475197,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0010138292564079165,
          "weight_space_angle": 0.013479300774633884,
          "task_vector_magnitude_ratio": -0.002785195829346776,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01811271905899048,
          "activation_l2_distance": 0.00231162179261446,
          "activation_cosine_similarity": 0.030282320454716682,
          "activation_magnitude_ratio": -0.005398460663855076,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.007077499758452177,
          "encoder_gradient_l2_distance": -0.04971189424395561,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003309789579361677,
          "input_gradient_l2_distance": -0.027167823165655136,
          "input_gradient_dot_product": -0.011122659780085087
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7773408845704335,
        "val_r": 0.7475871195665628,
        "n_iterations": 343,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01256369985640049,
          "right_subspace_overlap_bottom_k": -0.036225996911525726,
          "interaction_matrix_overlap_top_k": -0.004748607985675335,
          "interaction_matrix_overlap_bottom_k": 0.027687974274158478,
          "effective_rank": 0.003144696820527315,
          "effective_rank_mergeability_score": -0.0032612099312245846,
          "stable_rank": 0.0011162005830556154,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002378955250605941,
          "layerwise_effective_rank_mergeability_score": 0.0028943896759301424,
          "task_vector_cosine_similarity": 0.010298074223101139,
          "task_vector_l2_distance": 0.0010877042077481747,
          "task_vector_dot_product": -0.0010162054095417261,
          "weight_space_angle": -0.007144753821194172,
          "task_vector_magnitude_ratio": -0.0019066762179136276,
          "singular_value_overlap": -0.0011637624120339751,
          "subspace_overlap": -0.014651929028332233,
          "right_subspace_overlap": 0.006183967925608158,
          "activation_l2_distance": 0.014610028825700283,
          "activation_cosine_similarity": 0.027826718986034393,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.005909517407417297,
          "encoder_gradient_cosine_similarity": 0.004299367778003216,
          "encoder_gradient_l2_distance": -0.020214274525642395,
          "encoder_gradient_dot_product": 0.0029658132698386908,
          "input_gradient_cosine_similarity": 0.0022488594986498356,
          "input_gradient_l2_distance": -0.013594177551567554,
          "input_gradient_dot_product": -0.007552890572696924
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7862167675915087,
        "val_r": 0.8354350526542047,
        "n_iterations": 310,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005805536638945341,
          "right_subspace_overlap_bottom_k": -0.08126701414585114,
          "interaction_matrix_overlap_top_k": -0.018590833991765976,
          "interaction_matrix_overlap_bottom_k": 0.06915830820798874,
          "effective_rank": 0.0020484765991568565,
          "effective_rank_mergeability_score": -0.0020280955359339714,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003525514155626297,
          "layerwise_effective_rank_mergeability_score": 0.004164821468293667,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.002479403745383024,
          "task_vector_dot_product": -0.0029035729821771383,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0015731846215203404,
          "singular_value_overlap": -0.0030459295958280563,
          "subspace_overlap": -0.00804264284670353,
          "right_subspace_overlap": 0.02720821090042591,
          "activation_l2_distance": -0.002322496846318245,
          "activation_cosine_similarity": 0.015887344256043434,
          "activation_magnitude_ratio": -0.0013211292680352926,
          "activation_dot_product": -0.001857072813436389,
          "encoder_gradient_cosine_similarity": 0.001944027841091156,
          "encoder_gradient_l2_distance": -0.0246804878115654,
          "encoder_gradient_dot_product": 0.003198331920430064,
          "input_gradient_cosine_similarity": 0.00348869152367115,
          "input_gradient_l2_distance": -0.017448030412197113,
          "input_gradient_dot_product": -0.009021556936204433
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7516788439172457,
        "val_r": 0.7786263782745523,
        "n_iterations": 367,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04413336515426636,
          "right_subspace_overlap_bottom_k": -0.09365377575159073,
          "interaction_matrix_overlap_top_k": 0.002573369536548853,
          "interaction_matrix_overlap_bottom_k": 0.031086774542927742,
          "effective_rank": -0.0014635021798312664,
          "effective_rank_mergeability_score": 0.001291027758270502,
          "stable_rank": -0.006190955173224211,
          "spectral_gap": -0.001305636134929955,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.00346294860355556,
          "layerwise_effective_rank_mergeability_score": 0.003992508165538311,
          "task_vector_cosine_similarity": -0.014368738047778606,
          "task_vector_l2_distance": -0.016118623316287994,
          "task_vector_dot_product": -0.007565611507743597,
          "weight_space_angle": 0.013331414200365543,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0011057580122724175,
          "right_subspace_overlap": 0.042337752878665924,
          "activation_l2_distance": -0.027731886133551598,
          "activation_cosine_similarity": 0.047363393008708954,
          "activation_magnitude_ratio": -0.01226906105875969,
          "activation_dot_product": 0.009786522015929222,
          "encoder_gradient_cosine_similarity": 0.015368395484983921,
          "encoder_gradient_l2_distance": -0.12407097965478897,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.006123395636677742,
          "input_gradient_l2_distance": -0.10038696229457855,
          "input_gradient_dot_product": -0.010163746774196625
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7966764106427189,
        "val_r": 0.5885795273992257,
        "n_iterations": 265,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01703852042555809,
          "right_subspace_overlap_bottom_k": -0.04517157003283501,
          "interaction_matrix_overlap_top_k": -0.0011152776423841715,
          "interaction_matrix_overlap_bottom_k": 0.016794821247458458,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.002666841959580779,
          "spectral_gap": 0.0012498018331825733,
          "singular_value_ratio": -0.0012750059831887484,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.007109799422323704,
          "task_vector_l2_distance": -0.01630881242454052,
          "task_vector_dot_product": -0.0013742026640102267,
          "weight_space_angle": 0.007298558950424194,
          "task_vector_magnitude_ratio": -0.001970083685591817,
          "singular_value_overlap": 0.012371108867228031,
          "subspace_overlap": -0.009248425252735615,
          "right_subspace_overlap": 0.0307697094976902,
          "activation_l2_distance": 0.021070826798677444,
          "activation_cosine_similarity": 0.04413408413529396,
          "activation_magnitude_ratio": -0.00698558334261179,
          "activation_dot_product": -0.00418336596339941,
          "encoder_gradient_cosine_similarity": 0.007104190066456795,
          "encoder_gradient_l2_distance": -0.06706098467111588,
          "encoder_gradient_dot_product": 0.0033569163642823696,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.027307143434882164,
          "input_gradient_dot_product": -0.018552590161561966
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7700989354669148,
        "val_r": 0.7264544118899119,
        "n_iterations": 209,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02951524406671524,
          "right_subspace_overlap_bottom_k": -0.06613843142986298,
          "interaction_matrix_overlap_top_k": -0.0059266285970807076,
          "interaction_matrix_overlap_bottom_k": 0.0376201793551445,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003083884483203292,
          "layerwise_effective_rank_mergeability_score": 0.0024275570176541805,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.013288903050124645,
          "weight_space_angle": 0.00106092169880867,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.002760234521701932,
          "right_subspace_overlap": 0.020111996680498123,
          "activation_l2_distance": 0.0013279297854751348,
          "activation_cosine_similarity": 0.03715701773762703,
          "activation_magnitude_ratio": -0.008242611773312092,
          "activation_dot_product": -0.0051318565383553505,
          "encoder_gradient_cosine_similarity": 0.008660205639898777,
          "encoder_gradient_l2_distance": -0.05860868841409683,
          "encoder_gradient_dot_product": 0.0016630749450996518,
          "input_gradient_cosine_similarity": 0.003591675776988268,
          "input_gradient_l2_distance": -0.03070850670337677,
          "input_gradient_dot_product": -0.012892511673271656
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6887016438909406,
        "val_r": 0.5752578981795348,
        "n_iterations": 311,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.019681889563798904,
          "right_subspace_overlap_bottom_k": -0.06576503813266754,
          "interaction_matrix_overlap_top_k": 0.009929347783327103,
          "interaction_matrix_overlap_bottom_k": -0.010653499513864517,
          "effective_rank": -0.00842874776571989,
          "effective_rank_mergeability_score": 0.008589597418904305,
          "stable_rank": -0.011210188269615173,
          "spectral_gap": 0.006168973632156849,
          "singular_value_ratio": -0.006723667029291391,
          "layerwise_effective_rank": -0.015829946845769882,
          "layerwise_effective_rank_mergeability_score": 0.016456186771392822,
          "task_vector_cosine_similarity": 0.011813743971288204,
          "task_vector_l2_distance": -0.018275419250130653,
          "task_vector_dot_product": 0.0017395932227373123,
          "weight_space_angle": -0.010151093825697899,
          "task_vector_magnitude_ratio": -0.0064336690120399,
          "singular_value_overlap": 0.01000874862074852,
          "subspace_overlap": 0.011342315934598446,
          "right_subspace_overlap": 0.0359213761985302,
          "activation_l2_distance": -0.006908504758030176,
          "activation_cosine_similarity": 0.04818959906697273,
          "activation_magnitude_ratio": -0.020413251593708992,
          "activation_dot_product": 0.07476352900266647,
          "encoder_gradient_cosine_similarity": 0.02718469314277172,
          "encoder_gradient_l2_distance": -0.10277704894542694,
          "encoder_gradient_dot_product": 0.023677153512835503,
          "input_gradient_cosine_similarity": 0.019752154126763344,
          "input_gradient_l2_distance": -0.11616577953100204,
          "input_gradient_dot_product": -0.07384951412677765
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8088315716570929,
        "val_r": 0.4021642617530026,
        "n_iterations": 221,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.034528449177742004,
          "right_subspace_overlap_bottom_k": -0.08009927719831467,
          "interaction_matrix_overlap_top_k": -0.004224625416100025,
          "interaction_matrix_overlap_bottom_k": 0.06077336519956589,
          "effective_rank": 0.0033284667879343033,
          "effective_rank_mergeability_score": -0.003977722488343716,
          "stable_rank": -0.0018428363837301731,
          "spectral_gap": -0.0019571881275624037,
          "singular_value_ratio": 0.002145215170457959,
          "layerwise_effective_rank": -0.012278610840439796,
          "layerwise_effective_rank_mergeability_score": 0.004186834674328566,
          "task_vector_cosine_similarity": -0.010419966652989388,
          "task_vector_l2_distance": -0.007750289980322123,
          "task_vector_dot_product": -0.0010853213025256991,
          "weight_space_angle": 0.006198554299771786,
          "task_vector_magnitude_ratio": 0.0021137166768312454,
          "singular_value_overlap": 0.005771576426923275,
          "subspace_overlap": -0.0030728632118552923,
          "right_subspace_overlap": 0.00801078975200653,
          "activation_l2_distance": 0.0012175976298749447,
          "activation_cosine_similarity": 0.02330736815929413,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.015850931406021118,
          "encoder_gradient_cosine_similarity": 0.007734691258519888,
          "encoder_gradient_l2_distance": -0.0542776845395565,
          "encoder_gradient_dot_product": 0.0034997197799384594,
          "input_gradient_cosine_similarity": 0.0016097044572234154,
          "input_gradient_l2_distance": -0.03743886947631836,
          "input_gradient_dot_product": -0.009202555753290653
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8273009013830684,
        "val_r": 0.7189386757677257,
        "n_iterations": 459,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.007811649702489376,
          "right_subspace_overlap_bottom_k": -0.006239260081201792,
          "interaction_matrix_overlap_top_k": -0.003976557403802872,
          "interaction_matrix_overlap_bottom_k": 0.002259117318317294,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.003784013446420431,
          "singular_value_ratio": -0.0037821370642632246,
          "layerwise_effective_rank": -0.0031902361661195755,
          "layerwise_effective_rank_mergeability_score": 0.0038877439219504595,
          "task_vector_cosine_similarity": 0.001760896178893745,
          "task_vector_l2_distance": -0.06190451979637146,
          "task_vector_dot_product": 0.001974965911358595,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.006349490024149418,
          "singular_value_overlap": -0.0029022283852100372,
          "subspace_overlap": 0.001906869001686573,
          "right_subspace_overlap": -0.010746454820036888,
          "activation_l2_distance": 0.0013813512632623315,
          "activation_cosine_similarity": 0.030038706958293915,
          "activation_magnitude_ratio": -0.005343569442629814,
          "activation_dot_product": 0.0686434656381607,
          "encoder_gradient_cosine_similarity": 0.003077686997130513,
          "encoder_gradient_l2_distance": -0.12710370123386383,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0022429446689784527,
          "input_gradient_l2_distance": -0.1056857705116272,
          "input_gradient_dot_product": -0.013423141092061996
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_r": 0.3911569467644164,
      "train_p": 2.7801838480791395e-118,
      "val_r": -0.05378638247523405,
      "val_p": 0.3101717083869684
    },
    "per_fold_stats": {
      "train_r_mean": 0.6067059645344435,
      "train_r_std": 0.059091197810535755,
      "val_r_mean": 0.47831982843692933,
      "val_r_std": 0.16561817884569371,
      "n_nonzero_mean": 23.15,
      "n_nonzero_std": 3.004579837514723
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.00981130637228489,
      "right_subspace_overlap_bottom_k": -0.013489723205566406,
      "interaction_matrix_overlap_top_k": 0.000632117036730051,
      "interaction_matrix_overlap_bottom_k": 0.05698845908045769,
      "effective_rank": -0.0023472930770367384,
      "effective_rank_mergeability_score": 0.002166495192795992,
      "stable_rank": -0.002921773586422205,
      "spectral_gap": 0.000522012822329998,
      "singular_value_ratio": -0.0006755044450983405,
      "layerwise_effective_rank": -0.00040010566590353847,
      "layerwise_effective_rank_mergeability_score": 0.0007460342603735626,
      "task_vector_cosine_similarity": -0.0022719050757586956,
      "task_vector_l2_distance": -0.04810795933008194,
      "task_vector_dot_product": -0.002098564989864826,
      "weight_space_angle": 0.0023016647901386023,
      "task_vector_magnitude_ratio": -0.011253916658461094,
      "singular_value_overlap": -0.0339774489402771,
      "subspace_overlap": 0.008511914871633053,
      "right_subspace_overlap": 0.010036087594926357,
      "activation_l2_distance": 9.106225479627028e-05,
      "activation_cosine_similarity": 0.009381154552102089,
      "activation_magnitude_ratio": -0.008931493386626244,
      "activation_dot_product": 0.011531488038599491,
      "encoder_gradient_cosine_similarity": 0.005572055000811815,
      "encoder_gradient_l2_distance": -0.06421003490686417,
      "encoder_gradient_dot_product": 0.005697900895029306,
      "input_gradient_cosine_similarity": 0.003183626336976886,
      "input_gradient_l2_distance": -0.06095961481332779,
      "input_gradient_dot_product": -0.02310163527727127
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.013322144746780396,
      "right_subspace_overlap_bottom_k": 0.01761561445891857,
      "interaction_matrix_overlap_top_k": 0.01141596119850874,
      "interaction_matrix_overlap_bottom_k": 0.022986769676208496,
      "effective_rank": 0.0032653133384883404,
      "effective_rank_mergeability_score": 0.0022738156840205193,
      "stable_rank": 0.0036193944979459047,
      "spectral_gap": 0.001850150991231203,
      "singular_value_ratio": 0.001749534043483436,
      "layerwise_effective_rank": 0.004254015628248453,
      "layerwise_effective_rank_mergeability_score": 0.003520891536027193,
      "task_vector_cosine_similarity": 0.009062557481229305,
      "task_vector_l2_distance": 0.024330006912350655,
      "task_vector_dot_product": 0.010543761774897575,
      "weight_space_angle": 0.00911787897348404,
      "task_vector_magnitude_ratio": 0.006031245458871126,
      "singular_value_overlap": 0.0195195022970438,
      "subspace_overlap": 0.008922035805881023,
      "right_subspace_overlap": 0.01286387536674738,
      "activation_l2_distance": 0.010175001807510853,
      "activation_cosine_similarity": 0.011034545488655567,
      "activation_magnitude_ratio": 0.007011127192527056,
      "activation_dot_product": 0.025531131774187088,
      "encoder_gradient_cosine_similarity": 0.00718772504478693,
      "encoder_gradient_l2_distance": 0.038600217550992966,
      "encoder_gradient_dot_product": 0.006412499584257603,
      "input_gradient_cosine_similarity": 0.004397028591483831,
      "input_gradient_l2_distance": 0.03746887668967247,
      "input_gradient_dot_product": 0.020608363673090935
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.9,
      "right_subspace_overlap_bottom_k": 0.95,
      "interaction_matrix_overlap_top_k": 0.7,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.6,
      "effective_rank_mergeability_score": 0.65,
      "stable_rank": 0.6,
      "spectral_gap": 0.65,
      "singular_value_ratio": 0.5,
      "layerwise_effective_rank": 0.3,
      "layerwise_effective_rank_mergeability_score": 0.3,
      "task_vector_cosine_similarity": 0.7,
      "task_vector_l2_distance": 1.0,
      "task_vector_dot_product": 0.85,
      "weight_space_angle": 0.7,
      "task_vector_magnitude_ratio": 0.95,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.7,
      "right_subspace_overlap": 0.95,
      "activation_l2_distance": 0.85,
      "activation_cosine_similarity": 0.95,
      "activation_magnitude_ratio": 0.95,
      "activation_dot_product": 0.9,
      "encoder_gradient_cosine_similarity": 0.85,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.8,
      "input_gradient_cosine_similarity": 0.85,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 1.0
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6398428718802955,
        "val_r": 0.625189258635213,
        "n_iterations": 278,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0011107976315543056,
          "right_subspace_overlap_bottom_k": 0.008589335717260838,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.08726958930492401,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0038268868811428547,
          "stable_rank": 0.0,
          "spectral_gap": 0.0032725450582802296,
          "singular_value_ratio": -0.0032649007625877857,
          "layerwise_effective_rank": 0.012673968449234962,
          "layerwise_effective_rank_mergeability_score": -0.004728790372610092,
          "task_vector_cosine_similarity": -0.003011570777744055,
          "task_vector_l2_distance": -0.07513544708490372,
          "task_vector_dot_product": -0.011218334548175335,
          "weight_space_angle": 0.004182769916951656,
          "task_vector_magnitude_ratio": -0.020300354808568954,
          "singular_value_overlap": -0.059035900980234146,
          "subspace_overlap": 0.02354365773499012,
          "right_subspace_overlap": 0.0038467689882963896,
          "activation_l2_distance": 0.008914357051253319,
          "activation_cosine_similarity": 0.018960287794470787,
          "activation_magnitude_ratio": -0.020969416946172714,
          "activation_dot_product": 0.0023681744933128357,
          "encoder_gradient_cosine_similarity": 0.0010559405200183392,
          "encoder_gradient_l2_distance": -0.0834868848323822,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.06925777345895767,
          "input_gradient_dot_product": -0.026176419109106064
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6062433820910322,
        "val_r": 0.5269652117721659,
        "n_iterations": 214,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0034338454715907574,
          "right_subspace_overlap_bottom_k": -0.016718847677111626,
          "interaction_matrix_overlap_top_k": -0.0013427194207906723,
          "interaction_matrix_overlap_bottom_k": 0.05038980767130852,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0018441778374835849,
          "stable_rank": 0.0,
          "spectral_gap": -0.0017790067940950394,
          "singular_value_ratio": 0.0022365287877619267,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02947762981057167,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.01377051044255495,
          "singular_value_overlap": -0.018689801916480064,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0032757034059613943,
          "activation_l2_distance": 0.004876673221588135,
          "activation_cosine_similarity": 0.0029446410480886698,
          "activation_magnitude_ratio": -0.004253655672073364,
          "activation_dot_product": 0.008281907998025417,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03605343773961067,
          "encoder_gradient_dot_product": 0.004793229978531599,
          "input_gradient_cosine_similarity": 0.0037995039019733667,
          "input_gradient_l2_distance": -0.028814662247896194,
          "input_gradient_dot_product": -0.00688762916252017
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6125844339039015,
        "val_r": 0.5258198139558772,
        "n_iterations": 376,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004178992006927729,
          "right_subspace_overlap_bottom_k": -0.01773279905319214,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.04536595195531845,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0021585715003311634,
          "singular_value_ratio": 0.0016282895812764764,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.024011921137571335,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.012498323805630207,
          "singular_value_overlap": -0.01799972914159298,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005474657751619816,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0014019202208146453,
          "activation_magnitude_ratio": -0.005678580142557621,
          "activation_dot_product": 0.004334168042987585,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.026540549471974373,
          "encoder_gradient_dot_product": 0.0021663750521838665,
          "input_gradient_cosine_similarity": 0.003697680775076151,
          "input_gradient_l2_distance": -0.02613353729248047,
          "input_gradient_dot_product": -0.00924925971776247
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5996668240326422,
        "val_r": 0.4579671147280855,
        "n_iterations": 258,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0052794599905610085,
          "right_subspace_overlap_bottom_k": -0.0072654676623642445,
          "interaction_matrix_overlap_top_k": -0.0013418326852843165,
          "interaction_matrix_overlap_bottom_k": 0.06921649724245071,
          "effective_rank": -0.0019787787459790707,
          "effective_rank_mergeability_score": 0.0022371397353708744,
          "stable_rank": -0.00125157053116709,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.05275386571884155,
          "task_vector_dot_product": 0.006237474735826254,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.017219865694642067,
          "singular_value_overlap": -0.03906045854091644,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0059138513170182705,
          "activation_l2_distance": 0.00510860001668334,
          "activation_cosine_similarity": 0.0024792838376015425,
          "activation_magnitude_ratio": -0.012976198457181454,
          "activation_dot_product": 0.01441480964422226,
          "encoder_gradient_cosine_similarity": 0.0029159903060644865,
          "encoder_gradient_l2_distance": -0.05195820331573486,
          "encoder_gradient_dot_product": 0.0016664748545736074,
          "input_gradient_cosine_similarity": 0.005915921181440353,
          "input_gradient_l2_distance": -0.04879796504974365,
          "input_gradient_dot_product": -0.016483644023537636
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6106349837778355,
        "val_r": 0.7105157638364187,
        "n_iterations": 458,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.026741672307252884,
          "right_subspace_overlap_bottom_k": -0.028193358331918716,
          "interaction_matrix_overlap_top_k": 0.013435512781143188,
          "interaction_matrix_overlap_bottom_k": 0.07799048721790314,
          "effective_rank": -0.003943503834307194,
          "effective_rank_mergeability_score": 0.002738300245255232,
          "stable_rank": -0.004991042427718639,
          "spectral_gap": 0.004635652527213097,
          "singular_value_ratio": -0.00532064912840724,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.01530864741653204,
          "task_vector_l2_distance": -0.07875968515872955,
          "task_vector_dot_product": -0.02497737482190132,
          "weight_space_angle": 0.015645360574126244,
          "task_vector_magnitude_ratio": -0.009070578962564468,
          "singular_value_overlap": -0.06627552211284637,
          "subspace_overlap": 0.015902256593108177,
          "right_subspace_overlap": 0.026677614077925682,
          "activation_l2_distance": -0.016524767503142357,
          "activation_cosine_similarity": 0.016840150579810143,
          "activation_magnitude_ratio": -0.004844036418944597,
          "activation_dot_product": -0.007376601919531822,
          "encoder_gradient_cosine_similarity": 0.0020709398668259382,
          "encoder_gradient_l2_distance": -0.10089460015296936,
          "encoder_gradient_dot_product": 0.01523846760392189,
          "input_gradient_cosine_similarity": 0.014624240808188915,
          "input_gradient_l2_distance": -0.11439503729343414,
          "input_gradient_dot_product": -0.05392727628350258
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.6092990055969375,
        "val_r": 0.6868596364869748,
        "n_iterations": 420,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0034008468501269817,
          "interaction_matrix_overlap_top_k": 0.0021571277175098658,
          "interaction_matrix_overlap_bottom_k": 0.08245660364627838,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0027289472054690123,
          "singular_value_ratio": -0.0020415715407580137,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010568134021013975,
          "task_vector_l2_distance": -0.07655006647109985,
          "task_vector_dot_product": 0.007760824169963598,
          "weight_space_angle": -0.0023801608476787806,
          "task_vector_magnitude_ratio": -0.019951077178120613,
          "singular_value_overlap": -0.04943167790770531,
          "subspace_overlap": 0.0022104063536971807,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0010130270384252071,
          "activation_cosine_similarity": 0.007242802530527115,
          "activation_magnitude_ratio": -0.012894172221422195,
          "activation_dot_product": 0.013103948906064034,
          "encoder_gradient_cosine_similarity": 0.009087005630135536,
          "encoder_gradient_l2_distance": -0.07630158960819244,
          "encoder_gradient_dot_product": 0.0027565956115722656,
          "input_gradient_cosine_similarity": 0.0025834026746451855,
          "input_gradient_l2_distance": -0.04763578623533249,
          "input_gradient_dot_product": -0.023349478840827942
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.60336474064021,
        "val_r": 0.16603965936322065,
        "n_iterations": 309,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007004874292761087,
          "right_subspace_overlap_bottom_k": -0.003321294905617833,
          "interaction_matrix_overlap_top_k": 0.0014224023325368762,
          "interaction_matrix_overlap_bottom_k": 0.06340597569942474,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0018589487299323082,
          "stable_rank": -0.0019852707628160715,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0028577386401593685,
          "task_vector_l2_distance": -0.05382581055164337,
          "task_vector_dot_product": -0.01809101738035679,
          "weight_space_angle": 0.0023538446985185146,
          "task_vector_magnitude_ratio": -0.015321850776672363,
          "singular_value_overlap": -0.03431367501616478,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005979879759252071,
          "activation_l2_distance": -0.00706833228468895,
          "activation_cosine_similarity": 0.00919091422110796,
          "activation_magnitude_ratio": 0.0031077226158231497,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.006592004559934139,
          "encoder_gradient_l2_distance": -0.09211142361164093,
          "encoder_gradient_dot_product": 0.00991649180650711,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.06258735805749893,
          "input_gradient_dot_product": -0.02125726453959942
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5498470859714379,
        "val_r": 0.25550961608451206,
        "n_iterations": 306,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012976303696632385,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.001471338327974081,
          "interaction_matrix_overlap_bottom_k": 0.08889015763998032,
          "effective_rank": -0.0011192288948222995,
          "effective_rank_mergeability_score": 0.0011211292585358024,
          "stable_rank": 0.0,
          "spectral_gap": 0.0015595178119838238,
          "singular_value_ratio": -0.001632897648960352,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.09230254590511322,
          "task_vector_dot_product": -0.012363167479634285,
          "weight_space_angle": 0.0015733762411400676,
          "task_vector_magnitude_ratio": -0.018510568886995316,
          "singular_value_overlap": -0.054430898278951645,
          "subspace_overlap": 0.01668565720319748,
          "right_subspace_overlap": 0.01026005856692791,
          "activation_l2_distance": 0.005376099143177271,
          "activation_cosine_similarity": 0.01615457981824875,
          "activation_magnitude_ratio": -0.01547282561659813,
          "activation_dot_product": 0.005073400214314461,
          "encoder_gradient_cosine_similarity": 0.010760113596916199,
          "encoder_gradient_l2_distance": -0.09289952367544174,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.008284317329525948,
          "input_gradient_l2_distance": -0.04439061880111694,
          "input_gradient_dot_product": -0.0012164392974227667
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.6143524939318445,
        "val_r": 0.35891399497258436,
        "n_iterations": 284,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.001732149627059698,
          "right_subspace_overlap_bottom_k": -0.021865949034690857,
          "interaction_matrix_overlap_top_k": -0.0011141316499561071,
          "interaction_matrix_overlap_bottom_k": 0.06040804460644722,
          "effective_rank": -0.012149283662438393,
          "effective_rank_mergeability_score": 0.0052102431654930115,
          "stable_rank": -0.001934948144480586,
          "spectral_gap": -0.0010021049529314041,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.03728557750582695,
          "task_vector_dot_product": 0.003642738563939929,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.02699718251824379,
          "subspace_overlap": 0.0016683894209563732,
          "right_subspace_overlap": 0.0038043824024498463,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.008993136696517467,
          "activation_magnitude_ratio": -0.007685475051403046,
          "activation_dot_product": 0.0015404806472361088,
          "encoder_gradient_cosine_similarity": 0.006451454944908619,
          "encoder_gradient_l2_distance": -0.03396864980459213,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.001158884959295392,
          "input_gradient_l2_distance": -0.04575560614466667,
          "input_gradient_dot_product": -0.016484055668115616
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.601876379555681,
        "val_r": 0.2590121672205592,
        "n_iterations": 428,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02526537887752056,
          "right_subspace_overlap_bottom_k": -0.01524187158793211,
          "interaction_matrix_overlap_top_k": 0.00195913203060627,
          "interaction_matrix_overlap_bottom_k": 0.06370864063501358,
          "effective_rank": -0.002411983907222748,
          "effective_rank_mergeability_score": 0.002448116894811392,
          "stable_rank": -0.004377003759145737,
          "spectral_gap": 0.0017064145067706704,
          "singular_value_ratio": -0.0016588084399700165,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.014597427099943161,
          "task_vector_l2_distance": -0.06199321523308754,
          "task_vector_dot_product": -0.01794395223259926,
          "weight_space_angle": 0.009931963868439198,
          "task_vector_magnitude_ratio": -0.010486888699233532,
          "singular_value_overlap": -0.05387226864695549,
          "subspace_overlap": 0.02610713243484497,
          "right_subspace_overlap": 0.021433861926198006,
          "activation_l2_distance": -0.02433599904179573,
          "activation_cosine_similarity": -0.020052608102560043,
          "activation_magnitude_ratio": -0.00959934014827013,
          "activation_dot_product": -0.018088290467858315,
          "encoder_gradient_cosine_similarity": 0.010495977476239204,
          "encoder_gradient_l2_distance": -0.08403213322162628,
          "encoder_gradient_dot_product": 0.01923760026693344,
          "input_gradient_cosine_similarity": -0.007466324605047703,
          "input_gradient_l2_distance": -0.0972338393330574,
          "input_gradient_dot_product": -0.027171682566404343
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.47500096919053436,
        "val_r": 0.2585524924171298,
        "n_iterations": 215,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.018023476004600525,
          "interaction_matrix_overlap_top_k": -0.0026581408455967903,
          "interaction_matrix_overlap_bottom_k": 0.03594452887773514,
          "effective_rank": -0.005217256024479866,
          "effective_rank_mergeability_score": 0.0037434077821671963,
          "stable_rank": -0.012658790685236454,
          "spectral_gap": 0.0016286354511976242,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0016768146306276321,
          "task_vector_cosine_similarity": -0.0025359478313475847,
          "task_vector_l2_distance": -0.02039831317961216,
          "task_vector_dot_product": 0.0013341712765395641,
          "weight_space_angle": 0.003936382941901684,
          "task_vector_magnitude_ratio": -0.00706237368285656,
          "singular_value_overlap": -0.016453273594379425,
          "subspace_overlap": 0.0019849601667374372,
          "right_subspace_overlap": 0.0017743106000125408,
          "activation_l2_distance": -0.003076755441725254,
          "activation_cosine_similarity": 0.007587703410536051,
          "activation_magnitude_ratio": -0.0072723859921097755,
          "activation_dot_product": 0.007152827922254801,
          "encoder_gradient_cosine_similarity": 0.002074931049719453,
          "encoder_gradient_l2_distance": -0.02472735196352005,
          "encoder_gradient_dot_product": 0.0027652704156935215,
          "input_gradient_cosine_similarity": 0.0053379167802631855,
          "input_gradient_l2_distance": -0.022810395807027817,
          "input_gradient_dot_product": -0.012545057572424412
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5882665165797416,
        "val_r": 0.4926088523899991,
        "n_iterations": 359,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002080457052215934,
          "right_subspace_overlap_bottom_k": -0.00555296940729022,
          "interaction_matrix_overlap_top_k": 0.004739504307508469,
          "interaction_matrix_overlap_bottom_k": 0.07013123482465744,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.004088812042027712,
          "task_vector_l2_distance": -0.05654565244913101,
          "task_vector_dot_product": 0.0013837250880897045,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.012574865482747555,
          "singular_value_overlap": -0.041550688445568085,
          "subspace_overlap": 0.009631596505641937,
          "right_subspace_overlap": 0.0017074828501790762,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.014673592522740364,
          "activation_magnitude_ratio": -0.014526525512337685,
          "activation_dot_product": 0.00422904547303915,
          "encoder_gradient_cosine_similarity": 0.0011060707038268447,
          "encoder_gradient_l2_distance": -0.07432599365711212,
          "encoder_gradient_dot_product": 0.0023841536603868008,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0680486336350441,
          "input_gradient_dot_product": -0.017847873270511627
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5114904016426023,
        "val_r": 0.534033909096285,
        "n_iterations": 571,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014457223936915398,
          "right_subspace_overlap_bottom_k": -0.031479138880968094,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.05238265544176102,
          "effective_rank": -0.0011614044196903706,
          "effective_rank_mergeability_score": 0.0011085058795288205,
          "stable_rank": -0.0017524058930575848,
          "spectral_gap": -0.0016460366314277053,
          "singular_value_ratio": 0.0014103814028203487,
          "layerwise_effective_rank": -0.0019128703279420733,
          "layerwise_effective_rank_mergeability_score": 0.0011174161918461323,
          "task_vector_cosine_similarity": 0.02992950938642025,
          "task_vector_l2_distance": -0.013590855523943901,
          "task_vector_dot_product": 0.010801976546645164,
          "weight_space_angle": -0.029850659891963005,
          "task_vector_magnitude_ratio": -0.015122683718800545,
          "singular_value_overlap": -0.029834870249032974,
          "subspace_overlap": 0.012292344123125076,
          "right_subspace_overlap": 0.014029677025973797,
          "activation_l2_distance": -0.004342599306255579,
          "activation_cosine_similarity": 0.022684941068291664,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.020044924691319466,
          "encoder_gradient_cosine_similarity": 0.022492483258247375,
          "encoder_gradient_l2_distance": -0.044156499207019806,
          "encoder_gradient_dot_product": 0.01953602209687233,
          "input_gradient_cosine_similarity": 0.006513036787509918,
          "input_gradient_l2_distance": -0.058810461312532425,
          "input_gradient_dot_product": -0.04850469157099724
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5980818461482318,
        "val_r": 0.7417257851836587,
        "n_iterations": 303,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01716560870409012,
          "right_subspace_overlap_bottom_k": 0.0011459961533546448,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.07668864727020264,
          "effective_rank": -0.003160810796543956,
          "effective_rank_mergeability_score": 0.004017347935587168,
          "stable_rank": -0.004798769485205412,
          "spectral_gap": 0.0019097782205790281,
          "singular_value_ratio": -0.002823619870468974,
          "layerwise_effective_rank": -0.001769729540683329,
          "layerwise_effective_rank_mergeability_score": 0.0021860874257981777,
          "task_vector_cosine_similarity": -0.007483283989131451,
          "task_vector_l2_distance": -0.08827012032270432,
          "task_vector_dot_product": 0.001496435608714819,
          "weight_space_angle": 0.006364630069583654,
          "task_vector_magnitude_ratio": -0.01349311601370573,
          "singular_value_overlap": -0.069808728992939,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.020792830735445023,
          "activation_l2_distance": 0.003031593980267644,
          "activation_cosine_similarity": 0.015879681333899498,
          "activation_magnitude_ratio": -0.015187614597380161,
          "activation_dot_product": 0.00881805457174778,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.10542257875204086,
          "encoder_gradient_dot_product": 0.0012868113117292523,
          "input_gradient_cosine_similarity": 0.0037429826334118843,
          "input_gradient_l2_distance": -0.10166376084089279,
          "input_gradient_dot_product": -0.03137421980500221
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5694912503427552,
        "val_r": 0.6259882450917377,
        "n_iterations": 402,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01580440066754818,
          "right_subspace_overlap_bottom_k": -0.022355925291776657,
          "interaction_matrix_overlap_top_k": 0.0019255302613601089,
          "interaction_matrix_overlap_bottom_k": 0.06142405793070793,
          "effective_rank": -0.003067178186029196,
          "effective_rank_mergeability_score": 0.004275206942111254,
          "stable_rank": -0.0061149136163294315,
          "spectral_gap": 0.002137152710929513,
          "singular_value_ratio": -0.0020428416319191456,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.010221735574305058,
          "task_vector_l2_distance": -0.0545949786901474,
          "task_vector_dot_product": -0.015369292348623276,
          "weight_space_angle": 0.013394743204116821,
          "task_vector_magnitude_ratio": -0.010981089435517788,
          "singular_value_overlap": -0.04221964627504349,
          "subspace_overlap": 0.025631308555603027,
          "right_subspace_overlap": 0.014165224507451057,
          "activation_l2_distance": -0.0135352723300457,
          "activation_cosine_similarity": 0.010230723768472672,
          "activation_magnitude_ratio": -0.010379559360444546,
          "activation_dot_product": -0.005848342552781105,
          "encoder_gradient_cosine_similarity": 0.007263366598635912,
          "encoder_gradient_l2_distance": -0.06661257147789001,
          "encoder_gradient_dot_product": 0.0073528168722987175,
          "input_gradient_cosine_similarity": -0.0017617419362068176,
          "input_gradient_l2_distance": -0.07639626413583755,
          "input_gradient_dot_product": -0.01703449711203575
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.6349248016447244,
        "val_r": 0.3373369226632869,
        "n_iterations": 296,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009119822643697262,
          "right_subspace_overlap_bottom_k": -0.005601134616881609,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.03843885660171509,
          "effective_rank": -0.0010250138584524393,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0016335448017343879,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0011276446748524904,
          "task_vector_l2_distance": -0.03999275341629982,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0013224183348938823,
          "task_vector_magnitude_ratio": -0.013806847855448723,
          "singular_value_overlap": -0.012539427727460861,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005867294035851955,
          "activation_l2_distance": 0.020368188619613647,
          "activation_cosine_similarity": 0.0181301049888134,
          "activation_magnitude_ratio": -0.00931365042924881,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.0011059476528316736,
          "encoder_gradient_l2_distance": -0.040849827229976654,
          "encoder_gradient_dot_product": 0.004928359761834145,
          "input_gradient_cosine_similarity": 0.00249181198887527,
          "input_gradient_l2_distance": -0.035366181284189224,
          "input_gradient_dot_product": -0.01724444329738617
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6191315343595165,
        "val_r": 0.4995954533471319,
        "n_iterations": 414,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003992356825619936,
          "right_subspace_overlap_bottom_k": -0.014021914452314377,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.053443361073732376,
          "effective_rank": -0.0018743412801995873,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.006262331269681454,
          "spectral_gap": -0.0025526678655296564,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.002307548886165023,
          "task_vector_l2_distance": -0.03894898667931557,
          "task_vector_dot_product": -0.0012897669803351164,
          "weight_space_angle": 0.005133720580488443,
          "task_vector_magnitude_ratio": -0.005542089696973562,
          "singular_value_overlap": -0.02117946743965149,
          "subspace_overlap": 0.004696819931268692,
          "right_subspace_overlap": 0.005104591138660908,
          "activation_l2_distance": 0.011546609923243523,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.005755561403930187,
          "activation_dot_product": 0.02114071696996689,
          "encoder_gradient_cosine_similarity": 0.004699856974184513,
          "encoder_gradient_l2_distance": -0.030420931056141853,
          "encoder_gradient_dot_product": 0.0025832222308963537,
          "input_gradient_cosine_similarity": 0.005184592213481665,
          "input_gradient_l2_distance": -0.032604608684778214,
          "input_gradient_dot_product": -0.012654099613428116
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6307269821214702,
        "val_r": 0.3936374657579433,
        "n_iterations": 232,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01318141259253025,
          "right_subspace_overlap_bottom_k": -0.005714092403650284,
          "interaction_matrix_overlap_top_k": -0.03360503166913986,
          "interaction_matrix_overlap_bottom_k": 0.044671572744846344,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.006030018907040358,
          "layerwise_effective_rank_mergeability_score": 0.003290654392912984,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02739427238702774,
          "task_vector_dot_product": 0.006722790654748678,
          "weight_space_angle": -0.00101682567037642,
          "task_vector_magnitude_ratio": -0.0019110373686999083,
          "singular_value_overlap": -0.009355245158076286,
          "subspace_overlap": 0.004788586404174566,
          "right_subspace_overlap": 0.010328021831810474,
          "activation_l2_distance": 0.00871803518384695,
          "activation_cosine_similarity": 0.0030371907632797956,
          "activation_magnitude_ratio": -0.0017179199494421482,
          "activation_dot_product": 0.012723029591143131,
          "encoder_gradient_cosine_similarity": 0.001237828517332673,
          "encoder_gradient_l2_distance": -0.0191821102052927,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.005117275286465883,
          "input_gradient_l2_distance": -0.032712869346141815,
          "input_gradient_dot_product": -0.00690149562433362
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7813040628345558,
        "val_r": 0.6834877156845268,
        "n_iterations": 295,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.05009404197335243,
          "right_subspace_overlap_bottom_k": -0.0739716961979866,
          "interaction_matrix_overlap_top_k": 0.03484414890408516,
          "interaction_matrix_overlap_bottom_k": -0.012612705118954182,
          "effective_rank": -0.009837080724537373,
          "effective_rank_mergeability_score": 0.008900491520762444,
          "stable_rank": -0.01066605094820261,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.012597007676959038,
          "layerwise_effective_rank_mergeability_score": 0.01473213266581297,
          "task_vector_cosine_similarity": -0.013892977498471737,
          "task_vector_l2_distance": -0.008146004751324654,
          "task_vector_dot_product": 0.01461591012775898,
          "weight_space_angle": 0.015441731549799442,
          "task_vector_magnitude_ratio": 0.0010814907727763057,
          "singular_value_overlap": -0.003473130986094475,
          "subspace_overlap": 0.01165000256150961,
          "right_subspace_overlap": 0.052488282322883606,
          "activation_l2_distance": -0.007778314873576164,
          "activation_cosine_similarity": 0.03411860391497612,
          "activation_magnitude_ratio": -0.024559319019317627,
          "activation_dot_product": 0.11408679187297821,
          "encoder_gradient_cosine_similarity": 0.025608891621232033,
          "encoder_gradient_l2_distance": -0.17950789630413055,
          "encoder_gradient_dot_product": 0.0157770998775959,
          "input_gradient_cosine_similarity": 0.0011674156412482262,
          "input_gradient_l2_distance": -0.17898070812225342,
          "input_gradient_dot_product": -0.09242300689220428
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6779887244429215,
        "val_r": 0.4266374900512776,
        "n_iterations": 419,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.017392661422491074,
          "right_subspace_overlap_bottom_k": 0.004129296168684959,
          "interaction_matrix_overlap_top_k": -0.006307822186499834,
          "interaction_matrix_overlap_bottom_k": 0.030155297368764877,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0016423675697296858,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010089143179357052,
          "task_vector_l2_distance": -0.03218135982751846,
          "task_vector_dot_product": 0.005285570863634348,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.008535710163414478,
          "singular_value_overlap": -0.013027417473495007,
          "subspace_overlap": 0.01344518456608057,
          "right_subspace_overlap": -0.012202730402350426,
          "activation_l2_distance": 0.009530100971460342,
          "activation_cosine_similarity": -0.002874555066227913,
          "activation_magnitude_ratio": 0.0013486386742442846,
          "activation_dot_product": 0.02463071048259735,
          "encoder_gradient_cosine_similarity": -0.0013658103998750448,
          "encoder_gradient_l2_distance": -0.020748136565089226,
          "encoder_gradient_dot_product": 0.0015690349973738194,
          "input_gradient_cosine_similarity": 0.005599379539489746,
          "input_gradient_l2_distance": -0.02679615095257759,
          "input_gradient_dot_product": -0.0033001680858433247
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_r": 0.438980796821664,
      "train_p": 6.724466343789123e-152,
      "val_r": 0.4159104598373235,
      "val_p": 2.0844921215022924e-16
    },
    "per_fold_stats": {
      "train_r_mean": 0.7968741573787207,
      "train_r_std": 0.036367077032669594,
      "val_r_mean": 0.6629868873977324,
      "val_r_std": 0.16993783895203574,
      "n_nonzero_mean": 22.8,
      "n_nonzero_std": 3.2341923257592455
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.030056670308113098,
      "right_subspace_overlap_bottom_k": -0.1013614758849144,
      "interaction_matrix_overlap_top_k": -0.005001015029847622,
      "interaction_matrix_overlap_bottom_k": 0.050837256014347076,
      "effective_rank": 0.003884870558977127,
      "effective_rank_mergeability_score": -0.0034219257067888975,
      "stable_rank": -0.0016614932101219893,
      "spectral_gap": -0.0003077681176364422,
      "singular_value_ratio": 0.00042055780068039894,
      "layerwise_effective_rank": -0.006883519701659679,
      "layerwise_effective_rank_mergeability_score": 0.007575678173452616,
      "task_vector_cosine_similarity": -0.0015233650337904692,
      "task_vector_l2_distance": -0.0013908336404711008,
      "task_vector_dot_product": -0.0013836368452757597,
      "weight_space_angle": 0.0007174712372943759,
      "task_vector_magnitude_ratio": -9.522870823275298e-05,
      "singular_value_overlap": 0.014255454763770103,
      "subspace_overlap": -0.005170200485736132,
      "right_subspace_overlap": 0.028200801461935043,
      "activation_l2_distance": -0.003984223119914532,
      "activation_cosine_similarity": 0.036967821419239044,
      "activation_magnitude_ratio": -0.0069925785064697266,
      "activation_dot_product": 0.009557710029184818,
      "encoder_gradient_cosine_similarity": 0.008791299536824226,
      "encoder_gradient_l2_distance": -0.06361252814531326,
      "encoder_gradient_dot_product": 0.0014922574628144503,
      "input_gradient_cosine_similarity": 0.0027093091048300266,
      "input_gradient_l2_distance": -0.041553299874067307,
      "input_gradient_dot_product": -0.009057190269231796
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.01743181422352791,
      "right_subspace_overlap_bottom_k": 0.02706310711801052,
      "interaction_matrix_overlap_top_k": 0.01399348396807909,
      "interaction_matrix_overlap_bottom_k": 0.036805566400289536,
      "effective_rank": 0.004970437381416559,
      "effective_rank_mergeability_score": 0.0046432469971477985,
      "stable_rank": 0.0033464787993580103,
      "spectral_gap": 0.002550069708377123,
      "singular_value_ratio": 0.0025158466305583715,
      "layerwise_effective_rank": 0.005976445507258177,
      "layerwise_effective_rank_mergeability_score": 0.0059612467885017395,
      "task_vector_cosine_similarity": 0.011031746864318848,
      "task_vector_l2_distance": 0.01269769947975874,
      "task_vector_dot_product": 0.006659740582108498,
      "weight_space_angle": 0.011874698102474213,
      "task_vector_magnitude_ratio": 0.0024170682299882174,
      "singular_value_overlap": 0.01306287944316864,
      "subspace_overlap": 0.01193271391093731,
      "right_subspace_overlap": 0.01852329634130001,
      "activation_l2_distance": 0.011264074593782425,
      "activation_cosine_similarity": 0.020354721695184708,
      "activation_magnitude_ratio": 0.012040982022881508,
      "activation_dot_product": 0.03572951257228851,
      "encoder_gradient_cosine_similarity": 0.013342869468033314,
      "encoder_gradient_l2_distance": 0.0410960391163826,
      "encoder_gradient_dot_product": 0.0029736030846834183,
      "input_gradient_cosine_similarity": 0.002769788494333625,
      "input_gradient_l2_distance": 0.03963271155953407,
      "input_gradient_dot_product": 0.013722820207476616
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 1.0,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.8,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 0.7,
      "effective_rank_mergeability_score": 0.7,
      "stable_rank": 0.6,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.4,
      "layerwise_effective_rank": 0.8,
      "layerwise_effective_rank_mergeability_score": 0.75,
      "task_vector_cosine_similarity": 0.75,
      "task_vector_l2_distance": 0.95,
      "task_vector_dot_product": 0.7,
      "weight_space_angle": 0.8,
      "task_vector_magnitude_ratio": 0.55,
      "singular_value_overlap": 0.85,
      "subspace_overlap": 0.8,
      "right_subspace_overlap": 1.0,
      "activation_l2_distance": 0.75,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.65,
      "activation_dot_product": 0.95,
      "encoder_gradient_cosine_similarity": 0.85,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.55,
      "input_gradient_cosine_similarity": 0.7,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.9
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7674318569194027,
        "val_r": 0.4484381159593573,
        "n_iterations": 322,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01963035576045513,
          "right_subspace_overlap_bottom_k": -0.11471404880285263,
          "interaction_matrix_overlap_top_k": -0.031062589958310127,
          "interaction_matrix_overlap_bottom_k": 0.1044297143816948,
          "effective_rank": 0.0057217334397137165,
          "effective_rank_mergeability_score": -0.005751829594373703,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.00455058179795742,
          "task_vector_l2_distance": 0.003051408799365163,
          "task_vector_dot_product": -0.0014805591199547052,
          "weight_space_angle": -0.003721419954672456,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005833246745169163,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.024433594197034836,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.02772456780076027,
          "activation_magnitude_ratio": -0.0027715791948139668,
          "activation_dot_product": -0.005095755215734243,
          "encoder_gradient_cosine_similarity": 0.003424876369535923,
          "encoder_gradient_l2_distance": -0.02468065731227398,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.006127507425844669,
          "input_gradient_l2_distance": -0.022938765585422516,
          "input_gradient_dot_product": -0.00618253368884325
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.771941273532615,
        "val_r": 0.8078412005939141,
        "n_iterations": 231,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009869561530649662,
          "right_subspace_overlap_bottom_k": -0.11643677204847336,
          "interaction_matrix_overlap_top_k": -0.01102204155176878,
          "interaction_matrix_overlap_bottom_k": 0.0793951228260994,
          "effective_rank": 0.006519319489598274,
          "effective_rank_mergeability_score": -0.001498304889537394,
          "stable_rank": -0.0029130750335752964,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.005274685565382242,
          "layerwise_effective_rank_mergeability_score": 0.0147336320951581,
          "task_vector_cosine_similarity": -0.01251072809100151,
          "task_vector_l2_distance": -0.005954214371740818,
          "task_vector_dot_product": -0.004023891407996416,
          "weight_space_angle": 0.010560942813754082,
          "task_vector_magnitude_ratio": -0.0011142862495034933,
          "singular_value_overlap": 0.01289702020585537,
          "subspace_overlap": 0.004557320848107338,
          "right_subspace_overlap": 0.03905551880598068,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.03533171862363815,
          "activation_magnitude_ratio": -0.0058800228871405125,
          "activation_dot_product": 0.006872063968330622,
          "encoder_gradient_cosine_similarity": 0.008403354324400425,
          "encoder_gradient_l2_distance": -0.06926456093788147,
          "encoder_gradient_dot_product": 0.007246136665344238,
          "input_gradient_cosine_similarity": 0.0016016119625419378,
          "input_gradient_l2_distance": -0.044693540781736374,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7713546895340353,
        "val_r": 0.781232332630473,
        "n_iterations": 298,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.03669136017560959,
          "right_subspace_overlap_bottom_k": -0.10945488512516022,
          "interaction_matrix_overlap_top_k": 0.018611561506986618,
          "interaction_matrix_overlap_bottom_k": 0.018971987068653107,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.004006428178399801,
          "spectral_gap": -0.0025916588492691517,
          "singular_value_ratio": 0.001997384475544095,
          "layerwise_effective_rank": -0.022436315193772316,
          "layerwise_effective_rank_mergeability_score": 0.011690162122249603,
          "task_vector_cosine_similarity": -0.013292193412780762,
          "task_vector_l2_distance": -0.021290719509124756,
          "task_vector_dot_product": -0.00883319042623043,
          "weight_space_angle": 0.012111136689782143,
          "task_vector_magnitude_ratio": 0.002418435411527753,
          "singular_value_overlap": 0.0340283066034317,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.06334427744150162,
          "activation_l2_distance": -0.015524733811616898,
          "activation_cosine_similarity": 0.05451330915093422,
          "activation_magnitude_ratio": -0.010952770709991455,
          "activation_dot_product": 0.0376710444688797,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.14645056426525116,
          "encoder_gradient_dot_product": 0.002583912806585431,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.11314693838357925,
          "input_gradient_dot_product": 0.0030524726025760174
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8197728350725311,
        "val_r": 0.8108741777717086,
        "n_iterations": 501,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005518726073205471,
          "right_subspace_overlap_bottom_k": -0.10027695447206497,
          "interaction_matrix_overlap_top_k": -0.016652105376124382,
          "interaction_matrix_overlap_bottom_k": 0.08631615340709686,
          "effective_rank": 0.010555700398981571,
          "effective_rank_mergeability_score": -0.011319081299006939,
          "stable_rank": -0.0014907543081790209,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.00817175954580307,
          "layerwise_effective_rank_mergeability_score": 0.013272492215037346,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.005722522735595703,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0019158257637172937,
          "subspace_overlap": -0.0011413625907152891,
          "right_subspace_overlap": 0.025112444534897804,
          "activation_l2_distance": 0.0014269538223743439,
          "activation_cosine_similarity": 0.01915149949491024,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.003730164375156164,
          "encoder_gradient_cosine_similarity": 0.0018215118907392025,
          "encoder_gradient_l2_distance": -0.017880184575915337,
          "encoder_gradient_dot_product": 0.002532169222831726,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.012151137925684452,
          "input_gradient_dot_product": -0.0023086632136255503
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7995133395557238,
        "val_r": 0.7650896527722779,
        "n_iterations": 308,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.03599615395069122,
          "right_subspace_overlap_bottom_k": -0.11231553554534912,
          "interaction_matrix_overlap_top_k": -0.015456902794539928,
          "interaction_matrix_overlap_bottom_k": 0.08413047343492508,
          "effective_rank": 0.01286693848669529,
          "effective_rank_mergeability_score": -0.010422374121844769,
          "stable_rank": -0.005663004238158464,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.001194292213767767,
          "layerwise_effective_rank": -0.010417742654681206,
          "layerwise_effective_rank_mergeability_score": 0.007032470311969519,
          "task_vector_cosine_similarity": -0.005699130240827799,
          "task_vector_l2_distance": 0.0018833719659596682,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.004686628933995962,
          "task_vector_magnitude_ratio": 0.0011619884753599763,
          "singular_value_overlap": 0.004894136916846037,
          "subspace_overlap": -0.0018163046333938837,
          "right_subspace_overlap": 0.018592096865177155,
          "activation_l2_distance": -0.0015923463506624103,
          "activation_cosine_similarity": 0.025467567145824432,
          "activation_magnitude_ratio": -0.003783827181905508,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0066008432768285275,
          "encoder_gradient_l2_distance": -0.04385312274098396,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0038647635374218225,
          "input_gradient_l2_distance": -0.023015355691313744,
          "input_gradient_dot_product": -0.004183616954833269
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7195312972699152,
        "val_r": 0.6892903517074052,
        "n_iterations": 375,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04730851948261261,
          "right_subspace_overlap_bottom_k": -0.15644074976444244,
          "interaction_matrix_overlap_top_k": 0.030360912904143333,
          "interaction_matrix_overlap_bottom_k": -0.010450848378241062,
          "effective_rank": -0.006759911775588989,
          "effective_rank_mergeability_score": 0.006713410839438438,
          "stable_rank": -0.01176681462675333,
          "spectral_gap": 0.009280247613787651,
          "singular_value_ratio": -0.008836875669658184,
          "layerwise_effective_rank": -0.019158905372023582,
          "layerwise_effective_rank_mergeability_score": 0.020002776756882668,
          "task_vector_cosine_similarity": 0.03577582910656929,
          "task_vector_l2_distance": -0.027345366775989532,
          "task_vector_dot_product": 0.021247517317533493,
          "weight_space_angle": -0.04185526818037033,
          "task_vector_magnitude_ratio": -0.008772184140980244,
          "singular_value_overlap": 0.0479060597717762,
          "subspace_overlap": 0.022295471280813217,
          "right_subspace_overlap": 0.04919459670782089,
          "activation_l2_distance": -0.03318082168698311,
          "activation_cosine_similarity": 0.07902733981609344,
          "activation_magnitude_ratio": -0.05613492429256439,
          "activation_dot_product": 0.13716913759708405,
          "encoder_gradient_cosine_similarity": 0.06283914297819138,
          "encoder_gradient_l2_distance": -0.12820081412792206,
          "encoder_gradient_dot_product": 0.0020087200682610273,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.15519022941589355,
          "input_gradient_dot_product": -0.059458229690790176
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7291207463546748,
        "val_r": 0.6171089820978894,
        "n_iterations": 291,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.032229792326688766,
          "right_subspace_overlap_bottom_k": -0.08984437584877014,
          "interaction_matrix_overlap_top_k": 0.004168340470641851,
          "interaction_matrix_overlap_bottom_k": 0.03143477439880371,
          "effective_rank": 0.004820946138352156,
          "effective_rank_mergeability_score": -0.0044808052480220795,
          "stable_rank": 0.0013353475369513035,
          "spectral_gap": -0.002590474672615528,
          "singular_value_ratio": 0.003441112581640482,
          "layerwise_effective_rank": -0.001685063005425036,
          "layerwise_effective_rank_mergeability_score": 0.0016441521001979709,
          "task_vector_cosine_similarity": 0.005538849160075188,
          "task_vector_l2_distance": -0.009463952854275703,
          "task_vector_dot_product": 0.0033239307813346386,
          "weight_space_angle": -0.006874145939946175,
          "task_vector_magnitude_ratio": 0.0025017333682626486,
          "singular_value_overlap": 0.01872309297323227,
          "subspace_overlap": 0.008907695300877094,
          "right_subspace_overlap": 0.012579855509102345,
          "activation_l2_distance": 0.008608666248619556,
          "activation_cosine_similarity": 0.04269815608859062,
          "activation_magnitude_ratio": -0.005912551656365395,
          "activation_dot_product": 0.03131917864084244,
          "encoder_gradient_cosine_similarity": 0.013735847547650337,
          "encoder_gradient_l2_distance": -0.0728398859500885,
          "encoder_gradient_dot_product": 0.011044754646718502,
          "input_gradient_cosine_similarity": 0.0075733899138867855,
          "input_gradient_l2_distance": -0.06928267329931259,
          "input_gradient_dot_product": -0.03125787153840065
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.780574654898055,
        "val_r": 0.37075940241764305,
        "n_iterations": 370,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.06272883713245392,
          "right_subspace_overlap_bottom_k": -0.12480125576257706,
          "interaction_matrix_overlap_top_k": 0.004737778566777706,
          "interaction_matrix_overlap_bottom_k": 0.04050017148256302,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.002074427902698517,
          "spectral_gap": -0.004173255525529385,
          "singular_value_ratio": 0.004181772004812956,
          "layerwise_effective_rank": -0.0073715029284358025,
          "layerwise_effective_rank_mergeability_score": 0.0060626547783613205,
          "task_vector_cosine_similarity": -0.019421666860580444,
          "task_vector_l2_distance": -0.001323436270467937,
          "task_vector_dot_product": -0.008421351201832294,
          "weight_space_angle": 0.0210723914206028,
          "task_vector_magnitude_ratio": 0.0020881269592791796,
          "singular_value_overlap": 0.011056353338062763,
          "subspace_overlap": -0.009664081037044525,
          "right_subspace_overlap": 0.05463835224509239,
          "activation_l2_distance": -0.028638124465942383,
          "activation_cosine_similarity": 0.06260645389556885,
          "activation_magnitude_ratio": -0.015163451433181763,
          "activation_dot_product": -0.012982867658138275,
          "encoder_gradient_cosine_similarity": 0.01679292879998684,
          "encoder_gradient_l2_distance": -0.11099714040756226,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.007534513249993324,
          "input_gradient_l2_distance": -0.04657342657446861,
          "input_gradient_dot_product": 0.0011879266239702702
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.8703726300704653,
        "val_r": 0.35261318811597475,
        "n_iterations": 826,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01377064548432827,
          "right_subspace_overlap_bottom_k": -0.10628422349691391,
          "interaction_matrix_overlap_top_k": -0.028126824647188187,
          "interaction_matrix_overlap_bottom_k": 0.09949558228254318,
          "effective_rank": 0.003782300977036357,
          "effective_rank_mergeability_score": -0.004409360699355602,
          "stable_rank": 0.0,
          "spectral_gap": -0.001052685547620058,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002173621905967593,
          "layerwise_effective_rank_mergeability_score": 0.014270767569541931,
          "task_vector_cosine_similarity": -0.0011207431089133024,
          "task_vector_l2_distance": 0.00528627447783947,
          "task_vector_dot_product": 0.004329116083681583,
          "weight_space_angle": -0.0027923118323087692,
          "task_vector_magnitude_ratio": 0.0022181274835020304,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.014022380113601685,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.019153928384184837,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.012499413453042507,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008760460652410984,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0017531519988551736,
          "input_gradient_l2_distance": -0.013094248250126839,
          "input_gradient_dot_product": -0.003561051795259118
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7990119390652979,
        "val_r": 0.5904187223872387,
        "n_iterations": 287,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.05268121138215065,
          "right_subspace_overlap_bottom_k": -0.1320262998342514,
          "interaction_matrix_overlap_top_k": -0.008647006936371326,
          "interaction_matrix_overlap_bottom_k": 0.07437389343976974,
          "effective_rank": 0.0030593411065638065,
          "effective_rank_mergeability_score": -0.0034882300533354282,
          "stable_rank": 0.002717456081882119,
          "spectral_gap": -0.0017266711220145226,
          "singular_value_ratio": 0.0018279465148225427,
          "layerwise_effective_rank": -0.006283259484916925,
          "layerwise_effective_rank_mergeability_score": 0.012388870120048523,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.008313314989209175,
          "task_vector_dot_product": -0.0043460107408463955,
          "weight_space_angle": 0.0017427755519747734,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.007463868707418442,
          "subspace_overlap": -0.007393007632344961,
          "right_subspace_overlap": 0.02328440733253956,
          "activation_l2_distance": -0.009903808124363422,
          "activation_cosine_similarity": -0.002378950361162424,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.019171910360455513,
          "encoder_gradient_cosine_similarity": 0.012958293780684471,
          "encoder_gradient_l2_distance": -0.04805904999375343,
          "encoder_gradient_dot_product": 0.0027804572600871325,
          "input_gradient_cosine_similarity": 0.005468939896672964,
          "input_gradient_l2_distance": -0.02858654595911503,
          "input_gradient_dot_product": -0.009589515626430511
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8104690424650616,
        "val_r": 0.2362852093473216,
        "n_iterations": 233,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.049209970980882645,
          "right_subspace_overlap_bottom_k": -0.06643228232860565,
          "interaction_matrix_overlap_top_k": 0.002340862527489662,
          "interaction_matrix_overlap_bottom_k": 0.008703320287168026,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0021660870406776667,
          "task_vector_l2_distance": 0.012770534493029118,
          "task_vector_dot_product": -0.0019515047315508127,
          "weight_space_angle": 0.0021229260601103306,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.025562254711985588,
          "subspace_overlap": -0.029598059132695198,
          "right_subspace_overlap": 0.015978429466485977,
          "activation_l2_distance": -0.00894690677523613,
          "activation_cosine_similarity": 0.05295422673225403,
          "activation_magnitude_ratio": -0.004973527044057846,
          "activation_dot_product": -0.00195766007527709,
          "encoder_gradient_cosine_similarity": 0.0015732678584754467,
          "encoder_gradient_l2_distance": -0.06257523596286774,
          "encoder_gradient_dot_product": 0.002060783328488469,
          "input_gradient_cosine_similarity": 0.0032012229785323143,
          "input_gradient_l2_distance": -0.008488493040204048,
          "input_gradient_dot_product": -0.0017669845838099718
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.8032700045075876,
        "val_r": 0.7476920294000085,
        "n_iterations": 354,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01964999921619892,
          "right_subspace_overlap_bottom_k": -0.07547663152217865,
          "interaction_matrix_overlap_top_k": -0.0030373618938028812,
          "interaction_matrix_overlap_bottom_k": 0.029347887262701988,
          "effective_rank": 0.0012174341827630997,
          "effective_rank_mergeability_score": -0.00195487798191607,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.015559349209070206,
          "task_vector_l2_distance": 0.007511953357607126,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.012718630023300648,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.009271588176488876,
          "subspace_overlap": -0.0024871351197361946,
          "right_subspace_overlap": 0.04209384694695473,
          "activation_l2_distance": 0.015043631196022034,
          "activation_cosine_similarity": 0.05061688274145126,
          "activation_magnitude_ratio": -0.004303815774619579,
          "activation_dot_product": -0.011475986801087856,
          "encoder_gradient_cosine_similarity": 0.006162513047456741,
          "encoder_gradient_l2_distance": -0.043800558894872665,
          "encoder_gradient_dot_product": -0.0011187184136360884,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.022208206355571747,
          "input_gradient_dot_product": -0.004782133270055056
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7773810872640365,
        "val_r": 0.7818297702820192,
        "n_iterations": 389,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02882099710404873,
          "right_subspace_overlap_bottom_k": -0.08743973821401596,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.021245257928967476,
          "effective_rank": 0.0010515697067603469,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0015479987487196922,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.012487109750509262,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0025010660756379366,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.016053665429353714,
          "subspace_overlap": -0.015258722938597202,
          "right_subspace_overlap": 0.03884014114737511,
          "activation_l2_distance": 0.0026693129912018776,
          "activation_cosine_similarity": 0.060859255492687225,
          "activation_magnitude_ratio": -0.005834565497934818,
          "activation_dot_product": -0.015425305813550949,
          "encoder_gradient_cosine_similarity": 0.010096612386405468,
          "encoder_gradient_l2_distance": -0.0810745358467102,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003306034253910184,
          "input_gradient_l2_distance": -0.025153907015919685,
          "input_gradient_dot_product": -0.014113114215433598
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8294592282881545,
        "val_r": 0.8358442794544827,
        "n_iterations": 300,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.03394048288464546,
          "right_subspace_overlap_bottom_k": -0.09644437581300735,
          "interaction_matrix_overlap_top_k": -0.017266426235437393,
          "interaction_matrix_overlap_bottom_k": 0.0809098482131958,
          "effective_rank": 0.004783712327480316,
          "effective_rank_mergeability_score": -0.00525104021653533,
          "stable_rank": 0.0028143206145614386,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.006398811936378479,
          "layerwise_effective_rank_mergeability_score": 0.005578687414526939,
          "task_vector_cosine_similarity": 0.0046905456110835075,
          "task_vector_l2_distance": 0.005637043155729771,
          "task_vector_dot_product": 0.0014058604137971997,
          "weight_space_angle": -0.0031706031877547503,
          "task_vector_magnitude_ratio": -0.0019431489054113626,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.02487192489206791,
          "right_subspace_overlap": 0.00584295392036438,
          "activation_l2_distance": 0.005453609861433506,
          "activation_cosine_similarity": 0.02147425338625908,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.005963167175650597,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.015826178714632988,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.004233780317008495,
          "input_gradient_l2_distance": -0.012209777720272541,
          "input_gradient_dot_product": -0.0048857699148356915
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8258821655521162,
        "val_r": 0.8009921059177965,
        "n_iterations": 592,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008629260584712029,
          "right_subspace_overlap_bottom_k": -0.10558179020881653,
          "interaction_matrix_overlap_top_k": -0.014241974800825119,
          "interaction_matrix_overlap_bottom_k": 0.08683852106332779,
          "effective_rank": 0.010775544680655003,
          "effective_rank_mergeability_score": -0.013458224013447762,
          "stable_rank": -0.006484506651759148,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.009074307046830654,
          "layerwise_effective_rank_mergeability_score": 0.009211142547428608,
          "task_vector_cosine_similarity": 0.0016881102928891778,
          "task_vector_l2_distance": 0.008684411644935608,
          "task_vector_dot_product": -0.0026188238989561796,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0013570302398875356,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.014209505170583725,
          "activation_l2_distance": -0.0051995315589010715,
          "activation_cosine_similarity": 0.016419902443885803,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.010872146114706993,
          "encoder_gradient_cosine_similarity": 0.0016879482427611947,
          "encoder_gradient_l2_distance": -0.01208570972084999,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.011205845512449741,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.8196899248039113,
        "val_r": 0.7136440569306393,
        "n_iterations": 263,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04481792449951172,
          "right_subspace_overlap_bottom_k": -0.07275110483169556,
          "interaction_matrix_overlap_top_k": -0.004536018706858158,
          "interaction_matrix_overlap_bottom_k": 0.007823394611477852,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0011317281750962138,
          "task_vector_l2_distance": 0.0015360212419182062,
          "task_vector_dot_product": -0.011079948395490646,
          "weight_space_angle": -0.001775022828951478,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.026019684970378876,
          "subspace_overlap": -0.02797703444957733,
          "right_subspace_overlap": 0.047291118651628494,
          "activation_l2_distance": 0.0036026365123689175,
          "activation_cosine_similarity": 0.048700131475925446,
          "activation_magnitude_ratio": -0.009408175013959408,
          "activation_dot_product": -0.01718882843852043,
          "encoder_gradient_cosine_similarity": 0.004349647089838982,
          "encoder_gradient_l2_distance": -0.07581435143947601,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.019071808084845543,
          "input_gradient_dot_product": -0.011222224682569504
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.8011389978021523,
        "val_r": 0.7734663939773697,
        "n_iterations": 217,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.04676549509167671,
          "right_subspace_overlap_bottom_k": -0.11911236494779587,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.07466328889131546,
          "effective_rank": 0.006242389790713787,
          "effective_rank_mergeability_score": -0.0033150098752230406,
          "stable_rank": -0.0017933847848325968,
          "spectral_gap": -0.0033008644822984934,
          "singular_value_ratio": 0.003596107941120863,
          "layerwise_effective_rank": -0.010181856341660023,
          "layerwise_effective_rank_mergeability_score": 0.012070016004145145,
          "task_vector_cosine_similarity": -0.011100090108811855,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0094254519790411,
          "weight_space_angle": 0.00950655061751604,
          "task_vector_magnitude_ratio": 0.002691621659323573,
          "singular_value_overlap": 0.009914559312164783,
          "subspace_overlap": -0.003977013286203146,
          "right_subspace_overlap": 0.019458139315247536,
          "activation_l2_distance": -0.002181436400860548,
          "activation_cosine_similarity": 0.02948758751153946,
          "activation_magnitude_ratio": -0.009683242999017239,
          "activation_dot_product": 0.008686789311468601,
          "encoder_gradient_cosine_similarity": 0.01012042723596096,
          "encoder_gradient_l2_distance": -0.0599873922765255,
          "encoder_gradient_dot_product": -0.0011609925422817469,
          "input_gradient_cosine_similarity": 0.0042988089844584465,
          "input_gradient_l2_distance": -0.02917511761188507,
          "input_gradient_dot_product": -0.009138106368482113
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.768797508020277,
        "val_r": 0.7009664642315763,
        "n_iterations": 444,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.03275538608431816,
          "right_subspace_overlap_bottom_k": -0.11306658387184143,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.01366149540990591,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0010094153694808483,
          "layerwise_effective_rank": -0.008724241517484188,
          "layerwise_effective_rank_mergeability_score": 0.008528485894203186,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.005761174019426107,
          "task_vector_dot_product": -0.005798427853733301,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.03565770760178566,
          "subspace_overlap": -0.005544393789023161,
          "right_subspace_overlap": 0.05365310609340668,
          "activation_l2_distance": -0.011321578174829483,
          "activation_cosine_similarity": 0.0597548671066761,
          "activation_magnitude_ratio": -0.005049116909503937,
          "activation_dot_product": 0.02747291699051857,
          "encoder_gradient_cosine_similarity": 0.010599849745631218,
          "encoder_gradient_l2_distance": -0.13135136663913727,
          "encoder_gradient_dot_product": 0.0035267015919089317,
          "input_gradient_cosine_similarity": -0.0024720404762774706,
          "input_gradient_l2_distance": -0.10901626944541931,
          "input_gradient_dot_product": -0.015084308572113514
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8193951842384096,
        "val_r": 0.7180083532085991,
        "n_iterations": 336,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02551516331732273,
          "right_subspace_overlap_bottom_k": -0.10423911362886429,
          "interaction_matrix_overlap_top_k": -0.010190502740442753,
          "interaction_matrix_overlap_bottom_k": 0.08495497703552246,
          "effective_rank": 0.013060382567346096,
          "effective_rank_mergeability_score": -0.00843674037605524,
          "stable_rank": -0.0039045941084623337,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.011031667701900005,
          "layerwise_effective_rank_mergeability_score": 0.011708109639585018,
          "task_vector_cosine_similarity": -0.002972960937768221,
          "task_vector_l2_distance": 0.005684764124453068,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.002517280401661992,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0033251584973186255,
          "subspace_overlap": -0.008260194212198257,
          "right_subspace_overlap": 0.007750269956886768,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.018525488674640656,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.002540506422519684,
          "encoder_gradient_cosine_similarity": 0.002358047291636467,
          "encoder_gradient_l2_distance": -0.022565932944417,
          "encoder_gradient_dot_product": -0.0016587763093411922,
          "input_gradient_cosine_similarity": 0.002299696207046509,
          "input_gradient_l2_distance": -0.008824353106319904,
          "input_gradient_dot_product": -0.0030956841073930264
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8533747423599914,
        "val_r": 0.717342958750952,
        "n_iterations": 236,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.00539645180106163,
          "right_subspace_overlap_bottom_k": -0.02409028261899948,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0013660467229783535,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.007738652639091015,
          "layerwise_effective_rank_mergeability_score": 0.003319147974252701,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.03524653613567352,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0017979579279199243,
          "singular_value_overlap": 0.014586539939045906,
          "subspace_overlap": -0.0011752640129998326,
          "right_subspace_overlap": -0.005359017290174961,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.017268221825361252,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.060866761952638626,
          "encoder_gradient_cosine_similarity": 0.0023008910939097404,
          "encoder_gradient_l2_distance": -0.09618279337882996,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0053947982378304005,
          "input_gradient_l2_distance": -0.057039353996515274,
          "input_gradient_dot_product": -0.0047543905675411224
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_r": 0.34935367148004187,
      "train_p": 3.905730748119283e-93,
      "val_r": -0.16513198689428094,
      "val_p": 0.001718150848546439
    },
    "per_fold_stats": {
      "train_r_mean": 0.5731441664875355,
      "train_r_std": 0.047458090824185416,
      "val_r_mean": 0.43786942998875755,
      "val_r_std": 0.17716790757147277,
      "n_nonzero_mean": 22.3,
      "n_nonzero_std": 3.5085609585697664
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0028467674273997545,
      "right_subspace_overlap_bottom_k": -0.007373227272182703,
      "interaction_matrix_overlap_top_k": -0.018788643181324005,
      "interaction_matrix_overlap_bottom_k": 0.07127653062343597,
      "effective_rank": -0.0015735769411548972,
      "effective_rank_mergeability_score": 0.0016040944028645754,
      "stable_rank": -0.001054840162396431,
      "spectral_gap": -0.0009712738683447242,
      "singular_value_ratio": 0.0011116729583591223,
      "layerwise_effective_rank": -0.00010908934928011149,
      "layerwise_effective_rank_mergeability_score": 0.0018412142526358366,
      "task_vector_cosine_similarity": -0.0009318022057414055,
      "task_vector_l2_distance": -0.03862891346216202,
      "task_vector_dot_product": 0.0031259481329470873,
      "weight_space_angle": 0.0008440656820312142,
      "task_vector_magnitude_ratio": -0.012088426388800144,
      "singular_value_overlap": -0.035289231687784195,
      "subspace_overlap": 0.012833970598876476,
      "right_subspace_overlap": 0.003698952030390501,
      "activation_l2_distance": -0.001064395997673273,
      "activation_cosine_similarity": -0.0008205717313103378,
      "activation_magnitude_ratio": -0.011298161000013351,
      "activation_dot_product": -0.003238723846152425,
      "encoder_gradient_cosine_similarity": -7.054345769574866e-05,
      "encoder_gradient_l2_distance": -0.026714008301496506,
      "encoder_gradient_dot_product": 0.00027558329747989774,
      "input_gradient_cosine_similarity": 0.0037261992692947388,
      "input_gradient_l2_distance": -0.04199270159006119,
      "input_gradient_dot_product": -0.00988083053380251
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.009971057996153831,
      "right_subspace_overlap_bottom_k": 0.01637353003025055,
      "interaction_matrix_overlap_top_k": 0.011992193758487701,
      "interaction_matrix_overlap_bottom_k": 0.01781393773853779,
      "effective_rank": 0.001756478799507022,
      "effective_rank_mergeability_score": 0.001851018751040101,
      "stable_rank": 0.0018390316981822252,
      "spectral_gap": 0.001787249930202961,
      "singular_value_ratio": 0.0017221757443621755,
      "layerwise_effective_rank": 0.0045245676301419735,
      "layerwise_effective_rank_mergeability_score": 0.007643452845513821,
      "task_vector_cosine_similarity": 0.0033119111321866512,
      "task_vector_l2_distance": 0.020257921889424324,
      "task_vector_dot_product": 0.007256132084876299,
      "weight_space_angle": 0.0027844842988997698,
      "task_vector_magnitude_ratio": 0.005144985392689705,
      "singular_value_overlap": 0.017193889245390892,
      "subspace_overlap": 0.010236210189759731,
      "right_subspace_overlap": 0.01542455144226551,
      "activation_l2_distance": 0.015610015951097012,
      "activation_cosine_similarity": 0.014288390055298805,
      "activation_magnitude_ratio": 0.007485215552151203,
      "activation_dot_product": 0.008264018222689629,
      "encoder_gradient_cosine_similarity": 0.0035880613140761852,
      "encoder_gradient_l2_distance": 0.030657194554805756,
      "encoder_gradient_dot_product": 0.0015485455514863133,
      "input_gradient_cosine_similarity": 0.003013133304193616,
      "input_gradient_l2_distance": 0.03136690333485603,
      "input_gradient_dot_product": 0.005449756048619747
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.55,
      "right_subspace_overlap_bottom_k": 0.85,
      "interaction_matrix_overlap_top_k": 1.0,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.65,
      "effective_rank_mergeability_score": 0.65,
      "stable_rank": 0.4,
      "spectral_gap": 0.6,
      "singular_value_ratio": 0.65,
      "layerwise_effective_rank": 0.45,
      "layerwise_effective_rank_mergeability_score": 0.45,
      "task_vector_cosine_similarity": 0.6,
      "task_vector_l2_distance": 1.0,
      "task_vector_dot_product": 0.9,
      "weight_space_angle": 0.45,
      "task_vector_magnitude_ratio": 1.0,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.95,
      "right_subspace_overlap": 0.55,
      "activation_l2_distance": 0.9,
      "activation_cosine_similarity": 0.7,
      "activation_magnitude_ratio": 0.95,
      "activation_dot_product": 0.85,
      "encoder_gradient_cosine_similarity": 0.8,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.55,
      "input_gradient_cosine_similarity": 0.85,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 1.0
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6255586729867049,
        "val_r": 0.6256389376397659,
        "n_iterations": 273,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0011197396088391542,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.029617790132761,
          "interaction_matrix_overlap_bottom_k": 0.08136450499296188,
          "effective_rank": -0.006125051062554121,
          "effective_rank_mergeability_score": 0.004592671524733305,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.013955133967101574,
          "layerwise_effective_rank_mergeability_score": -0.0033990393858402967,
          "task_vector_cosine_similarity": -0.0010508573614060879,
          "task_vector_l2_distance": -0.046745192259550095,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0041350931860506535,
          "task_vector_magnitude_ratio": -0.017776118591427803,
          "singular_value_overlap": -0.04778338223695755,
          "subspace_overlap": 0.031976912170648575,
          "right_subspace_overlap": -0.0015936257550492883,
          "activation_l2_distance": -0.0019406070932745934,
          "activation_cosine_similarity": 0.0027469205670058727,
          "activation_magnitude_ratio": -0.017085690051317215,
          "activation_dot_product": -0.011752725578844547,
          "encoder_gradient_cosine_similarity": -0.0018932900857180357,
          "encoder_gradient_l2_distance": -0.026199432089924812,
          "encoder_gradient_dot_product": -0.0010890900157392025,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03522311896085739,
          "input_gradient_dot_product": -0.013803277164697647
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5612883016896778,
        "val_r": 0.5273116402627289,
        "n_iterations": 268,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.025829274207353592,
          "interaction_matrix_overlap_top_k": -0.0193647388368845,
          "interaction_matrix_overlap_bottom_k": 0.058085646480321884,
          "effective_rank": -0.0028045184444636106,
          "effective_rank_mergeability_score": 0.0024331100285053253,
          "stable_rank": 0.0,
          "spectral_gap": -0.0026932337787002325,
          "singular_value_ratio": 0.002807005075737834,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.019888781011104584,
          "task_vector_dot_product": 0.006304477341473103,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.01254183892160654,
          "singular_value_overlap": -0.016040891408920288,
          "subspace_overlap": 0.007496842183172703,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0021718237549066544,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.00371296308003366,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.0014601859729737043,
          "encoder_gradient_l2_distance": -0.013875262811779976,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002950392896309495,
          "input_gradient_l2_distance": -0.015399781055748463,
          "input_gradient_dot_product": -0.0022225661668926477
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5619096551714909,
        "val_r": 0.5030198907963286,
        "n_iterations": 488,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005420292727649212,
          "right_subspace_overlap_bottom_k": 0.011228227987885475,
          "interaction_matrix_overlap_top_k": -0.016886094585061073,
          "interaction_matrix_overlap_bottom_k": 0.07604966312646866,
          "effective_rank": -0.0013556280173361301,
          "effective_rank_mergeability_score": 0.0015844120644032955,
          "stable_rank": -0.0019754325039684772,
          "spectral_gap": 0.0028395378030836582,
          "singular_value_ratio": -0.002676052041351795,
          "layerwise_effective_rank": -0.0014810952125117183,
          "layerwise_effective_rank_mergeability_score": 0.0016190186142921448,
          "task_vector_cosine_similarity": 0.0018673641607165337,
          "task_vector_l2_distance": -0.052410684525966644,
          "task_vector_dot_product": -0.002026286209002137,
          "weight_space_angle": -0.003761597676202655,
          "task_vector_magnitude_ratio": -0.01584424264729023,
          "singular_value_overlap": -0.05500537529587746,
          "subspace_overlap": 0.016758238896727562,
          "right_subspace_overlap": 0.0038490211591124535,
          "activation_l2_distance": -0.008232520893216133,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.022359605878591537,
          "activation_dot_product": -0.021655157208442688,
          "encoder_gradient_cosine_similarity": -0.005110464990139008,
          "encoder_gradient_l2_distance": -0.03379429876804352,
          "encoder_gradient_dot_product": 0.0024900278076529503,
          "input_gradient_cosine_similarity": 0.006360665895044804,
          "input_gradient_l2_distance": -0.05899108946323395,
          "input_gradient_dot_product": -0.0067664859816432
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5689916913981444,
        "val_r": 0.5001631978869142,
        "n_iterations": 271,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.016680926084518433,
          "interaction_matrix_overlap_top_k": -0.020077720284461975,
          "interaction_matrix_overlap_bottom_k": 0.07024780660867691,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0018916982226073742,
          "singular_value_ratio": 0.0018571591936051846,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02982645109295845,
          "task_vector_dot_product": 0.008462797850370407,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.013546925969421864,
          "singular_value_overlap": -0.028316587209701538,
          "subspace_overlap": 0.01239179540425539,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.005345283076167107,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.007961384952068329,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011832715943455696,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.006126976106315851,
          "input_gradient_l2_distance": -0.025978470221161842,
          "input_gradient_dot_product": -0.009050117805600166
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5694373890413572,
        "val_r": 0.5315823854504689,
        "n_iterations": 348,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005495178047567606,
          "right_subspace_overlap_bottom_k": -0.0041592977941036224,
          "interaction_matrix_overlap_top_k": -0.009363223798573017,
          "interaction_matrix_overlap_bottom_k": 0.0750681608915329,
          "effective_rank": 0.0012569944374263287,
          "effective_rank_mergeability_score": -0.001123833004385233,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.002137171570211649,
          "layerwise_effective_rank_mergeability_score": -0.002802950795739889,
          "task_vector_cosine_similarity": 0.00445648655295372,
          "task_vector_l2_distance": -0.039706408977508545,
          "task_vector_dot_product": -0.010614139959216118,
          "weight_space_angle": -0.002517667831853032,
          "task_vector_magnitude_ratio": -0.008012635633349419,
          "singular_value_overlap": -0.04127219319343567,
          "subspace_overlap": 0.003067324636504054,
          "right_subspace_overlap": 0.005926131270825863,
          "activation_l2_distance": -0.003046406665816903,
          "activation_cosine_similarity": -0.0015429217601194978,
          "activation_magnitude_ratio": -0.01480564009398222,
          "activation_dot_product": -0.01452111080288887,
          "encoder_gradient_cosine_similarity": 0.0021464484743773937,
          "encoder_gradient_l2_distance": -0.02119043469429016,
          "encoder_gradient_dot_product": 0.0021445397287607193,
          "input_gradient_cosine_similarity": 0.004573083017021418,
          "input_gradient_l2_distance": -0.04267091304063797,
          "input_gradient_dot_product": -0.007735861465334892
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.48019930432722635,
        "val_r": 0.6067683544856307,
        "n_iterations": 276,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025415755808353424,
          "right_subspace_overlap_bottom_k": -0.017836228013038635,
          "interaction_matrix_overlap_top_k": -0.03603383153676987,
          "interaction_matrix_overlap_bottom_k": 0.056785698980093,
          "effective_rank": -0.0015570134855806828,
          "effective_rank_mergeability_score": 0.0013564948458224535,
          "stable_rank": 0.001385294832289219,
          "spectral_gap": -0.003456415608525276,
          "singular_value_ratio": 0.003947386518120766,
          "layerwise_effective_rank": 0.00137956696562469,
          "layerwise_effective_rank_mergeability_score": -0.0023973151110112667,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.021011266857385635,
          "task_vector_dot_product": 0.01753825694322586,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.008276602253317833,
          "singular_value_overlap": -0.01601158268749714,
          "subspace_overlap": 0.015312003903090954,
          "right_subspace_overlap": 0.0034634023904800415,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003846700768917799,
          "activation_dot_product": -0.0014486403670161963,
          "encoder_gradient_cosine_similarity": 0.0011374785099178553,
          "encoder_gradient_l2_distance": -0.011527678929269314,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0019836067222058773,
          "input_gradient_l2_distance": -0.014651713892817497,
          "input_gradient_dot_product": -0.0061260368674993515
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.601847446737762,
        "val_r": 0.2458894398245468,
        "n_iterations": 378,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.024499457329511642,
          "interaction_matrix_overlap_top_k": -0.007916242815554142,
          "interaction_matrix_overlap_bottom_k": 0.0603896789252758,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.003974339459091425,
          "singular_value_ratio": 0.004247634671628475,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0016376024577766657,
          "task_vector_l2_distance": -0.016483504325151443,
          "task_vector_dot_product": -0.0019057451281696558,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.014725234359502792,
          "singular_value_overlap": -0.018958861008286476,
          "subspace_overlap": 0.0017908659065142274,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.006233659572899342,
          "activation_cosine_similarity": 0.00449030427262187,
          "activation_magnitude_ratio": 0.0014438487123697996,
          "activation_dot_product": -0.01319898758083582,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.017958123236894608,
          "encoder_gradient_dot_product": 0.0010157173965126276,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.021159715950489044,
          "input_gradient_dot_product": -0.00808529183268547
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5443382323522757,
        "val_r": 0.3906726557842953,
        "n_iterations": 560,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.01012424286454916,
          "interaction_matrix_overlap_top_k": -0.03552098944783211,
          "interaction_matrix_overlap_bottom_k": 0.07402512431144714,
          "effective_rank": -0.0015761838294565678,
          "effective_rank_mergeability_score": 0.001646128366701305,
          "stable_rank": 0.0,
          "spectral_gap": -0.0017016936326399446,
          "singular_value_ratio": 0.0019676517695188522,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.04136209189891815,
          "task_vector_dot_product": 0.004723283462226391,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.013990985229611397,
          "singular_value_overlap": -0.028902215883135796,
          "subspace_overlap": 0.024580955505371094,
          "right_subspace_overlap": 0.0012585371732711792,
          "activation_l2_distance": 0.009475401602685452,
          "activation_cosine_similarity": 0.002730149310082197,
          "activation_magnitude_ratio": -0.007629234343767166,
          "activation_dot_product": -0.0030232821591198444,
          "encoder_gradient_cosine_similarity": 0.0019486534874886274,
          "encoder_gradient_l2_distance": -0.018145764246582985,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0057212659157812595,
          "input_gradient_l2_distance": -0.015000421553850174,
          "input_gradient_dot_product": -0.0023741708137094975
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.560860529705465,
        "val_r": 0.4830425539446077,
        "n_iterations": 341,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.001172429881989956,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.020153222605586052,
          "interaction_matrix_overlap_bottom_k": 0.09863678365945816,
          "effective_rank": -0.002831331454217434,
          "effective_rank_mergeability_score": 0.0033253240399062634,
          "stable_rank": -0.002708843909204006,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0036113669630140066,
          "task_vector_l2_distance": -0.060933686792850494,
          "task_vector_dot_product": 0.0037024898920208216,
          "weight_space_angle": 0.0012501501478254795,
          "task_vector_magnitude_ratio": -0.010644536465406418,
          "singular_value_overlap": -0.054059796035289764,
          "subspace_overlap": 0.0163523368537426,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0034941297490149736,
          "activation_cosine_similarity": -0.0014468784211203456,
          "activation_magnitude_ratio": -0.017956044524908066,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0023742467164993286,
          "encoder_gradient_l2_distance": -0.024305429309606552,
          "encoder_gradient_dot_product": 0.00112737319432199,
          "input_gradient_cosine_similarity": 0.0020897360518574715,
          "input_gradient_l2_distance": -0.06262420117855072,
          "input_gradient_dot_product": -0.018027057871222496
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5698148547093072,
        "val_r": -0.15651963427983903,
        "n_iterations": 322,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004495238419622183,
          "right_subspace_overlap_bottom_k": -0.022598838433623314,
          "interaction_matrix_overlap_top_k": -0.03489469364285469,
          "interaction_matrix_overlap_bottom_k": 0.054812878370285034,
          "effective_rank": -0.0035971631295979023,
          "effective_rank_mergeability_score": 0.003158506704494357,
          "stable_rank": -0.0015583516797050834,
          "spectral_gap": -0.003341522067785263,
          "singular_value_ratio": 0.0030176499858498573,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.003040853887796402,
          "task_vector_l2_distance": -0.018123222514986992,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0024781632237136364,
          "task_vector_magnitude_ratio": -0.010984078049659729,
          "singular_value_overlap": -0.02688700333237648,
          "subspace_overlap": 0.023764370009303093,
          "right_subspace_overlap": 0.004769457504153252,
          "activation_l2_distance": -0.06137600913643837,
          "activation_cosine_similarity": -0.05201835557818413,
          "activation_magnitude_ratio": -0.01168079860508442,
          "activation_dot_product": -0.004220425151288509,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014994951896369457,
          "encoder_gradient_dot_product": 0.003242204198613763,
          "input_gradient_cosine_similarity": -0.003010892542079091,
          "input_gradient_l2_distance": -0.027319829910993576,
          "input_gradient_dot_product": -0.010323846712708473
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5338343706211505,
        "val_r": 0.3924115347553345,
        "n_iterations": 300,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.005601656623184681,
          "right_subspace_overlap_bottom_k": 0.03422198444604874,
          "interaction_matrix_overlap_top_k": -0.007416240405291319,
          "interaction_matrix_overlap_bottom_k": 0.0919426679611206,
          "effective_rank": -0.004143994301557541,
          "effective_rank_mergeability_score": 0.006654117256402969,
          "stable_rank": -0.0038023977540433407,
          "spectral_gap": 0.0023328769020736217,
          "singular_value_ratio": -0.001492504496127367,
          "layerwise_effective_rank": -0.0018948349170386791,
          "layerwise_effective_rank_mergeability_score": 0.0012986346846446395,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.07247309386730194,
          "task_vector_dot_product": 0.0012977754231542349,
          "weight_space_angle": 0.002060847356915474,
          "task_vector_magnitude_ratio": -0.014556784182786942,
          "singular_value_overlap": -0.06091949716210365,
          "subspace_overlap": 0.009175625629723072,
          "right_subspace_overlap": -0.006376564968377352,
          "activation_l2_distance": -0.002607855014503002,
          "activation_cosine_similarity": -0.0032008595298975706,
          "activation_magnitude_ratio": -0.01975644752383232,
          "activation_dot_product": -0.0017425562255084515,
          "encoder_gradient_cosine_similarity": -0.0045659891329705715,
          "encoder_gradient_l2_distance": -0.03769215568900108,
          "encoder_gradient_dot_product": -0.0027130485977977514,
          "input_gradient_cosine_similarity": 0.006017148960381746,
          "input_gradient_l2_distance": -0.05641360953450203,
          "input_gradient_dot_product": -0.005250285379588604
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5603775540916572,
        "val_r": 0.5243612769101097,
        "n_iterations": 361,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.02335813082754612,
          "interaction_matrix_overlap_top_k": -0.019770510494709015,
          "interaction_matrix_overlap_bottom_k": 0.0604156032204628,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0030614743009209633,
          "singular_value_ratio": 0.0029872253071516752,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02037574164569378,
          "task_vector_dot_product": 0.007314157672226429,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.013457708060741425,
          "singular_value_overlap": -0.018356043845415115,
          "subspace_overlap": 0.01109781302511692,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.005412072408944368,
          "activation_dot_product": -0.0033145826309919357,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.012029756791889668,
          "encoder_gradient_dot_product": -0.002436983399093151,
          "input_gradient_cosine_similarity": 0.001642234856262803,
          "input_gradient_l2_distance": -0.01930541917681694,
          "input_gradient_dot_product": -0.005523913539946079
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.538277035236556,
        "val_r": 0.5148377224298938,
        "n_iterations": 362,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.012912079691886902,
          "interaction_matrix_overlap_top_k": -0.021276652812957764,
          "interaction_matrix_overlap_bottom_k": 0.0838783010840416,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0020964927971363068,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.003338051028549671,
          "task_vector_l2_distance": -0.0418686717748642,
          "task_vector_dot_product": 0.013093501329421997,
          "weight_space_angle": -0.001526283915154636,
          "task_vector_magnitude_ratio": -0.019746968522667885,
          "singular_value_overlap": -0.03617256507277489,
          "subspace_overlap": 0.005073348991572857,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.008634447120130062,
          "activation_cosine_similarity": 0.003632613457739353,
          "activation_magnitude_ratio": -0.008076703175902367,
          "activation_dot_product": -0.0029380307532846928,
          "encoder_gradient_cosine_similarity": -0.001985362498089671,
          "encoder_gradient_l2_distance": -0.02006898634135723,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.007133388426154852,
          "input_gradient_l2_distance": -0.03431306406855583,
          "input_gradient_dot_product": -0.013245704583823681
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5662442548309677,
        "val_r": 0.6081022858582936,
        "n_iterations": 452,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0384383350610733,
          "interaction_matrix_overlap_top_k": -0.006906608585268259,
          "interaction_matrix_overlap_bottom_k": 0.07198836654424667,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0014330613194033504,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.023289304226636887,
          "task_vector_dot_product": 0.008540005423128605,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.007984270341694355,
          "singular_value_overlap": -0.023831019178032875,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0010038637556135654,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.004160567652434111,
          "activation_dot_product": -0.0036833295598626137,
          "encoder_gradient_cosine_similarity": -0.0013295038370415568,
          "encoder_gradient_l2_distance": -0.012620532885193825,
          "encoder_gradient_dot_product": -0.0020476169884204865,
          "input_gradient_cosine_similarity": 0.0049763754941523075,
          "input_gradient_l2_distance": -0.02180342935025692,
          "input_gradient_dot_product": -0.007581039797514677
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5330857690154672,
        "val_r": 0.563156544002997,
        "n_iterations": 372,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.004007193725556135,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.017933500930666924,
          "interaction_matrix_overlap_bottom_k": 0.10593242943286896,
          "effective_rank": -0.002405580598860979,
          "effective_rank_mergeability_score": 0.001732036704197526,
          "stable_rank": -0.0027170788962394,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0017577074468135834,
          "layerwise_effective_rank_mergeability_score": 0.0014367799740284681,
          "task_vector_cosine_similarity": -0.0014221478486433625,
          "task_vector_l2_distance": -0.07802008092403412,
          "task_vector_dot_product": 0.004202019423246384,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.020999528467655182,
          "singular_value_overlap": -0.0700092539191246,
          "subspace_overlap": 0.035130392760038376,
          "right_subspace_overlap": -0.0029063732363283634,
          "activation_l2_distance": -0.001990999560803175,
          "activation_cosine_similarity": -0.0029073385521769524,
          "activation_magnitude_ratio": -0.021183086559176445,
          "activation_dot_product": -0.01132587157189846,
          "encoder_gradient_cosine_similarity": -0.0018166393274441361,
          "encoder_gradient_l2_distance": -0.03652312979102135,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.004806915298104286,
          "input_gradient_l2_distance": -0.07962023466825485,
          "input_gradient_dot_product": -0.01830741949379444
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5756436150691993,
        "val_r": 0.3678858525625006,
        "n_iterations": 252,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0064362590201199055,
          "interaction_matrix_overlap_top_k": -0.001240458688698709,
          "interaction_matrix_overlap_bottom_k": 0.052260659635066986,
          "effective_rank": -0.0017205426702275872,
          "effective_rank_mergeability_score": 0.0013457490131258965,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0012391243362799287,
          "layerwise_effective_rank": 0.0015510983066633344,
          "layerwise_effective_rank_mergeability_score": -0.001335010165348649,
          "task_vector_cosine_similarity": -0.0013965535908937454,
          "task_vector_l2_distance": -0.04379516839981079,
          "task_vector_dot_product": 0.0029778270982205868,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.014786962419748306,
          "singular_value_overlap": -0.02276633121073246,
          "subspace_overlap": 0.0027379202656447887,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.017096105962991714,
          "activation_cosine_similarity": 0.006078317295759916,
          "activation_magnitude_ratio": -0.013904618099331856,
          "activation_dot_product": -0.007607273291796446,
          "encoder_gradient_cosine_similarity": -0.0034560482017695904,
          "encoder_gradient_l2_distance": -0.023877358064055443,
          "encoder_gradient_dot_product": 0.002044013701379299,
          "input_gradient_cosine_similarity": 0.0022081814240664244,
          "input_gradient_l2_distance": -0.033499717712402344,
          "input_gradient_dot_product": -0.013317348435521126
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5633588878193307,
        "val_r": 0.46120094210869417,
        "n_iterations": 345,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.007311064749956131,
          "interaction_matrix_overlap_top_k": -0.0041586123406887054,
          "interaction_matrix_overlap_bottom_k": 0.10044475644826889,
          "effective_rank": -0.002377826254814863,
          "effective_rank_mergeability_score": 0.002497876761481166,
          "stable_rank": -0.0032433720771223307,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0019963502418249846,
          "task_vector_l2_distance": -0.07589387148618698,
          "task_vector_dot_product": 0.00208712974563241,
          "weight_space_angle": 0.005322104319930077,
          "task_vector_magnitude_ratio": -0.012950848788022995,
          "singular_value_overlap": -0.06091611832380295,
          "subspace_overlap": 0.01334764901548624,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0152795584872365,
          "activation_cosine_similarity": -0.0022916540037840605,
          "activation_magnitude_ratio": -0.019225720316171646,
          "activation_dot_product": 0.006342749111354351,
          "encoder_gradient_cosine_similarity": 0.0045432355254888535,
          "encoder_gradient_l2_distance": -0.024264222010970116,
          "encoder_gradient_dot_product": 0.0017345290398225188,
          "input_gradient_cosine_similarity": 0.009884772822260857,
          "input_gradient_l2_distance": -0.06181155517697334,
          "input_gradient_dot_product": -0.017452050000429153
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6104428027031141,
        "val_r": 0.23751745926376067,
        "n_iterations": 288,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0088077113032341,
          "right_subspace_overlap_bottom_k": 0.005039295181632042,
          "interaction_matrix_overlap_top_k": -0.043715715408325195,
          "interaction_matrix_overlap_bottom_k": 0.06350643932819366,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0022030731197446585,
          "layerwise_effective_rank_mergeability_score": 0.00887567549943924,
          "task_vector_cosine_similarity": -0.0012308945879340172,
          "task_vector_l2_distance": -0.0364132821559906,
          "task_vector_dot_product": 0.001228060806170106,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004152111709117889,
          "singular_value_overlap": -0.019131336361169815,
          "subspace_overlap": 0.013255040161311626,
          "right_subspace_overlap": 0.011902139522135258,
          "activation_l2_distance": 0.006089456379413605,
          "activation_cosine_similarity": -0.006350652780383825,
          "activation_magnitude_ratio": -0.006353247445076704,
          "activation_dot_product": 0.009057938121259212,
          "encoder_gradient_cosine_similarity": -0.0024995650164783,
          "encoder_gradient_l2_distance": -0.008575733751058578,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.005258273798972368,
          "input_gradient_l2_distance": -0.03862564265727997,
          "input_gradient_dot_product": -0.006234833970665932
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7287692838131573,
        "val_r": 0.5528217105455469,
        "n_iterations": 291,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0438171811401844,
          "right_subspace_overlap_bottom_k": -0.018380558118224144,
          "interaction_matrix_overlap_top_k": -0.0020874382462352514,
          "interaction_matrix_overlap_bottom_k": 0.05198632553219795,
          "effective_rank": -0.002233702689409256,
          "effective_rank_mergeability_score": 0.0028792941011488438,
          "stable_rank": -0.006476621143519878,
          "spectral_gap": -0.0012580958427861333,
          "singular_value_ratio": 0.001485816785134375,
          "layerwise_effective_rank": -0.01386804599314928,
          "layerwise_effective_rank_mergeability_score": 0.033528491854667664,
          "task_vector_cosine_similarity": -0.012911317870020866,
          "task_vector_l2_distance": -0.007979756221175194,
          "task_vector_dot_product": -0.015076518058776855,
          "weight_space_angle": 0.009440504014492035,
          "task_vector_magnitude_ratio": 0.0016337028937414289,
          "singular_value_overlap": -0.04442860931158066,
          "subspace_overlap": -0.0050471932627260685,
          "right_subspace_overlap": 0.06753294914960861,
          "activation_l2_distance": -0.012595253996551037,
          "activation_cosine_similarity": 0.03513559699058533,
          "activation_magnitude_ratio": -0.022296549752354622,
          "activation_dot_product": 0.008602997288107872,
          "encoder_gradient_cosine_similarity": 0.011835791170597076,
          "encoder_gradient_l2_distance": -0.15515413880348206,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.1531587839126587,
          "input_gradient_dot_product": -0.021268241107463837
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6086036784306991,
        "val_r": 0.2775238495425718,
        "n_iterations": 434,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.00408566789701581,
          "right_subspace_overlap_bottom_k": 0.0031159999780356884,
          "interaction_matrix_overlap_top_k": -0.021438604220747948,
          "interaction_matrix_overlap_bottom_k": 0.037709012627601624,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0011229265946894884,
          "singular_value_ratio": 0.0014123020227998495,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.025977976620197296,
          "task_vector_dot_product": 0.010669861920177937,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.00842384621500969,
          "singular_value_overlap": -0.016015945002436638,
          "subspace_overlap": 0.018417129293084145,
          "right_subspace_overlap": -0.01384603139013052,
          "activation_l2_distance": 0.008145319297909737,
          "activation_cosine_similarity": -0.001466677407734096,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.01165381632745266,
          "encoder_gradient_cosine_similarity": -0.001279671909287572,
          "encoder_gradient_l2_distance": -0.009650119580328465,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.005801853258162737,
          "input_gradient_l2_distance": -0.022283313795924187,
          "input_gradient_dot_product": -0.004921041429042816
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  }
}