{
  "weight_avg": {
    "aggregate_metrics": {
      "train_r": 0.5732672128184724,
      "train_p": 6.202093137380893e-281,
      "val_r": 0.5141345528513949,
      "val_p": 1.5158152437614106e-25
    },
    "per_fold_stats": {
      "train_r_mean": 0.725547515382024,
      "train_r_std": 0.026382606463823222,
      "val_r_mean": 0.5614779613604306,
      "val_r_std": 0.17210797669719335,
      "n_nonzero_mean": 24.65,
      "n_nonzero_std": 2.1277922830953213
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.007256903685629368,
      "right_subspace_overlap_bottom_k": -0.006256594322621822,
      "interaction_matrix_overlap_top_k": 0.0023141668643802404,
      "interaction_matrix_overlap_bottom_k": -5.2033381507499143e-05,
      "effective_rank": 0.050724614411592484,
      "effective_rank_mergeability_score": 0.03915776312351227,
      "stable_rank": 0.00378103693947196,
      "spectral_gap": 0.040649522095918655,
      "singular_value_ratio": 0.038104742765426636,
      "layerwise_effective_rank": 0.04318822920322418,
      "layerwise_effective_rank_mergeability_score": 0.06268628686666489,
      "task_vector_cosine_similarity": 0.07740236818790436,
      "task_vector_l2_distance": -0.0037744524888694286,
      "task_vector_dot_product": 0.0021373070776462555,
      "weight_space_angle": 0.09100255370140076,
      "task_vector_magnitude_ratio": 0.0020202784799039364,
      "singular_value_overlap": 0.0004897821927443147,
      "subspace_overlap": 0.0039537991397082806,
      "right_subspace_overlap": 0.006161978468298912,
      "activation_l2_distance": 0.019640948623418808,
      "activation_cosine_similarity": 0.02699042297899723,
      "activation_magnitude_ratio": -0.0006416704854927957,
      "activation_dot_product": 0.002063560765236616,
      "encoder_gradient_cosine_similarity": 0.004193493165075779,
      "encoder_gradient_l2_distance": -0.014128519222140312,
      "encoder_gradient_dot_product": 0.0024707228876650333,
      "input_gradient_cosine_similarity": 0.0035860624630004168,
      "input_gradient_l2_distance": -0.013320401310920715,
      "input_gradient_dot_product": -0.0005674147978425026
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.003232428105548024,
      "right_subspace_overlap_bottom_k": 0.0028295996598899364,
      "interaction_matrix_overlap_top_k": 0.0017639865400269628,
      "interaction_matrix_overlap_bottom_k": 0.0009884311584755778,
      "effective_rank": 0.013661222532391548,
      "effective_rank_mergeability_score": 0.013331720605492592,
      "stable_rank": 0.006728705950081348,
      "spectral_gap": 0.00991460494697094,
      "singular_value_ratio": 0.01055691484361887,
      "layerwise_effective_rank": 0.011544610373675823,
      "layerwise_effective_rank_mergeability_score": 0.015954403206706047,
      "task_vector_cosine_similarity": 0.01015794649720192,
      "task_vector_l2_distance": 0.0028690630570054054,
      "task_vector_dot_product": 0.0017767813988029957,
      "weight_space_angle": 0.012260559014976025,
      "task_vector_magnitude_ratio": 0.001797739416360855,
      "singular_value_overlap": 0.0010779222939163446,
      "subspace_overlap": 0.0030988906510174274,
      "right_subspace_overlap": 0.0036388146691024303,
      "activation_l2_distance": 0.009562560357153416,
      "activation_cosine_similarity": 0.010763346217572689,
      "activation_magnitude_ratio": 0.0013862296473234892,
      "activation_dot_product": 0.0027211711276322603,
      "encoder_gradient_cosine_similarity": 0.0016030835686251521,
      "encoder_gradient_l2_distance": 0.003162519307807088,
      "encoder_gradient_dot_product": 0.0017200745642185211,
      "input_gradient_cosine_similarity": 0.0026457614731043577,
      "input_gradient_l2_distance": 0.004842014517635107,
      "input_gradient_dot_product": 0.0013075278839096427
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.95,
      "right_subspace_overlap_bottom_k": 0.95,
      "interaction_matrix_overlap_top_k": 0.8,
      "interaction_matrix_overlap_bottom_k": 0.35,
      "effective_rank": 1.0,
      "effective_rank_mergeability_score": 1.0,
      "stable_rank": 0.75,
      "spectral_gap": 1.0,
      "singular_value_ratio": 1.0,
      "layerwise_effective_rank": 1.0,
      "layerwise_effective_rank_mergeability_score": 1.0,
      "task_vector_cosine_similarity": 1.0,
      "task_vector_l2_distance": 0.9,
      "task_vector_dot_product": 0.75,
      "weight_space_angle": 1.0,
      "task_vector_magnitude_ratio": 0.7,
      "singular_value_overlap": 0.6,
      "subspace_overlap": 0.9,
      "right_subspace_overlap": 0.9,
      "activation_l2_distance": 1.0,
      "activation_cosine_similarity": 0.95,
      "activation_magnitude_ratio": 0.3,
      "activation_dot_product": 0.65,
      "encoder_gradient_cosine_similarity": 1.0,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.8,
      "input_gradient_cosine_similarity": 0.9,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.5
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7299705056590243,
        "val_r": 0.5551635884900401,
        "n_iterations": 286,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010652112774550915,
          "right_subspace_overlap_bottom_k": -0.003294107737019658,
          "interaction_matrix_overlap_top_k": 0.002259379019960761,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.03700217977166176,
          "effective_rank_mergeability_score": 0.03944568708539009,
          "stable_rank": 0.0035182505380362272,
          "spectral_gap": 0.034511685371398926,
          "singular_value_ratio": 0.029475906863808632,
          "layerwise_effective_rank": 0.03159857913851738,
          "layerwise_effective_rank_mergeability_score": 0.03871572017669678,
          "task_vector_cosine_similarity": 0.09456640481948853,
          "task_vector_l2_distance": -0.010124141350388527,
          "task_vector_dot_product": 0.004792379215359688,
          "weight_space_angle": 0.12145605683326721,
          "task_vector_magnitude_ratio": 0.006178956013172865,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.005327718332409859,
          "right_subspace_overlap": 0.011404250748455524,
          "activation_l2_distance": 0.02828570082783699,
          "activation_cosine_similarity": 0.04101958125829697,
          "activation_magnitude_ratio": -0.004440027289092541,
          "activation_dot_product": 0.005319193471223116,
          "encoder_gradient_cosine_similarity": 0.008160467259585857,
          "encoder_gradient_l2_distance": -0.021943191066384315,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.011319334618747234,
          "input_gradient_l2_distance": -0.02481919154524803,
          "input_gradient_dot_product": 0.0026031741872429848
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7071004946409631,
        "val_r": 0.5889615569174086,
        "n_iterations": 412,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.013867753557860851,
          "right_subspace_overlap_bottom_k": -0.006684088613837957,
          "interaction_matrix_overlap_top_k": 0.0021539817098528147,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.05782417953014374,
          "effective_rank_mergeability_score": 0.04128323867917061,
          "stable_rank": 0.001700354041531682,
          "spectral_gap": 0.036437876522541046,
          "singular_value_ratio": 0.03441515937447548,
          "layerwise_effective_rank": 0.04424477368593216,
          "layerwise_effective_rank_mergeability_score": 0.06413581967353821,
          "task_vector_cosine_similarity": 0.07208438962697983,
          "task_vector_l2_distance": -0.004073963034898043,
          "task_vector_dot_product": 0.0038360124453902245,
          "weight_space_angle": 0.08899416029453278,
          "task_vector_magnitude_ratio": 0.00116393540520221,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.00506768561899662,
          "right_subspace_overlap": 0.008391750045120716,
          "activation_l2_distance": 0.023534148931503296,
          "activation_cosine_similarity": 0.031987790018320084,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.00395481800660491,
          "encoder_gradient_l2_distance": -0.014683985151350498,
          "encoder_gradient_dot_product": 0.004922904074192047,
          "input_gradient_cosine_similarity": 0.001357418135739863,
          "input_gradient_l2_distance": -0.013432914391160011,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7055792046488323,
        "val_r": 0.680066734510155,
        "n_iterations": 331,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010123279877007008,
          "right_subspace_overlap_bottom_k": -0.004662083927541971,
          "interaction_matrix_overlap_top_k": 0.002997229341417551,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.07364872843027115,
          "effective_rank_mergeability_score": 0.05758683383464813,
          "stable_rank": 0.006648491136729717,
          "spectral_gap": 0.03624473884701729,
          "singular_value_ratio": 0.03198671713471413,
          "layerwise_effective_rank": 0.029955608770251274,
          "layerwise_effective_rank_mergeability_score": 0.05991050601005554,
          "task_vector_cosine_similarity": 0.07075385749340057,
          "task_vector_l2_distance": -0.0023899273946881294,
          "task_vector_dot_product": 0.0036671538837254047,
          "weight_space_angle": 0.0811660885810852,
          "task_vector_magnitude_ratio": 0.001374998944811523,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.004944056738168001,
          "right_subspace_overlap": 0.009518186561763287,
          "activation_l2_distance": 0.018263675272464752,
          "activation_cosine_similarity": 0.027491802349686623,
          "activation_magnitude_ratio": -0.0021524359472095966,
          "activation_dot_product": 0.004190477076917887,
          "encoder_gradient_cosine_similarity": 0.0031634115148335695,
          "encoder_gradient_l2_distance": -0.011382377706468105,
          "encoder_gradient_dot_product": 0.0023106071166694164,
          "input_gradient_cosine_similarity": 0.0023047160357236862,
          "input_gradient_l2_distance": -0.013926905579864979,
          "input_gradient_dot_product": -0.0024718751665204763
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7113545088731207,
        "val_r": 0.6321037868009347,
        "n_iterations": 265,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009817564859986305,
          "right_subspace_overlap_bottom_k": -0.003275918308645487,
          "interaction_matrix_overlap_top_k": 0.0052430639043450356,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.07277730107307434,
          "effective_rank_mergeability_score": 0.055337853729724884,
          "stable_rank": 0.003879319177940488,
          "spectral_gap": 0.04953338950872421,
          "singular_value_ratio": 0.04872004687786102,
          "layerwise_effective_rank": 0.013371269218623638,
          "layerwise_effective_rank_mergeability_score": 0.043116092681884766,
          "task_vector_cosine_similarity": 0.05486813932657242,
          "task_vector_l2_distance": -0.0037829638458788395,
          "task_vector_dot_product": 0.0029809807892888784,
          "weight_space_angle": 0.07801777124404907,
          "task_vector_magnitude_ratio": 0.004383991938084364,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0026108170859515667,
          "right_subspace_overlap": 0.00773673877120018,
          "activation_l2_distance": 0.027388855814933777,
          "activation_cosine_similarity": 0.0369512103497982,
          "activation_magnitude_ratio": 0.0011216300772503018,
          "activation_dot_product": 0.004714303649961948,
          "encoder_gradient_cosine_similarity": 0.004861517809331417,
          "encoder_gradient_l2_distance": -0.017323369160294533,
          "encoder_gradient_dot_product": 0.005021573044359684,
          "input_gradient_cosine_similarity": 0.006020974833518267,
          "input_gradient_l2_distance": -0.02470904402434826,
          "input_gradient_dot_product": -0.001774105243384838
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.728181791137263,
        "val_r": 0.6920051601907778,
        "n_iterations": 328,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009020921774208546,
          "right_subspace_overlap_bottom_k": -0.006064691115170717,
          "interaction_matrix_overlap_top_k": 0.0016289276536554098,
          "interaction_matrix_overlap_bottom_k": 0.0012105291243642569,
          "effective_rank": 0.05067787319421768,
          "effective_rank_mergeability_score": 0.03619230538606644,
          "stable_rank": 0.0,
          "spectral_gap": 0.03846118226647377,
          "singular_value_ratio": 0.035251911729574203,
          "layerwise_effective_rank": 0.04365047067403793,
          "layerwise_effective_rank_mergeability_score": 0.06086773797869682,
          "task_vector_cosine_similarity": 0.0942806527018547,
          "task_vector_l2_distance": -0.006310341879725456,
          "task_vector_dot_product": 0.0015132722910493612,
          "weight_space_angle": 0.103736013174057,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.004419977776706219,
          "right_subspace_overlap": 0.0049092997796833515,
          "activation_l2_distance": 0.014453105628490448,
          "activation_cosine_similarity": 0.021731138229370117,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0033211386762559414,
          "encoder_gradient_cosine_similarity": 0.0030149894300848246,
          "encoder_gradient_l2_distance": -0.01381415594369173,
          "encoder_gradient_dot_product": 0.0019237210508435965,
          "input_gradient_cosine_similarity": 0.004849226213991642,
          "input_gradient_l2_distance": -0.013469822704792023,
          "input_gradient_dot_product": -0.0018117236904799938
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.749197238381563,
        "val_r": 0.7219357464278046,
        "n_iterations": 347,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00885577592998743,
          "right_subspace_overlap_bottom_k": -0.005592481233179569,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0012584580108523369,
          "effective_rank": 0.04768598452210426,
          "effective_rank_mergeability_score": 0.03396258130669594,
          "stable_rank": 0.001156987389549613,
          "spectral_gap": 0.06069417670369148,
          "singular_value_ratio": 0.05896078422665596,
          "layerwise_effective_rank": 0.04953683167695999,
          "layerwise_effective_rank_mergeability_score": 0.0651233047246933,
          "task_vector_cosine_similarity": 0.07261301577091217,
          "task_vector_l2_distance": -0.002041037194430828,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.08311732113361359,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0034951562993228436,
          "right_subspace_overlap": 0.0021572187542915344,
          "activation_l2_distance": 0.008105498738586903,
          "activation_cosine_similarity": 0.017522120848298073,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0034186793491244316,
          "encoder_gradient_l2_distance": -0.013241183944046497,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002440276090055704,
          "input_gradient_l2_distance": -0.006760688964277506,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7245383501916309,
        "val_r": 0.4208170732507355,
        "n_iterations": 205,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006499932613223791,
          "right_subspace_overlap_bottom_k": -0.012533307075500488,
          "interaction_matrix_overlap_top_k": 0.006639027968049049,
          "interaction_matrix_overlap_bottom_k": -0.001488225650973618,
          "effective_rank": 0.05117232725024223,
          "effective_rank_mergeability_score": 0.029254069551825523,
          "stable_rank": 0.002105854917317629,
          "spectral_gap": 0.04939967766404152,
          "singular_value_ratio": 0.04415871948003769,
          "layerwise_effective_rank": 0.04128403961658478,
          "layerwise_effective_rank_mergeability_score": 0.0727430135011673,
          "task_vector_cosine_similarity": 0.0677800104022026,
          "task_vector_l2_distance": -0.0027355521451681852,
          "task_vector_dot_product": 0.0013631765032187104,
          "weight_space_angle": 0.0762789398431778,
          "task_vector_magnitude_ratio": 0.004344502929598093,
          "singular_value_overlap": 0.0014708263333886862,
          "subspace_overlap": 0.004648478236049414,
          "right_subspace_overlap": 0.005028815474361181,
          "activation_l2_distance": 0.02196209691464901,
          "activation_cosine_similarity": 0.040095627307891846,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0016576119232922792,
          "encoder_gradient_cosine_similarity": 0.006334634032100439,
          "encoder_gradient_l2_distance": -0.019557688385248184,
          "encoder_gradient_dot_product": 0.003772786818444729,
          "input_gradient_cosine_similarity": 0.0016023452626541257,
          "input_gradient_l2_distance": -0.011473692953586578,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6831339764476685,
        "val_r": 0.3496532596433283,
        "n_iterations": 396,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010775959119200706,
          "right_subspace_overlap_bottom_k": -0.007329413201659918,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.060134872794151306,
          "effective_rank_mergeability_score": 0.04132317379117012,
          "stable_rank": 0.0027781426906585693,
          "spectral_gap": 0.04795496165752411,
          "singular_value_ratio": 0.04665835201740265,
          "layerwise_effective_rank": 0.0365806519985199,
          "layerwise_effective_rank_mergeability_score": 0.05950561538338661,
          "task_vector_cosine_similarity": 0.07150042057037354,
          "task_vector_l2_distance": -0.005150907672941685,
          "task_vector_dot_product": 0.002233077073469758,
          "weight_space_angle": 0.07849389314651489,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0016325224423781037,
          "subspace_overlap": 0.005358985159546137,
          "right_subspace_overlap": 0.00706941494718194,
          "activation_l2_distance": 0.018950868397951126,
          "activation_cosine_similarity": 0.024815429002046585,
          "activation_magnitude_ratio": -0.0012112482218071818,
          "activation_dot_product": 0.002350347116589546,
          "encoder_gradient_cosine_similarity": 0.006919724866747856,
          "encoder_gradient_l2_distance": -0.014672772958874702,
          "encoder_gradient_dot_product": 0.0030045686289668083,
          "input_gradient_cosine_similarity": 0.0021579754538834095,
          "input_gradient_l2_distance": -0.009181132540106773,
          "input_gradient_dot_product": 0.0015578812453895807
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7258136278333361,
        "val_r": 0.193291082363055,
        "n_iterations": 201,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004283341579139233,
          "right_subspace_overlap_bottom_k": -0.00772884814068675,
          "interaction_matrix_overlap_top_k": 0.0017044155392795801,
          "interaction_matrix_overlap_bottom_k": -0.0023219771683216095,
          "effective_rank": 0.027292540296912193,
          "effective_rank_mergeability_score": 0.05023341625928879,
          "stable_rank": 0.03198331221938133,
          "spectral_gap": 0.030010459944605827,
          "singular_value_ratio": 0.029209697619080544,
          "layerwise_effective_rank": 0.041181936860084534,
          "layerwise_effective_rank_mergeability_score": 0.05997186899185181,
          "task_vector_cosine_similarity": 0.06898049265146255,
          "task_vector_l2_distance": -0.0028965198434889317,
          "task_vector_dot_product": 0.004516848362982273,
          "weight_space_angle": 0.08559219539165497,
          "task_vector_magnitude_ratio": 0.002659840974956751,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.001191380200907588,
          "right_subspace_overlap": 0.007424985058605671,
          "activation_l2_distance": 0.0222152266651392,
          "activation_cosine_similarity": 0.028552241623401642,
          "activation_magnitude_ratio": -0.0036570592783391476,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0052565596997737885,
          "encoder_gradient_l2_distance": -0.011828400194644928,
          "encoder_gradient_dot_product": 0.003923060372471809,
          "input_gradient_cosine_similarity": 0.004330417141318321,
          "input_gradient_l2_distance": -0.01604398898780346,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7108073235000623,
        "val_r": 0.48828662267240003,
        "n_iterations": 341,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009772106073796749,
          "right_subspace_overlap_bottom_k": -0.007681564893573523,
          "interaction_matrix_overlap_top_k": 0.004445794969797134,
          "interaction_matrix_overlap_bottom_k": 0.002536914311349392,
          "effective_rank": 0.044177085161209106,
          "effective_rank_mergeability_score": 0.028184935450553894,
          "stable_rank": 0.0,
          "spectral_gap": 0.05584338679909706,
          "singular_value_ratio": 0.05498843267560005,
          "layerwise_effective_rank": 0.06614251434803009,
          "layerwise_effective_rank_mergeability_score": 0.08969587087631226,
          "task_vector_cosine_similarity": 0.06498917192220688,
          "task_vector_l2_distance": -0.004360982216894627,
          "task_vector_dot_product": 0.0027566379867494106,
          "weight_space_angle": 0.08249451965093613,
          "task_vector_magnitude_ratio": 0.002895105630159378,
          "singular_value_overlap": -0.0013657500967383385,
          "subspace_overlap": 0.006597355008125305,
          "right_subspace_overlap": 0.00880658533424139,
          "activation_l2_distance": 0.0028157716151326895,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.001090307254344225,
          "encoder_gradient_cosine_similarity": 0.004044767003506422,
          "encoder_gradient_l2_distance": -0.014148646034300327,
          "encoder_gradient_dot_product": 0.00286905188113451,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015989631414413452,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7491590790332391,
        "val_r": 0.16149619340693272,
        "n_iterations": 334,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003580225631594658,
          "right_subspace_overlap_bottom_k": -0.0037005734629929066,
          "interaction_matrix_overlap_top_k": 0.0016414023702964187,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.052388980984687805,
          "effective_rank_mergeability_score": 0.06353820860385895,
          "stable_rank": 0.0022920251358300447,
          "spectral_gap": 0.040667153894901276,
          "singular_value_ratio": 0.039712902158498764,
          "layerwise_effective_rank": 0.05258651077747345,
          "layerwise_effective_rank_mergeability_score": 0.04887818545103073,
          "task_vector_cosine_similarity": 0.08046378940343857,
          "task_vector_l2_distance": -0.00286734476685524,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.085660919547081,
          "task_vector_magnitude_ratio": 0.0021295950282365084,
          "singular_value_overlap": 0.0011859023943543434,
          "subspace_overlap": -0.0010612154146656394,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.007849869318306446,
          "activation_cosine_similarity": 0.01650463417172432,
          "activation_magnitude_ratio": -0.002494269050657749,
          "activation_dot_product": 0.0017175008542835712,
          "encoder_gradient_cosine_similarity": 0.002871408360078931,
          "encoder_gradient_l2_distance": -0.014033820480108261,
          "encoder_gradient_dot_product": 0.0011935359798371792,
          "input_gradient_cosine_similarity": 0.0023803813382983208,
          "input_gradient_l2_distance": -0.005103535018861294,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7367590044829082,
        "val_r": 0.691607793952778,
        "n_iterations": 415,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006424675229936838,
          "right_subspace_overlap_bottom_k": -0.008995573036372662,
          "interaction_matrix_overlap_top_k": 0.0024379827082157135,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.026882892474532127,
          "effective_rank_mergeability_score": 0.03828616067767143,
          "stable_rank": 0.003788462607190013,
          "spectral_gap": 0.044542767107486725,
          "singular_value_ratio": 0.03960946202278137,
          "layerwise_effective_rank": 0.034224070608615875,
          "layerwise_effective_rank_mergeability_score": 0.026538429781794548,
          "task_vector_cosine_similarity": 0.08403538167476654,
          "task_vector_l2_distance": -0.0017554882215335965,
          "task_vector_dot_product": 0.0064531187526881695,
          "weight_space_angle": 0.11107612401247025,
          "task_vector_magnitude_ratio": 0.0037926621735095978,
          "singular_value_overlap": 0.0010155412601307034,
          "subspace_overlap": 0.01168283261358738,
          "right_subspace_overlap": 0.0028327093459665775,
          "activation_l2_distance": 0.035810437053442,
          "activation_cosine_similarity": 0.039703696966171265,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.004968469496816397,
          "encoder_gradient_cosine_similarity": 0.004330002702772617,
          "encoder_gradient_l2_distance": -0.012670150958001614,
          "encoder_gradient_dot_product": 0.001106677227653563,
          "input_gradient_cosine_similarity": 0.006544434931129217,
          "input_gradient_l2_distance": -0.0149656031280756,
          "input_gradient_dot_product": -0.0014396619517356157
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7231181045808794,
        "val_r": 0.6376310909896931,
        "n_iterations": 411,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0071691726334393024,
          "right_subspace_overlap_bottom_k": -0.004026518203318119,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.049762338399887085,
          "effective_rank_mergeability_score": 0.023134469985961914,
          "stable_rank": 0.002570144599303603,
          "spectral_gap": 0.032864633947610855,
          "singular_value_ratio": 0.031697746366262436,
          "layerwise_effective_rank": 0.04698869213461876,
          "layerwise_effective_rank_mergeability_score": 0.07866466790437698,
          "task_vector_cosine_similarity": 0.07683892548084259,
          "task_vector_l2_distance": -0.0010176151990890503,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07542300969362259,
          "task_vector_magnitude_ratio": 0.00143460463732481,
          "singular_value_overlap": 0.0015761996619403362,
          "subspace_overlap": 0.0011868771398440003,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.035300273448228836,
          "activation_cosine_similarity": 0.038404904305934906,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.005850032437592745,
          "encoder_gradient_l2_distance": -0.008640985935926437,
          "encoder_gradient_dot_product": 0.004176896996796131,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010863340459764004,
          "input_gradient_dot_product": -0.0023949421010911465
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7345959517145335,
        "val_r": 0.8346019441743311,
        "n_iterations": 422,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006611368618905544,
          "right_subspace_overlap_bottom_k": -0.007789508439600468,
          "interaction_matrix_overlap_top_k": 0.0034281667321920395,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.05076514184474945,
          "effective_rank_mergeability_score": 0.03879496827721596,
          "stable_rank": 0.0060572754591703415,
          "spectral_gap": 0.047896623611450195,
          "singular_value_ratio": 0.04877520352602005,
          "layerwise_effective_rank": 0.035315144807100296,
          "layerwise_effective_rank_mergeability_score": 0.058222390711307526,
          "task_vector_cosine_similarity": 0.08443621546030045,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.09493464976549149,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0015679971547797322,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.009885418228805065,
          "activation_l2_distance": 0.012172301299870014,
          "activation_cosine_similarity": 0.02029431238770485,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.003981086425483227,
          "encoder_gradient_cosine_similarity": 0.0028616259805858135,
          "encoder_gradient_l2_distance": -0.012313893996179104,
          "encoder_gradient_dot_product": 0.003093636129051447,
          "input_gradient_cosine_similarity": 0.0031083894427865744,
          "input_gradient_l2_distance": -0.011861108243465424,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7116389015059359,
        "val_r": 0.7562881368099804,
        "n_iterations": 254,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006249363999813795,
          "right_subspace_overlap_bottom_k": -0.008535921573638916,
          "interaction_matrix_overlap_top_k": 0.0010841813636943698,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.06465297937393188,
          "effective_rank_mergeability_score": 0.051063165068626404,
          "stable_rank": 0.00195146759506315,
          "spectral_gap": 0.032512202858924866,
          "singular_value_ratio": 0.03156299516558647,
          "layerwise_effective_rank": 0.04665611684322357,
          "layerwise_effective_rank_mergeability_score": 0.061853013932704926,
          "task_vector_cosine_similarity": 0.08450044691562653,
          "task_vector_l2_distance": -0.0025105876848101616,
          "task_vector_dot_product": 0.001296613598242402,
          "weight_space_angle": 0.09625956416130066,
          "task_vector_magnitude_ratio": 0.0017599457642063498,
          "singular_value_overlap": -0.0010646459413692355,
          "subspace_overlap": 0.003869944252073765,
          "right_subspace_overlap": 0.007312229368835688,
          "activation_l2_distance": 0.006970238406211138,
          "activation_cosine_similarity": 0.01615005172789097,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.002337832935154438,
          "encoder_gradient_cosine_similarity": 0.004626682493835688,
          "encoder_gradient_l2_distance": -0.015170182101428509,
          "encoder_gradient_dot_product": 0.002000346314162016,
          "input_gradient_cosine_similarity": 0.003516371129080653,
          "input_gradient_l2_distance": -0.015147886238992214,
          "input_gradient_dot_product": -0.0013156457571312785
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7310283359002613,
        "val_r": 0.5461072954188364,
        "n_iterations": 276,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007029427215456963,
          "right_subspace_overlap_bottom_k": -0.005796416196972132,
          "interaction_matrix_overlap_top_k": 0.004230639431625605,
          "interaction_matrix_overlap_bottom_k": -0.0010866487864404917,
          "effective_rank": 0.032814040780067444,
          "effective_rank_mergeability_score": 0.03050496242940426,
          "stable_rank": 0.0,
          "spectral_gap": 0.05485738068819046,
          "singular_value_ratio": 0.05152135342359543,
          "layerwise_effective_rank": 0.04109668731689453,
          "layerwise_effective_rank_mergeability_score": 0.05113707482814789,
          "task_vector_cosine_similarity": 0.07802028954029083,
          "task_vector_l2_distance": -0.009893644601106644,
          "task_vector_dot_product": 0.0022102310322225094,
          "weight_space_angle": 0.09446515142917633,
          "task_vector_magnitude_ratio": 0.0011394284665584564,
          "singular_value_overlap": 0.0019320063292980194,
          "subspace_overlap": 0.0011924590216949582,
          "right_subspace_overlap": 0.008616099134087563,
          "activation_l2_distance": 0.034257542341947556,
          "activation_cosine_similarity": 0.0387101024389267,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0027942790184170008,
          "encoder_gradient_l2_distance": -0.01421879231929779,
          "encoder_gradient_dot_product": 0.0021386086009442806,
          "input_gradient_cosine_similarity": 0.00272355112247169,
          "input_gradient_l2_distance": -0.01090907771140337,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6704255072323227,
        "val_r": 0.5395833185364547,
        "n_iterations": 276,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006258642300963402,
          "right_subspace_overlap_bottom_k": -0.004891207441687584,
          "interaction_matrix_overlap_top_k": 0.0016500517958775163,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.04531100019812584,
          "effective_rank_mergeability_score": 0.031877271831035614,
          "stable_rank": 0.002202631440013647,
          "spectral_gap": 0.034383270889520645,
          "singular_value_ratio": 0.0334654301404953,
          "layerwise_effective_rank": 0.04880528897047043,
          "layerwise_effective_rank_mergeability_score": 0.06560840457677841,
          "task_vector_cosine_similarity": 0.08698318898677826,
          "task_vector_l2_distance": -0.0034770960919559,
          "task_vector_dot_product": 0.0012794939102604985,
          "weight_space_angle": 0.10220761597156525,
          "task_vector_magnitude_ratio": 0.0040054405108094215,
          "singular_value_overlap": 0.0011496192310005426,
          "subspace_overlap": 0.006835200358182192,
          "right_subspace_overlap": 0.010720597580075264,
          "activation_l2_distance": 0.019971119239926338,
          "activation_cosine_similarity": 0.02650386095046997,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0014406373957172036,
          "encoder_gradient_cosine_similarity": 0.0031687559094280005,
          "encoder_gradient_l2_distance": -0.010347869247198105,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0012872666120529175,
          "input_gradient_l2_distance": -0.009889396838843822,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7396097423230633,
        "val_r": 0.5159454649370347,
        "n_iterations": 314,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012855667155236006,
          "right_subspace_overlap_bottom_k": -0.005225132219493389,
          "interaction_matrix_overlap_top_k": 0.0027609311509877443,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.04871590435504913,
          "effective_rank_mergeability_score": 0.009528874419629574,
          "stable_rank": 0.002988019958138466,
          "spectral_gap": 0.024532627314329147,
          "singular_value_ratio": 0.018939480185508728,
          "layerwise_effective_rank": 0.04204833135008812,
          "layerwise_effective_rank_mergeability_score": 0.0840551033616066,
          "task_vector_cosine_similarity": 0.0932852029800415,
          "task_vector_l2_distance": -0.0014866129495203495,
          "task_vector_dot_product": 0.0016974823083728552,
          "weight_space_angle": 0.10439832508563995,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0014498821692541242,
          "subspace_overlap": 0.009146506898105145,
          "right_subspace_overlap": 0.00539398193359375,
          "activation_l2_distance": 0.024206260219216347,
          "activation_cosine_similarity": 0.03488028794527054,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.003817114047706127,
          "encoder_gradient_l2_distance": -0.018565600737929344,
          "encoder_gradient_dot_product": 0.0057094828225672245,
          "input_gradient_cosine_similarity": 0.006263331975787878,
          "input_gradient_l2_distance": -0.015037929639220238,
          "input_gradient_dot_product": -0.001929338090121746
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.735643404448849,
        "val_r": 0.5093971085923642,
        "n_iterations": 316,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00686088390648365,
          "right_subspace_overlap_bottom_k": -0.011324544437229633,
          "interaction_matrix_overlap_top_k": 0.001978157553821802,
          "interaction_matrix_overlap_bottom_k": -0.0011497174855321646,
          "effective_rank": 0.04483836144208908,
          "effective_rank_mergeability_score": 0.025176847353577614,
          "stable_rank": 0.0,
          "spectral_gap": 0.026177864521741867,
          "singular_value_ratio": 0.022455738857388496,
          "layerwise_effective_rank": 0.06355030834674835,
          "layerwise_effective_rank_mergeability_score": 0.08990047127008438,
          "task_vector_cosine_similarity": 0.07297249883413315,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.09360288083553314,
          "task_vector_magnitude_ratio": 0.003142560599371791,
          "singular_value_overlap": 0.0023815371096134186,
          "subspace_overlap": 0.0025617722421884537,
          "right_subspace_overlap": 0.007538631092756987,
          "activation_l2_distance": 0.021655870601534843,
          "activation_cosine_similarity": 0.02583937533199787,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.00306151295080781,
          "encoder_gradient_l2_distance": -0.010373438708484173,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003007507650181651,
          "input_gradient_l2_distance": -0.008336995728313923,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8032952551050219,
        "val_r": 0.7146162691235663,
        "n_iterations": 510,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.07596763223409653,
          "effective_rank_mergeability_score": 0.05844622105360031,
          "stable_rank": 0.0,
          "spectral_gap": 0.03546435385942459,
          "singular_value_ratio": 0.03052879497408867,
          "layerwise_effective_rank": 0.05494677647948265,
          "layerwise_effective_rank_mergeability_score": 0.0750824362039566,
          "task_vector_cosine_similarity": 0.07409486174583435,
          "task_vector_l2_distance": -0.00861432310193777,
          "task_vector_dot_product": 0.0021496654953807592,
          "weight_space_angle": 0.08267571032047272,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0015073411632329226,
          "activation_l2_distance": 0.008650130592286587,
          "activation_cosine_similarity": 0.01265023648738861,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.009678147733211517,
          "encoder_gradient_cosine_similarity": 0.0013588883448392153,
          "encoder_gradient_l2_distance": -0.01363985426723957,
          "encoder_gradient_dot_product": 0.002246994525194168,
          "input_gradient_cosine_similarity": 0.006507327780127525,
          "input_gradient_l2_distance": -0.014486150816082954,
          "input_gradient_dot_product": -0.002372058806940913
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_r": 0.36523958100052206,
      "train_p": 2.9692774409609538e-102,
      "val_r": 0.1133057721352425,
      "val_p": 0.03209265218512175
    },
    "per_fold_stats": {
      "train_r_mean": 0.5465391367599152,
      "train_r_std": 0.07820556430973429,
      "val_r_mean": 0.41989531015863346,
      "val_r_std": 0.1717412182174602,
      "n_nonzero_mean": 24.85,
      "n_nonzero_std": 2.4753787588973126
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0038630622439086437,
      "right_subspace_overlap_bottom_k": 0.0007589542656205595,
      "interaction_matrix_overlap_top_k": 0.0024459243286401033,
      "interaction_matrix_overlap_bottom_k": 0.011242149397730827,
      "effective_rank": 0.04197682812809944,
      "effective_rank_mergeability_score": 0.05645439028739929,
      "stable_rank": 0.010606127791106701,
      "spectral_gap": 0.054473478347063065,
      "singular_value_ratio": 0.04766102880239487,
      "layerwise_effective_rank": 0.05099276825785637,
      "layerwise_effective_rank_mergeability_score": 0.050280600786209106,
      "task_vector_cosine_similarity": 0.07598420232534409,
      "task_vector_l2_distance": -0.011571855284273624,
      "task_vector_dot_product": 0.0009202024666592479,
      "weight_space_angle": 0.08328479528427124,
      "task_vector_magnitude_ratio": 0.0009617680916562676,
      "singular_value_overlap": -0.005503048188984394,
      "subspace_overlap": 0.006451759487390518,
      "right_subspace_overlap": 0.0027673617005348206,
      "activation_l2_distance": 0.012015430256724358,
      "activation_cosine_similarity": 0.014312486164271832,
      "activation_magnitude_ratio": 0.00025082993670366704,
      "activation_dot_product": 0.004850971978157759,
      "encoder_gradient_cosine_similarity": 0.002875309204682708,
      "encoder_gradient_l2_distance": -0.011458508670330048,
      "encoder_gradient_dot_product": 0.003672781167551875,
      "input_gradient_cosine_similarity": 0.00384212052449584,
      "input_gradient_l2_distance": -0.016613174229860306,
      "input_gradient_dot_product": -0.00020923660486005247
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.0055230725556612015,
      "right_subspace_overlap_bottom_k": 0.0028261623810976744,
      "interaction_matrix_overlap_top_k": 0.003556023584678769,
      "interaction_matrix_overlap_bottom_k": 0.004581043031066656,
      "effective_rank": 0.01601855270564556,
      "effective_rank_mergeability_score": 0.01914389245212078,
      "stable_rank": 0.01204177550971508,
      "spectral_gap": 0.016313623636960983,
      "singular_value_ratio": 0.01590082049369812,
      "layerwise_effective_rank": 0.015462138690054417,
      "layerwise_effective_rank_mergeability_score": 0.01270507276058197,
      "task_vector_cosine_similarity": 0.013291682116687298,
      "task_vector_l2_distance": 0.003933359403163195,
      "task_vector_dot_product": 0.0027752683963626623,
      "weight_space_angle": 0.014463613741099834,
      "task_vector_magnitude_ratio": 0.0017036937642842531,
      "singular_value_overlap": 0.003941190429031849,
      "subspace_overlap": 0.006348214577883482,
      "right_subspace_overlap": 0.0037435314152389765,
      "activation_l2_distance": 0.010547442361712456,
      "activation_cosine_similarity": 0.008980074897408485,
      "activation_magnitude_ratio": 0.0051793912425637245,
      "activation_dot_product": 0.006403650622814894,
      "encoder_gradient_cosine_similarity": 0.00287380232475698,
      "encoder_gradient_l2_distance": 0.007537545170634985,
      "encoder_gradient_dot_product": 0.0034398019779473543,
      "input_gradient_cosine_similarity": 0.003652745857834816,
      "input_gradient_l2_distance": 0.005044944118708372,
      "input_gradient_dot_product": 0.0016669004689902067
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.7,
      "right_subspace_overlap_bottom_k": 0.55,
      "interaction_matrix_overlap_top_k": 0.8,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 1.0,
      "effective_rank_mergeability_score": 1.0,
      "stable_rank": 0.85,
      "spectral_gap": 1.0,
      "singular_value_ratio": 1.0,
      "layerwise_effective_rank": 1.0,
      "layerwise_effective_rank_mergeability_score": 1.0,
      "task_vector_cosine_similarity": 1.0,
      "task_vector_l2_distance": 0.95,
      "task_vector_dot_product": 0.7,
      "weight_space_angle": 1.0,
      "task_vector_magnitude_ratio": 0.6,
      "singular_value_overlap": 0.95,
      "subspace_overlap": 0.75,
      "right_subspace_overlap": 0.7,
      "activation_l2_distance": 0.95,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.65,
      "activation_dot_product": 0.7,
      "encoder_gradient_cosine_similarity": 0.75,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.8,
      "input_gradient_cosine_similarity": 0.9,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.6
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5953173502423217,
        "val_r": 0.5902246500404309,
        "n_iterations": 288,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025200957898050547,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0031146849505603313,
          "interaction_matrix_overlap_bottom_k": 0.014079579152166843,
          "effective_rank": 0.023750564083456993,
          "effective_rank_mergeability_score": 0.06293374300003052,
          "stable_rank": 0.026264578104019165,
          "spectral_gap": 0.07303491979837418,
          "singular_value_ratio": 0.06425982713699341,
          "layerwise_effective_rank": 0.044390711933374405,
          "layerwise_effective_rank_mergeability_score": 0.026918241754174232,
          "task_vector_cosine_similarity": 0.08394726365804672,
          "task_vector_l2_distance": -0.010754233226180077,
          "task_vector_dot_product": -0.0014231788227334619,
          "weight_space_angle": 0.08886060118675232,
          "task_vector_magnitude_ratio": 0.0017722113989293575,
          "singular_value_overlap": -0.008807219564914703,
          "subspace_overlap": 0.007012350484728813,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.010000789538025856,
          "activation_cosine_similarity": 0.0133676677942276,
          "activation_magnitude_ratio": -0.003846755251288414,
          "activation_dot_product": 0.00207308866083622,
          "encoder_gradient_cosine_similarity": 0.0012380261905491352,
          "encoder_gradient_l2_distance": -0.01643987186253071,
          "encoder_gradient_dot_product": 0.0022866218350827694,
          "input_gradient_cosine_similarity": 0.0014597040135413408,
          "input_gradient_l2_distance": -0.016159458085894585,
          "input_gradient_dot_product": -0.001888248254545033
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5595292010868732,
        "val_r": 0.30381231584422275,
        "n_iterations": 314,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.008302178233861923,
          "interaction_matrix_overlap_bottom_k": 0.012615181505680084,
          "effective_rank": 0.06409730762243271,
          "effective_rank_mergeability_score": 0.08023659884929657,
          "stable_rank": 0.014275440946221352,
          "spectral_gap": 0.041157227009534836,
          "singular_value_ratio": 0.02973439171910286,
          "layerwise_effective_rank": 0.05195464938879013,
          "layerwise_effective_rank_mergeability_score": 0.046837951987981796,
          "task_vector_cosine_similarity": 0.06441450864076614,
          "task_vector_l2_distance": -0.013728474266827106,
          "task_vector_dot_product": 0.004226164426654577,
          "weight_space_angle": 0.0747983530163765,
          "task_vector_magnitude_ratio": 0.001516458811238408,
          "singular_value_overlap": -0.0069622076116502285,
          "subspace_overlap": 0.005341010168194771,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.01732459105551243,
          "activation_cosine_similarity": 0.0135668208822608,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0029151258058845997,
          "encoder_gradient_cosine_similarity": 0.0018405200680717826,
          "encoder_gradient_l2_distance": -0.0067168413661420345,
          "encoder_gradient_dot_product": 0.0025136617477983236,
          "input_gradient_cosine_similarity": 0.0024918264243751764,
          "input_gradient_l2_distance": -0.011859682388603687,
          "input_gradient_dot_product": 0.0011655203998088837
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5482454058863735,
        "val_r": 0.508976499049505,
        "n_iterations": 287,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0012522728648036718,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.011905405670404434,
          "effective_rank": 0.05875558778643608,
          "effective_rank_mergeability_score": 0.06772689521312714,
          "stable_rank": 0.01366003230214119,
          "spectral_gap": 0.04025785252451897,
          "singular_value_ratio": 0.035588547587394714,
          "layerwise_effective_rank": 0.048263490200042725,
          "layerwise_effective_rank_mergeability_score": 0.05027084797620773,
          "task_vector_cosine_similarity": 0.08179587125778198,
          "task_vector_l2_distance": -0.010750600136816502,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.08885475248098373,
          "task_vector_magnitude_ratio": 0.0011849055299535394,
          "singular_value_overlap": -0.007253941148519516,
          "subspace_overlap": 0.0060371593572199345,
          "right_subspace_overlap": 0.002746951300650835,
          "activation_l2_distance": 0.01137627474963665,
          "activation_cosine_similarity": 0.00881096813827753,
          "activation_magnitude_ratio": -0.0012455754913389683,
          "activation_dot_product": 0.0023634061217308044,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.00934805627912283,
          "encoder_gradient_dot_product": 0.0033154580742120743,
          "input_gradient_cosine_similarity": 0.0011513640638440847,
          "input_gradient_l2_distance": -0.014175215736031532,
          "input_gradient_dot_product": -0.0011658358853310347
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4656485249871559,
        "val_r": 0.3671419282442522,
        "n_iterations": 313,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003423442132771015,
          "right_subspace_overlap_bottom_k": -0.0017544038128107786,
          "interaction_matrix_overlap_top_k": 0.0031988583505153656,
          "interaction_matrix_overlap_bottom_k": 0.010976781137287617,
          "effective_rank": 0.018223799765110016,
          "effective_rank_mergeability_score": 0.024319032207131386,
          "stable_rank": 0.0072894468903541565,
          "spectral_gap": 0.1038215160369873,
          "singular_value_ratio": 0.0963028222322464,
          "layerwise_effective_rank": 0.023858584463596344,
          "layerwise_effective_rank_mergeability_score": 0.03531908243894577,
          "task_vector_cosine_similarity": 0.071907177567482,
          "task_vector_l2_distance": -0.008784297853708267,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07313016802072525,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0035012478474527597,
          "subspace_overlap": 0.010281178168952465,
          "right_subspace_overlap": 0.0018392736092209816,
          "activation_l2_distance": 0.020436178892850876,
          "activation_cosine_similarity": 0.021435951814055443,
          "activation_magnitude_ratio": -0.0014331999700516462,
          "activation_dot_product": 0.004747242201119661,
          "encoder_gradient_cosine_similarity": 0.0022222381085157394,
          "encoder_gradient_l2_distance": -0.00630585104227066,
          "encoder_gradient_dot_product": 0.0029894807375967503,
          "input_gradient_cosine_similarity": 0.0016304892487823963,
          "input_gradient_l2_distance": -0.015362540259957314,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5572576953135869,
        "val_r": 0.6089733540361635,
        "n_iterations": 366,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0034868025686591864,
          "right_subspace_overlap_bottom_k": 0.0010165320709347725,
          "interaction_matrix_overlap_top_k": 0.0016437303274869919,
          "interaction_matrix_overlap_bottom_k": 0.011513778008520603,
          "effective_rank": 0.04257991164922714,
          "effective_rank_mergeability_score": 0.047572024166584015,
          "stable_rank": 0.0,
          "spectral_gap": 0.05743873491883278,
          "singular_value_ratio": 0.051502250134944916,
          "layerwise_effective_rank": 0.04875225946307182,
          "layerwise_effective_rank_mergeability_score": 0.04843314737081528,
          "task_vector_cosine_similarity": 0.0979895144701004,
          "task_vector_l2_distance": -0.01660124585032463,
          "task_vector_dot_product": -0.0012658004416152835,
          "weight_space_angle": 0.10577890276908875,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008797204121947289,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005154358223080635,
          "activation_l2_distance": 0.004149764310568571,
          "activation_cosine_similarity": 0.006235101260244846,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.010143267922103405,
          "encoder_gradient_dot_product": 0.0045272731222212315,
          "input_gradient_cosine_similarity": 0.00348164071328938,
          "input_gradient_l2_distance": -0.01710568368434906,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5943621444469385,
        "val_r": 0.7021736140226598,
        "n_iterations": 212,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0038912291638553143,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.002407452091574669,
          "interaction_matrix_overlap_bottom_k": 0.012662841007113457,
          "effective_rank": 0.07260574400424957,
          "effective_rank_mergeability_score": 0.08778543770313263,
          "stable_rank": 0.010721871629357338,
          "spectral_gap": 0.04926512762904167,
          "singular_value_ratio": 0.04240847006440163,
          "layerwise_effective_rank": 0.061138950288295746,
          "layerwise_effective_rank_mergeability_score": 0.05805317685008049,
          "task_vector_cosine_similarity": 0.05333588272333145,
          "task_vector_l2_distance": -0.015426275320351124,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.059535857290029526,
          "task_vector_magnitude_ratio": 0.0011226278729736805,
          "singular_value_overlap": -0.012292437255382538,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0017763508949428797,
          "activation_l2_distance": 0.005087911617010832,
          "activation_cosine_similarity": 0.008577782660722733,
          "activation_magnitude_ratio": -0.0018134041456505656,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0013101112563163042,
          "encoder_gradient_l2_distance": -0.014692799188196659,
          "encoder_gradient_dot_product": 0.0023766455706208944,
          "input_gradient_cosine_similarity": 0.004481729585677385,
          "input_gradient_l2_distance": -0.016339702531695366,
          "input_gradient_dot_product": -0.002856561215594411
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.3762535848857412,
        "val_r": 0.20816356300317138,
        "n_iterations": 266,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.023057298734784126,
          "right_subspace_overlap_bottom_k": 0.009199309162795544,
          "interaction_matrix_overlap_top_k": 0.01197175495326519,
          "interaction_matrix_overlap_bottom_k": 0.021495604887604713,
          "effective_rank": 0.016743676736950874,
          "effective_rank_mergeability_score": 0.03112032078206539,
          "stable_rank": 0.0015190886333584785,
          "spectral_gap": 0.06994042545557022,
          "singular_value_ratio": 0.061471499502658844,
          "layerwise_effective_rank": 0.08805953711271286,
          "layerwise_effective_rank_mergeability_score": 0.08319194614887238,
          "task_vector_cosine_similarity": 0.07076606154441833,
          "task_vector_l2_distance": -0.007320062257349491,
          "task_vector_dot_product": -0.004392554517835379,
          "weight_space_angle": 0.06071916222572327,
          "task_vector_magnitude_ratio": -0.0015217752661556005,
          "singular_value_overlap": 0.005475309677422047,
          "subspace_overlap": 0.019568707793951035,
          "right_subspace_overlap": 0.015744155272841454,
          "activation_l2_distance": -0.009426357224583626,
          "activation_cosine_similarity": 0.03216629847884178,
          "activation_magnitude_ratio": 0.022027086466550827,
          "activation_dot_product": 0.027284974232316017,
          "encoder_gradient_cosine_similarity": 0.012258246541023254,
          "encoder_gradient_l2_distance": -0.03166789188981056,
          "encoder_gradient_dot_product": 0.014581955038011074,
          "input_gradient_cosine_similarity": 0.008427455089986324,
          "input_gradient_l2_distance": -0.029125196859240532,
          "input_gradient_dot_product": 0.0037570102140307426
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4733913148563366,
        "val_r": 0.25965243030263896,
        "n_iterations": 422,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0017074712086468935,
          "interaction_matrix_overlap_bottom_k": 0.01626325026154518,
          "effective_rank": 0.04960604012012482,
          "effective_rank_mergeability_score": 0.0404144786298275,
          "stable_rank": 0.006224446929991245,
          "spectral_gap": 0.057192426174879074,
          "singular_value_ratio": 0.04844551905989647,
          "layerwise_effective_rank": 0.02756277285516262,
          "layerwise_effective_rank_mergeability_score": 0.049579668790102005,
          "task_vector_cosine_similarity": 0.05588468536734581,
          "task_vector_l2_distance": -0.01814335770905018,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07539273053407669,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008148193359375,
          "subspace_overlap": 0.015404489822685719,
          "right_subspace_overlap": 0.0028633661568164825,
          "activation_l2_distance": 0.03475545719265938,
          "activation_cosine_similarity": 0.03194809705018997,
          "activation_magnitude_ratio": -0.0016152637545019388,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.001960702706128359,
          "encoder_gradient_l2_distance": -0.0042483750730752945,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0038469666615128517,
          "input_gradient_l2_distance": -0.008417172357439995,
          "input_gradient_dot_product": 0.0015725066186860204
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5951400489285127,
        "val_r": 0.06873783397159827,
        "n_iterations": 291,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0014061240945011377,
          "interaction_matrix_overlap_bottom_k": 0.009767260402441025,
          "effective_rank": 0.04593757912516594,
          "effective_rank_mergeability_score": 0.10321585088968277,
          "stable_rank": 0.052888840436935425,
          "spectral_gap": 0.035920582711696625,
          "singular_value_ratio": 0.026761014014482498,
          "layerwise_effective_rank": 0.0459723174571991,
          "layerwise_effective_rank_mergeability_score": 0.041414760053157806,
          "task_vector_cosine_similarity": 0.06513571739196777,
          "task_vector_l2_distance": -0.011411188170313835,
          "task_vector_dot_product": 0.0010063194204121828,
          "weight_space_angle": 0.06882977485656738,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.005895076785236597,
          "subspace_overlap": 0.005305061116814613,
          "right_subspace_overlap": 0.0019032573327422142,
          "activation_l2_distance": 0.011803077533841133,
          "activation_cosine_similarity": 0.011182252317667007,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0018587163649499416,
          "encoder_gradient_cosine_similarity": 0.003757872385904193,
          "encoder_gradient_l2_distance": -0.006048898212611675,
          "encoder_gradient_dot_product": 0.0015126249054446816,
          "input_gradient_cosine_similarity": 0.0015179693000391126,
          "input_gradient_l2_distance": -0.014685166999697685,
          "input_gradient_dot_product": -0.0031341444700956345
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5391783094060172,
        "val_r": 0.3621208786054817,
        "n_iterations": 389,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.002332288771867752,
          "interaction_matrix_overlap_top_k": 0.001969018252566457,
          "interaction_matrix_overlap_bottom_k": 0.010464994236826897,
          "effective_rank": 0.05103972554206848,
          "effective_rank_mergeability_score": 0.05946480855345726,
          "stable_rank": 0.005799146834760904,
          "spectral_gap": 0.058488864451646805,
          "singular_value_ratio": 0.053060274571180344,
          "layerwise_effective_rank": 0.050077639520168304,
          "layerwise_effective_rank_mergeability_score": 0.05542491376399994,
          "task_vector_cosine_similarity": 0.07789506018161774,
          "task_vector_l2_distance": -0.011362254619598389,
          "task_vector_dot_product": 0.003313465276733041,
          "weight_space_angle": 0.08765677362680435,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.007636265829205513,
          "subspace_overlap": 0.00901875365525484,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.003397783963009715,
          "activation_cosine_similarity": 0.00203372398391366,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.002315649762749672,
          "encoder_gradient_l2_distance": -0.011320971883833408,
          "encoder_gradient_dot_product": 0.006293409038335085,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.020040806382894516,
          "input_gradient_dot_product": -0.001148010604083538
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.49474456622730234,
        "val_r": 0.23264478231888555,
        "n_iterations": 267,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012359149754047394,
          "right_subspace_overlap_bottom_k": 0.0035777471493929625,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.009432168677449226,
          "effective_rank": 0.02883460931479931,
          "effective_rank_mergeability_score": 0.0699603259563446,
          "stable_rank": 0.009427221491932869,
          "spectral_gap": 0.048409923911094666,
          "singular_value_ratio": 0.03949495777487755,
          "layerwise_effective_rank": 0.06885069608688354,
          "layerwise_effective_rank_mergeability_score": 0.0501558855175972,
          "task_vector_cosine_similarity": 0.08359401673078537,
          "task_vector_l2_distance": -0.011444084346294403,
          "task_vector_dot_product": -0.002410072600468993,
          "weight_space_angle": 0.08678970485925674,
          "task_vector_magnitude_ratio": -0.0015386707382276654,
          "singular_value_overlap": -0.005451160483062267,
          "subspace_overlap": -0.0028661552350968122,
          "right_subspace_overlap": 0.006609418895095587,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.010923185385763645,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.014850890263915062,
          "encoder_gradient_cosine_similarity": 0.004150649532675743,
          "encoder_gradient_l2_distance": -0.024071570485830307,
          "encoder_gradient_dot_product": 0.004512233193963766,
          "input_gradient_cosine_similarity": 0.011920955032110214,
          "input_gradient_l2_distance": -0.02000797726213932,
          "input_gradient_dot_product": 0.001875182380899787
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.48163591430375274,
        "val_r": 0.4817718775473831,
        "n_iterations": 249,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004795607645064592,
          "right_subspace_overlap_bottom_k": 0.0010541209485381842,
          "interaction_matrix_overlap_top_k": 0.0027049672789871693,
          "interaction_matrix_overlap_bottom_k": 0.011322448961436749,
          "effective_rank": 0.022646130993962288,
          "effective_rank_mergeability_score": 0.06309898942708969,
          "stable_rank": 0.005814664997160435,
          "spectral_gap": 0.02992580458521843,
          "singular_value_ratio": 0.02586306631565094,
          "layerwise_effective_rank": 0.07904162257909775,
          "layerwise_effective_rank_mergeability_score": 0.03698321804404259,
          "task_vector_cosine_similarity": 0.0713673010468483,
          "task_vector_l2_distance": -0.008773203939199448,
          "task_vector_dot_product": 0.005020296201109886,
          "weight_space_angle": 0.08869940042495728,
          "task_vector_magnitude_ratio": 0.001897204201668501,
          "singular_value_overlap": -0.002339700935408473,
          "subspace_overlap": 0.019142193719744682,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.03346095606684685,
          "activation_cosine_similarity": 0.029999008402228355,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.002473745495080948,
          "encoder_gradient_cosine_similarity": 0.005201899446547031,
          "encoder_gradient_l2_distance": -0.0037606460973620415,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.00439492566511035,
          "input_gradient_l2_distance": -0.01313411258161068,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5107076584417007,
        "val_r": 0.4051411765810078,
        "n_iterations": 300,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004225574433803558,
          "right_subspace_overlap_bottom_k": 0.002637506928294897,
          "interaction_matrix_overlap_top_k": -0.0018920637667179108,
          "interaction_matrix_overlap_bottom_k": 0.015560237690806389,
          "effective_rank": 0.038339294493198395,
          "effective_rank_mergeability_score": 0.0463755801320076,
          "stable_rank": 0.0180559940636158,
          "spectral_gap": 0.06029229983687401,
          "singular_value_ratio": 0.050328582525253296,
          "layerwise_effective_rank": 0.049639031291007996,
          "layerwise_effective_rank_mergeability_score": 0.05715835094451904,
          "task_vector_cosine_similarity": 0.06956499814987183,
          "task_vector_l2_distance": -0.008387049660086632,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.06425853818655014,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008996846154332161,
          "subspace_overlap": 0.0014656217535957694,
          "right_subspace_overlap": 0.003159106243401766,
          "activation_l2_distance": 0.016356272622942924,
          "activation_cosine_similarity": 0.020247334614396095,
          "activation_magnitude_ratio": 0.002972410060465336,
          "activation_dot_product": 0.004314871039241552,
          "encoder_gradient_cosine_similarity": 0.006128590553998947,
          "encoder_gradient_l2_distance": -0.008797467686235905,
          "encoder_gradient_dot_product": 0.006410045083612204,
          "input_gradient_cosine_similarity": 0.01338145136833191,
          "input_gradient_l2_distance": -0.020828159525990486,
          "input_gradient_dot_product": -0.0027386839501559734
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5379005504275836,
        "val_r": 0.7159643017748891,
        "n_iterations": 263,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002267963718622923,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.0010001698974519968,
          "interaction_matrix_overlap_bottom_k": 0.010124221444129944,
          "effective_rank": 0.031685926020145416,
          "effective_rank_mergeability_score": 0.04161287099123001,
          "stable_rank": 0.005676928907632828,
          "spectral_gap": 0.04130346700549126,
          "singular_value_ratio": 0.03316676244139671,
          "layerwise_effective_rank": 0.04739068076014519,
          "layerwise_effective_rank_mergeability_score": 0.04887177422642708,
          "task_vector_cosine_similarity": 0.10292956233024597,
          "task_vector_l2_distance": -0.013230417855083942,
          "task_vector_dot_product": 0.006877101957798004,
          "weight_space_angle": 0.10806353390216827,
          "task_vector_magnitude_ratio": 0.0027188491076231003,
          "singular_value_overlap": -0.0031320550478994846,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.008415509015321732,
          "activation_cosine_similarity": 0.009725858457386494,
          "activation_magnitude_ratio": -0.0010418584570288658,
          "activation_dot_product": 0.005744616501033306,
          "encoder_gradient_cosine_similarity": 0.0020307262893766165,
          "encoder_gradient_l2_distance": -0.02318716235458851,
          "encoder_gradient_dot_product": 0.002912752563133836,
          "input_gradient_cosine_similarity": 0.001008749008178711,
          "input_gradient_l2_distance": -0.01246526837348938,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5004625504737237,
        "val_r": 0.595000676024466,
        "n_iterations": 320,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0019040607148781419,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.006505146156996489,
          "effective_rank": 0.04399656876921654,
          "effective_rank_mergeability_score": 0.06277819722890854,
          "stable_rank": 0.011843523010611534,
          "spectral_gap": 0.057438924908638,
          "singular_value_ratio": 0.05020638182759285,
          "layerwise_effective_rank": 0.043848950415849686,
          "layerwise_effective_rank_mergeability_score": 0.04199323058128357,
          "task_vector_cosine_similarity": 0.08282611519098282,
          "task_vector_l2_distance": -0.011097636073827744,
          "task_vector_dot_product": -0.0021572308614850044,
          "weight_space_angle": 0.09198613464832306,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008131870999932289,
          "subspace_overlap": 0.011664694175124168,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.004310870077461004,
          "activation_cosine_similarity": 0.009321966208517551,
          "activation_magnitude_ratio": -0.0022498895414173603,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011800090782344341,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0015626766253262758,
          "input_gradient_l2_distance": -0.014397269114851952,
          "input_gradient_dot_product": 0.0014506920706480742
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5849326236384357,
        "val_r": 0.42198002079176217,
        "n_iterations": 540,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.0012847259640693665,
          "interaction_matrix_overlap_bottom_k": 0.008210113272070885,
          "effective_rank": 0.038258396089076996,
          "effective_rank_mergeability_score": 0.05378538370132446,
          "stable_rank": 0.0,
          "spectral_gap": 0.04742105305194855,
          "singular_value_ratio": 0.043301042169332504,
          "layerwise_effective_rank": 0.05592276155948639,
          "layerwise_effective_rank_mergeability_score": 0.042762402445077896,
          "task_vector_cosine_similarity": 0.09313283860683441,
          "task_vector_l2_distance": -0.01409248448908329,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.09460863471031189,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0018401487031951547,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.003500357735902071,
          "activation_l2_distance": 0.025875484570860863,
          "activation_cosine_similarity": 0.02006836235523224,
          "activation_magnitude_ratio": -0.0011770774144679308,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.00943892914801836,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002288061659783125,
          "input_gradient_l2_distance": -0.011975888162851334,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5531434612041648,
        "val_r": 0.3161397253123455,
        "n_iterations": 477,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003870007349178195,
          "right_subspace_overlap_bottom_k": 0.004291201941668987,
          "interaction_matrix_overlap_top_k": 0.009897515177726746,
          "interaction_matrix_overlap_bottom_k": 0.0032850615680217743,
          "effective_rank": 0.03218454495072365,
          "effective_rank_mergeability_score": 0.04168960452079773,
          "stable_rank": 0.0014779854100197554,
          "spectral_gap": 0.06517692655324936,
          "singular_value_ratio": 0.060335155576467514,
          "layerwise_effective_rank": 0.04238898679614067,
          "layerwise_effective_rank_mergeability_score": 0.03759961202740669,
          "task_vector_cosine_similarity": 0.07645107805728912,
          "task_vector_l2_distance": -0.016583256423473358,
          "task_vector_dot_product": 0.005405594129115343,
          "weight_space_angle": 0.09934279322624207,
          "task_vector_magnitude_ratio": 0.006176697090268135,
          "singular_value_overlap": -0.0071053518913686275,
          "subspace_overlap": 0.007635423913598061,
          "right_subspace_overlap": 0.001884256023913622,
          "activation_l2_distance": 0.0068037621676921844,
          "activation_cosine_similarity": 0.0034737770911306143,
          "activation_magnitude_ratio": -0.0028906487859785557,
          "activation_dot_product": 0.0043131099082529545,
          "encoder_gradient_cosine_similarity": 0.005378323141485453,
          "encoder_gradient_l2_distance": 0.0018021846190094948,
          "encoder_gradient_dot_product": 0.009454645216464996,
          "input_gradient_cosine_similarity": 0.0021895496174693108,
          "input_gradient_l2_distance": -0.023007921874523163,
          "input_gradient_dot_product": -0.001074159168638289
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5598091344211292,
        "val_r": 0.2915949487866153,
        "n_iterations": 307,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0024166011717170477,
          "right_subspace_overlap_bottom_k": 0.0019366401247680187,
          "interaction_matrix_overlap_top_k": 0.0027126893401145935,
          "interaction_matrix_overlap_bottom_k": 0.016618739813566208,
          "effective_rank": 0.07117004692554474,
          "effective_rank_mergeability_score": 0.06455940753221512,
          "stable_rank": 0.020128922536969185,
          "spectral_gap": 0.043918658047914505,
          "singular_value_ratio": 0.03807384520769119,
          "layerwise_effective_rank": 0.03678339347243309,
          "layerwise_effective_rank_mergeability_score": 0.06786994636058807,
          "task_vector_cosine_similarity": 0.054286081343889236,
          "task_vector_l2_distance": -0.009804465807974339,
          "task_vector_dot_product": 0.0012132280971854925,
          "weight_space_angle": 0.0660819485783577,
          "task_vector_magnitude_ratio": 0.001526745967566967,
          "singular_value_overlap": -0.0015566409565508366,
          "subspace_overlap": 0.01013001799583435,
          "right_subspace_overlap": 0.0023801352363079786,
          "activation_l2_distance": 0.015345611609518528,
          "activation_cosine_similarity": 0.014648068696260452,
          "activation_magnitude_ratio": -0.0013175247004255652,
          "activation_dot_product": 0.007218101993203163,
          "encoder_gradient_cosine_similarity": 0.003258275566622615,
          "encoder_gradient_l2_distance": -0.013062011450529099,
          "encoder_gradient_dot_product": 0.002944465959444642,
          "input_gradient_cosine_similarity": 0.007815287448465824,
          "input_gradient_l2_distance": -0.0262135062366724,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7850113242421635,
        "val_r": 0.6063160330496264,
        "n_iterations": 352,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010329579003155231,
          "right_subspace_overlap_bottom_k": -0.005699553526937962,
          "interaction_matrix_overlap_top_k": 0.0020589998457580805,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.051199689507484436,
          "effective_rank_mergeability_score": 0.03961385786533356,
          "stable_rank": 0.0010544307297095656,
          "spectral_gap": 0.040577489882707596,
          "singular_value_ratio": 0.04190541431307793,
          "layerwise_effective_rank": 0.037866298109292984,
          "layerwise_effective_rank_mergeability_score": 0.05956173688173294,
          "task_vector_cosine_similarity": 0.08458662033081055,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0016937959007918835,
          "weight_space_angle": 0.10058653354644775,
          "task_vector_magnitude_ratio": 0.003351234830915928,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0038946918211877346,
          "right_subspace_overlap": 0.007433086633682251,
          "activation_l2_distance": 0.014256340451538563,
          "activation_cosine_similarity": 0.016378581523895264,
          "activation_magnitude_ratio": -0.0013516999315470457,
          "activation_dot_product": 0.006108683068305254,
          "encoder_gradient_cosine_similarity": 0.004454353358596563,
          "encoder_gradient_l2_distance": -0.011696399189531803,
          "encoder_gradient_dot_product": 0.0021869074553251266,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.012609098106622696,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.61811137177849,
        "val_r": 0.35137559386556255,
        "n_iterations": 456,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.001286168466322124,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.012040154077112675,
          "effective_rank": 0.03788142278790474,
          "effective_rank_mergeability_score": 0.04082424193620682,
          "stable_rank": 0.0,
          "spectral_gap": 0.06848742067813873,
          "singular_value_ratio": 0.06101091951131821,
          "layerwise_effective_rank": 0.06809207051992416,
          "layerwise_effective_rank_mergeability_score": 0.06721214205026627,
          "task_vector_cosine_similarity": 0.07787375897169113,
          "task_vector_l2_distance": -0.013742499984800816,
          "task_vector_dot_product": 0.0012969211675226688,
          "weight_space_angle": 0.08172136545181274,
          "task_vector_magnitude_ratio": 0.001028873142786324,
          "singular_value_overlap": -0.0076887174509465694,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0016468387329950929,
          "activation_l2_distance": 0.0065783304162323475,
          "activation_cosine_similarity": 0.0021388756576925516,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.010752868838608265,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008225261233747005,
          "encoder_gradient_dot_product": 0.00463744206354022,
          "input_gradient_cosine_similarity": 0.003791617229580879,
          "input_gradient_l2_distance": -0.014353667385876179,
          "input_gradient_dot_product": 0.0
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_r": 0.636008860567922,
      "train_p": 0.0,
      "val_r": 0.5470177078810532,
      "val_p": 2.4987981320384807e-29
    },
    "per_fold_stats": {
      "train_r_mean": 0.7603918462942831,
      "train_r_std": 0.019579279887000322,
      "val_r_mean": 0.6028658615960845,
      "val_r_std": 0.18465412726026958,
      "n_nonzero_mean": 23.95,
      "n_nonzero_std": 2.178875856950093
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.009797555394470692,
      "right_subspace_overlap_bottom_k": -0.0132050272077322,
      "interaction_matrix_overlap_top_k": 0.0029477975331246853,
      "interaction_matrix_overlap_bottom_k": 0.0003103134222328663,
      "effective_rank": 0.05435997247695923,
      "effective_rank_mergeability_score": 0.03510959818959236,
      "stable_rank": 0.0026604225859045982,
      "spectral_gap": 0.040813885629177094,
      "singular_value_ratio": 0.038240864872932434,
      "layerwise_effective_rank": 0.038767118006944656,
      "layerwise_effective_rank_mergeability_score": 0.06595613062381744,
      "task_vector_cosine_similarity": 0.07314308732748032,
      "task_vector_l2_distance": -0.0007742965826764703,
      "task_vector_dot_product": 0.0013161993119865656,
      "weight_space_angle": 0.09051511436700821,
      "task_vector_magnitude_ratio": 0.003563620848581195,
      "singular_value_overlap": 0.004900320433080196,
      "subspace_overlap": 0.0024844533763825893,
      "right_subspace_overlap": 0.007836291566491127,
      "activation_l2_distance": 0.019489126279950142,
      "activation_cosine_similarity": 0.02716594934463501,
      "activation_magnitude_ratio": -2.151332955691032e-05,
      "activation_dot_product": 0.0024511869996786118,
      "encoder_gradient_cosine_similarity": 0.0035849474370479584,
      "encoder_gradient_l2_distance": -0.012591141276061535,
      "encoder_gradient_dot_product": 0.0023450329899787903,
      "input_gradient_cosine_similarity": 0.0026455430779606104,
      "input_gradient_l2_distance": -0.009899117052555084,
      "input_gradient_dot_product": -0.0005513665964826941
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.004132028203457594,
      "right_subspace_overlap_bottom_k": 0.0032481735106557608,
      "interaction_matrix_overlap_top_k": 0.002315203659236431,
      "interaction_matrix_overlap_bottom_k": 0.0011211164528504014,
      "effective_rank": 0.013905918225646019,
      "effective_rank_mergeability_score": 0.013895738869905472,
      "stable_rank": 0.005912187043577433,
      "spectral_gap": 0.014267207123339176,
      "singular_value_ratio": 0.014404688030481339,
      "layerwise_effective_rank": 0.011149565689265728,
      "layerwise_effective_rank_mergeability_score": 0.015470439568161964,
      "task_vector_cosine_similarity": 0.013256005942821503,
      "task_vector_l2_distance": 0.0018063061870634556,
      "task_vector_dot_product": 0.0019117887131869793,
      "weight_space_angle": 0.012224286794662476,
      "task_vector_magnitude_ratio": 0.003570543136447668,
      "singular_value_overlap": 0.0031920697074383497,
      "subspace_overlap": 0.0027462877333164215,
      "right_subspace_overlap": 0.0035147862508893013,
      "activation_l2_distance": 0.006328114308416843,
      "activation_cosine_similarity": 0.007913737557828426,
      "activation_magnitude_ratio": 0.0006367500172927976,
      "activation_dot_product": 0.0039245146326720715,
      "encoder_gradient_cosine_similarity": 0.0014898671070113778,
      "encoder_gradient_l2_distance": 0.003537653014063835,
      "encoder_gradient_dot_product": 0.002044718014076352,
      "input_gradient_cosine_similarity": 0.0020377766340970993,
      "input_gradient_l2_distance": 0.0044233533553779125,
      "input_gradient_dot_product": 0.0012834820663556457
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.95,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.75,
      "interaction_matrix_overlap_bottom_k": 0.5,
      "effective_rank": 1.0,
      "effective_rank_mergeability_score": 1.0,
      "stable_rank": 0.7,
      "spectral_gap": 1.0,
      "singular_value_ratio": 1.0,
      "layerwise_effective_rank": 1.0,
      "layerwise_effective_rank_mergeability_score": 1.0,
      "task_vector_cosine_similarity": 1.0,
      "task_vector_l2_distance": 0.35,
      "task_vector_dot_product": 0.5,
      "weight_space_angle": 1.0,
      "task_vector_magnitude_ratio": 0.85,
      "singular_value_overlap": 0.95,
      "subspace_overlap": 0.65,
      "right_subspace_overlap": 0.95,
      "activation_l2_distance": 1.0,
      "activation_cosine_similarity": 0.95,
      "activation_magnitude_ratio": 0.25,
      "activation_dot_product": 0.65,
      "encoder_gradient_cosine_similarity": 1.0,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.75,
      "input_gradient_cosine_similarity": 0.75,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.45
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7602331798041058,
        "val_r": 0.6510539049952611,
        "n_iterations": 523,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008445714600384235,
          "right_subspace_overlap_bottom_k": -0.011657841503620148,
          "interaction_matrix_overlap_top_k": 0.0029467083513736725,
          "interaction_matrix_overlap_bottom_k": 0.0013273607473820448,
          "effective_rank": 0.07485952973365784,
          "effective_rank_mergeability_score": 0.06353633850812912,
          "stable_rank": 0.0027368480805307627,
          "spectral_gap": 0.05328845977783203,
          "singular_value_ratio": 0.05123745650053024,
          "layerwise_effective_rank": 0.01572132110595703,
          "layerwise_effective_rank_mergeability_score": 0.031884338706731796,
          "task_vector_cosine_similarity": 0.06711762398481369,
          "task_vector_l2_distance": -0.0016059931367635727,
          "task_vector_dot_product": 0.0017015370540320873,
          "weight_space_angle": 0.08634822815656662,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0029228224884718657,
          "subspace_overlap": 0.0034175643231719732,
          "right_subspace_overlap": 0.006265781819820404,
          "activation_l2_distance": 0.021642444655299187,
          "activation_cosine_similarity": 0.030540233477950096,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.003029260551556945,
          "encoder_gradient_cosine_similarity": 0.003368286183103919,
          "encoder_gradient_l2_distance": -0.01123195979744196,
          "encoder_gradient_dot_product": 0.001770024886354804,
          "input_gradient_cosine_similarity": 0.003527234308421612,
          "input_gradient_l2_distance": -0.006709341891109943,
          "input_gradient_dot_product": -0.0028918557800352573
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7176167085603844,
        "val_r": 0.41177178957196153,
        "n_iterations": 343,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004669573158025742,
          "right_subspace_overlap_bottom_k": -0.01099216565489769,
          "interaction_matrix_overlap_top_k": 0.004512439481914043,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.05276953801512718,
          "effective_rank_mergeability_score": 0.02957974746823311,
          "stable_rank": 0.0020070949103683233,
          "spectral_gap": 0.027874086052179337,
          "singular_value_ratio": 0.02671845071017742,
          "layerwise_effective_rank": 0.04104198142886162,
          "layerwise_effective_rank_mergeability_score": 0.06661196053028107,
          "task_vector_cosine_similarity": 0.08815452456474304,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.00182082480750978,
          "weight_space_angle": 0.10480973869562149,
          "task_vector_magnitude_ratio": 0.0022487209644168615,
          "singular_value_overlap": 0.0050592366605997086,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.009742332622408867,
          "activation_l2_distance": 0.025159010663628578,
          "activation_cosine_similarity": 0.028295285999774933,
          "activation_magnitude_ratio": -0.0010510036954656243,
          "activation_dot_product": 0.0019169820006936789,
          "encoder_gradient_cosine_similarity": 0.002828196156769991,
          "encoder_gradient_l2_distance": -0.013365596532821655,
          "encoder_gradient_dot_product": 0.007661711424589157,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010095737874507904,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7880162645958032,
        "val_r": 0.7843400544464499,
        "n_iterations": 501,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010806366801261902,
          "right_subspace_overlap_bottom_k": -0.010189277119934559,
          "interaction_matrix_overlap_top_k": 0.0014522207202389836,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.050217628479003906,
          "effective_rank_mergeability_score": 0.02394859492778778,
          "stable_rank": 0.0011691163526847959,
          "spectral_gap": 0.04896235093474388,
          "singular_value_ratio": 0.04874503239989281,
          "layerwise_effective_rank": 0.050663094967603683,
          "layerwise_effective_rank_mergeability_score": 0.08308206498622894,
          "task_vector_cosine_similarity": 0.0639258325099945,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.08094679564237595,
          "task_vector_magnitude_ratio": 0.002564789727330208,
          "singular_value_overlap": 0.001143230707384646,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.010127956047654152,
          "activation_l2_distance": 0.017061220481991768,
          "activation_cosine_similarity": 0.023953117430210114,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0014457179931923747,
          "encoder_gradient_l2_distance": -0.012768558226525784,
          "encoder_gradient_dot_product": 0.003079058602452278,
          "input_gradient_cosine_similarity": 0.002100772690027952,
          "input_gradient_l2_distance": -0.010221216827630997,
          "input_gradient_dot_product": -0.00204808684065938
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7308945973824823,
        "val_r": 0.717824996492944,
        "n_iterations": 537,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01427371520549059,
          "right_subspace_overlap_bottom_k": -0.011593079194426537,
          "interaction_matrix_overlap_top_k": 0.002092500915750861,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.03450019657611847,
          "effective_rank_mergeability_score": 0.015147550962865353,
          "stable_rank": 0.0,
          "spectral_gap": 0.061613913625478745,
          "singular_value_ratio": 0.06101638078689575,
          "layerwise_effective_rank": 0.05300329253077507,
          "layerwise_effective_rank_mergeability_score": 0.07978519797325134,
          "task_vector_cosine_similarity": 0.06182216480374336,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07762698084115982,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0016471717972308397,
          "subspace_overlap": 0.0018850343767553568,
          "right_subspace_overlap": 0.0032013989984989166,
          "activation_l2_distance": 0.019633445888757706,
          "activation_cosine_similarity": 0.026796258985996246,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0013788886135444045,
          "encoder_gradient_cosine_similarity": 0.0025795770343393087,
          "encoder_gradient_l2_distance": -0.009534932672977448,
          "encoder_gradient_dot_product": 0.0014999577542766929,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0063939462415874004,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7542514380757174,
        "val_r": 0.6816973872052975,
        "n_iterations": 456,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007547907996922731,
          "right_subspace_overlap_bottom_k": -0.011715313419699669,
          "interaction_matrix_overlap_top_k": 0.002972938120365143,
          "interaction_matrix_overlap_bottom_k": 0.0015358394011855125,
          "effective_rank": 0.04620683193206787,
          "effective_rank_mergeability_score": 0.023261424154043198,
          "stable_rank": 0.0020054399501532316,
          "spectral_gap": 0.03964792937040329,
          "singular_value_ratio": 0.03640588000416756,
          "layerwise_effective_rank": 0.0451372005045414,
          "layerwise_effective_rank_mergeability_score": 0.06830679625272751,
          "task_vector_cosine_similarity": 0.08609943836927414,
          "task_vector_l2_distance": -0.0016628848388791084,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.10176257789134979,
          "task_vector_magnitude_ratio": 0.001983778551220894,
          "singular_value_overlap": 0.003393472172319889,
          "subspace_overlap": 0.0028154542669653893,
          "right_subspace_overlap": 0.010908430442214012,
          "activation_l2_distance": 0.017116308212280273,
          "activation_cosine_similarity": 0.02477278560400009,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.00302702933549881,
          "encoder_gradient_l2_distance": -0.012803186662495136,
          "encoder_gradient_dot_product": 0.0049484046176075935,
          "input_gradient_cosine_similarity": 0.0024083571042865515,
          "input_gradient_l2_distance": -0.010994812473654747,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7768527625112625,
        "val_r": 0.7182396860478898,
        "n_iterations": 385,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.015918772667646408,
          "right_subspace_overlap_bottom_k": -0.014724748209118843,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0011686945799738169,
          "effective_rank": 0.05053598806262016,
          "effective_rank_mergeability_score": 0.02877831645309925,
          "stable_rank": 0.0018399882828816772,
          "spectral_gap": 0.03171686455607414,
          "singular_value_ratio": 0.030749991536140442,
          "layerwise_effective_rank": 0.057869888842105865,
          "layerwise_effective_rank_mergeability_score": 0.08553779870271683,
          "task_vector_cosine_similarity": 0.07362072169780731,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.004612022079527378,
          "weight_space_angle": 0.0951140895485878,
          "task_vector_magnitude_ratio": 0.0017794822342693806,
          "singular_value_overlap": 0.003051162464544177,
          "subspace_overlap": 0.0018479579593986273,
          "right_subspace_overlap": 0.005559207871556282,
          "activation_l2_distance": 0.014529400505125523,
          "activation_cosine_similarity": 0.025716286152601242,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0056084864772856236,
          "encoder_gradient_l2_distance": -0.017393313348293304,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0017913318006321788,
          "input_gradient_l2_distance": -0.0026296330615878105,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7450440524931728,
        "val_r": 0.6375791075446408,
        "n_iterations": 544,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009240454994142056,
          "right_subspace_overlap_bottom_k": -0.01750115491449833,
          "interaction_matrix_overlap_top_k": 0.004205784760415554,
          "interaction_matrix_overlap_bottom_k": 0.0018196039600297809,
          "effective_rank": 0.043952323496341705,
          "effective_rank_mergeability_score": 0.017774850130081177,
          "stable_rank": 0.0016658131498843431,
          "spectral_gap": 0.04199517145752907,
          "singular_value_ratio": 0.04218101501464844,
          "layerwise_effective_rank": 0.04131656140089035,
          "layerwise_effective_rank_mergeability_score": 0.0722721740603447,
          "task_vector_cosine_similarity": 0.0936817154288292,
          "task_vector_l2_distance": 0.0024831797927618027,
          "task_vector_dot_product": 0.0016784629551693797,
          "weight_space_angle": 0.0999901220202446,
          "task_vector_magnitude_ratio": 0.001234646188095212,
          "singular_value_overlap": 0.004972153343260288,
          "subspace_overlap": 0.0017155504319816828,
          "right_subspace_overlap": 0.005970028229057789,
          "activation_l2_distance": 0.018871041014790535,
          "activation_cosine_similarity": 0.03291245549917221,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0041092014871537685,
          "encoder_gradient_l2_distance": -0.013008715584874153,
          "encoder_gradient_dot_product": 0.001793603296391666,
          "input_gradient_cosine_similarity": 0.001990805845707655,
          "input_gradient_l2_distance": -0.007849989458918571,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7483677923629198,
        "val_r": 0.5284533106735473,
        "n_iterations": 300,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012204858474433422,
          "right_subspace_overlap_bottom_k": -0.01629316806793213,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.001702398993074894,
          "effective_rank": 0.07184580713510513,
          "effective_rank_mergeability_score": 0.0458490364253521,
          "stable_rank": 0.0010523421224206686,
          "spectral_gap": 0.04726209118962288,
          "singular_value_ratio": 0.04656081646680832,
          "layerwise_effective_rank": 0.03552635759115219,
          "layerwise_effective_rank_mergeability_score": 0.06738368421792984,
          "task_vector_cosine_similarity": 0.04849442094564438,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.003226952161639929,
          "weight_space_angle": 0.06847326457500458,
          "task_vector_magnitude_ratio": 0.004120031371712685,
          "singular_value_overlap": 0.006038963329046965,
          "subspace_overlap": 0.003647236153483391,
          "right_subspace_overlap": 0.00689297029748559,
          "activation_l2_distance": 0.015720492228865623,
          "activation_cosine_similarity": 0.025808341801166534,
          "activation_magnitude_ratio": -0.0010020805057138205,
          "activation_dot_product": 0.002048204652965069,
          "encoder_gradient_cosine_similarity": 0.00337672489695251,
          "encoder_gradient_l2_distance": -0.007687402423471212,
          "encoder_gradient_dot_product": 0.004930244758725166,
          "input_gradient_cosine_similarity": 0.004970982670783997,
          "input_gradient_l2_distance": -0.00799369066953659,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.781148710643519,
        "val_r": 0.020921508523550236,
        "n_iterations": 238,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01875588297843933,
          "right_subspace_overlap_bottom_k": -0.01857205480337143,
          "interaction_matrix_overlap_top_k": 0.0060261269100010395,
          "interaction_matrix_overlap_bottom_k": 0.002129815286025405,
          "effective_rank": 0.030437249690294266,
          "effective_rank_mergeability_score": 0.04226686805486679,
          "stable_rank": 0.028010854497551918,
          "spectral_gap": 0.03271938115358353,
          "singular_value_ratio": 0.029988471418619156,
          "layerwise_effective_rank": 0.03759116679430008,
          "layerwise_effective_rank_mergeability_score": 0.06672268360853195,
          "task_vector_cosine_similarity": 0.06423065066337585,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.08351156115531921,
          "task_vector_magnitude_ratio": 0.0064734951592981815,
          "singular_value_overlap": 0.004665628541260958,
          "subspace_overlap": 0.0010492530418559909,
          "right_subspace_overlap": 0.008152930065989494,
          "activation_l2_distance": 0.026264404878020287,
          "activation_cosine_similarity": 0.03209364414215088,
          "activation_magnitude_ratio": 0.0014579070266336203,
          "activation_dot_product": 0.0015622942009940743,
          "encoder_gradient_cosine_similarity": 0.007643657736480236,
          "encoder_gradient_l2_distance": -0.005689941346645355,
          "encoder_gradient_dot_product": 0.00439385324716568,
          "input_gradient_cosine_similarity": 0.0017851796001195908,
          "input_gradient_l2_distance": -0.010177492164075375,
          "input_gradient_dot_product": -0.003280606120824814
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7546796740047407,
        "val_r": 0.45917723731961163,
        "n_iterations": 434,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01425003819167614,
          "right_subspace_overlap_bottom_k": -0.015362954698503017,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.08198992162942886,
          "effective_rank_mergeability_score": 0.061709463596343994,
          "stable_rank": 0.0,
          "spectral_gap": 0.04505809023976326,
          "singular_value_ratio": 0.0459529347717762,
          "layerwise_effective_rank": 0.03322852402925491,
          "layerwise_effective_rank_mergeability_score": 0.06126109138131142,
          "task_vector_cosine_similarity": 0.0701519101858139,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.001033987384289503,
          "weight_space_angle": 0.0885695293545723,
          "task_vector_magnitude_ratio": 0.002652094466611743,
          "singular_value_overlap": 0.001201228005811572,
          "subspace_overlap": 0.0070610661059618,
          "right_subspace_overlap": 0.006154593545943499,
          "activation_l2_distance": 0.003571803215891123,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.002797609195113182,
          "encoder_gradient_l2_distance": -0.009565269574522972,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008328192867338657,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7774505769074354,
        "val_r": 0.262260509731293,
        "n_iterations": 351,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005421049427241087,
          "right_subspace_overlap_bottom_k": -0.01392168179154396,
          "interaction_matrix_overlap_top_k": 0.007122265174984932,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.04429490864276886,
          "effective_rank_mergeability_score": 0.05026128143072128,
          "stable_rank": 0.002363264560699463,
          "spectral_gap": 0.03064604662358761,
          "singular_value_ratio": 0.03148643672466278,
          "layerwise_effective_rank": 0.05644480139017105,
          "layerwise_effective_rank_mergeability_score": 0.06181076169013977,
          "task_vector_cosine_similarity": 0.06786061078310013,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.003692965256050229,
          "weight_space_angle": 0.09246567636728287,
          "task_vector_magnitude_ratio": 0.0031891963444650173,
          "singular_value_overlap": 0.010895101353526115,
          "subspace_overlap": 0.0026315962895751,
          "right_subspace_overlap": 0.004787693731486797,
          "activation_l2_distance": 0.014825192280113697,
          "activation_cosine_similarity": 0.025519942864775658,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.010320421308279037,
          "encoder_gradient_cosine_similarity": 0.003907721024006605,
          "encoder_gradient_l2_distance": -0.020473694428801537,
          "encoder_gradient_dot_product": 0.002385206986218691,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.002684214850887656,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7482341179013767,
        "val_r": 0.6881970991990278,
        "n_iterations": 553,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007779944222420454,
          "right_subspace_overlap_bottom_k": -0.011396615765988827,
          "interaction_matrix_overlap_top_k": 0.006889307405799627,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.03443816304206848,
          "effective_rank_mergeability_score": 0.026144709438085556,
          "stable_rank": 0.003338388167321682,
          "spectral_gap": 0.08523096144199371,
          "singular_value_ratio": 0.08157100528478622,
          "layerwise_effective_rank": 0.016497613862156868,
          "layerwise_effective_rank_mergeability_score": 0.027957962825894356,
          "task_vector_cosine_similarity": 0.047195613384246826,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07377175241708755,
          "task_vector_magnitude_ratio": 0.005237981211394072,
          "singular_value_overlap": 0.008419957011938095,
          "subspace_overlap": 0.004767949227243662,
          "right_subspace_overlap": 0.011899339966475964,
          "activation_l2_distance": 0.029148584231734276,
          "activation_cosine_similarity": 0.03544263169169426,
          "activation_magnitude_ratio": 0.0014735704753547907,
          "activation_dot_product": 0.0035611253697425127,
          "encoder_gradient_cosine_similarity": 0.004923287313431501,
          "encoder_gradient_l2_distance": -0.012985944747924805,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.006510498002171516,
          "input_gradient_l2_distance": -0.01349292416125536,
          "input_gradient_dot_product": -0.0017649729270488024
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7671894062912067,
        "val_r": 0.6816614576531593,
        "n_iterations": 263,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006454101298004389,
          "right_subspace_overlap_bottom_k": -0.011690374463796616,
          "interaction_matrix_overlap_top_k": 0.0024222172796726227,
          "interaction_matrix_overlap_bottom_k": -0.0011829647701233625,
          "effective_rank": 0.05568665266036987,
          "effective_rank_mergeability_score": 0.02348557487130165,
          "stable_rank": 0.0,
          "spectral_gap": 0.0364292711019516,
          "singular_value_ratio": 0.03643253818154335,
          "layerwise_effective_rank": 0.03481423854827881,
          "layerwise_effective_rank_mergeability_score": 0.07133252918720245,
          "task_vector_cosine_similarity": 0.07468349486589432,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0810864269733429,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0032288958318531513,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.012098615989089012,
          "activation_l2_distance": 0.02853785827755928,
          "activation_cosine_similarity": 0.03428764268755913,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0027372438926249743,
          "encoder_gradient_l2_distance": -0.008756374940276146,
          "encoder_gradient_dot_product": 0.0017024684930220246,
          "input_gradient_cosine_similarity": 0.002892098855227232,
          "input_gradient_l2_distance": -0.008916477672755718,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7581867424399589,
        "val_r": 0.7533070496886474,
        "n_iterations": 341,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011465783230960369,
          "right_subspace_overlap_bottom_k": -0.013728480786085129,
          "interaction_matrix_overlap_top_k": 0.004899340681731701,
          "interaction_matrix_overlap_bottom_k": 0.0014261486940085888,
          "effective_rank": 0.05322251841425896,
          "effective_rank_mergeability_score": 0.03790004178881645,
          "stable_rank": 0.0,
          "spectral_gap": 0.04080292955040932,
          "singular_value_ratio": 0.04126583784818649,
          "layerwise_effective_rank": 0.031084634363651276,
          "layerwise_effective_rank_mergeability_score": 0.05987150967121124,
          "task_vector_cosine_similarity": 0.07971974462270737,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.10800260305404663,
          "task_vector_magnitude_ratio": 0.004927343688905239,
          "singular_value_overlap": 0.009436339139938354,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.012137345969676971,
          "activation_l2_distance": 0.012607118114829063,
          "activation_cosine_similarity": 0.023040518164634705,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.011923897080123425,
          "encoder_gradient_cosine_similarity": 0.003225516527891159,
          "encoder_gradient_l2_distance": -0.017860673367977142,
          "encoder_gradient_dot_product": 0.0020174451638013124,
          "input_gradient_cosine_similarity": 0.005515174940228462,
          "input_gradient_l2_distance": -0.014717232435941696,
          "input_gradient_dot_product": 0.0019280363339930773
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7478595387275223,
        "val_r": 0.7298390483952464,
        "n_iterations": 263,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009577536024153233,
          "right_subspace_overlap_bottom_k": -0.01370878517627716,
          "interaction_matrix_overlap_top_k": 0.0029236427508294582,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.04374336078763008,
          "effective_rank_mergeability_score": 0.01661696285009384,
          "stable_rank": 0.0031623567920178175,
          "spectral_gap": 0.04042035713791847,
          "singular_value_ratio": 0.029365137219429016,
          "layerwise_effective_rank": 0.04092630743980408,
          "layerwise_effective_rank_mergeability_score": 0.07115034759044647,
          "task_vector_cosine_similarity": 0.08090327680110931,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.10043668001890182,
          "task_vector_magnitude_ratio": 0.012022781185805798,
          "singular_value_overlap": 0.0034160849172621965,
          "subspace_overlap": 0.010266268625855446,
          "right_subspace_overlap": 0.006299299653619528,
          "activation_l2_distance": 0.013228144496679306,
          "activation_cosine_similarity": 0.02295910194516182,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0030703824013471603,
          "encoder_gradient_cosine_similarity": 0.004511023405939341,
          "encoder_gradient_l2_distance": -0.013674253597855568,
          "encoder_gradient_dot_product": 0.0022138801869004965,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.013520793057978153,
          "input_gradient_dot_product": -0.001087153097614646
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.8002974180075895,
        "val_r": 0.6050794943750459,
        "n_iterations": 263,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008655274286866188,
          "right_subspace_overlap_bottom_k": -0.013375569134950638,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.05402281880378723,
          "effective_rank_mergeability_score": 0.04060268774628639,
          "stable_rank": 0.001027920050546527,
          "spectral_gap": 0.023249223828315735,
          "singular_value_ratio": 0.0207726638764143,
          "layerwise_effective_rank": 0.02935105748474598,
          "layerwise_effective_rank_mergeability_score": 0.048227034509181976,
          "task_vector_cosine_similarity": 0.09922850131988525,
          "task_vector_l2_distance": -0.004671430215239525,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.11345893889665604,
          "task_vector_magnitude_ratio": 0.0017736094305291772,
          "singular_value_overlap": 0.00865877140313387,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.013255054131150246,
          "activation_l2_distance": 0.029413189738988876,
          "activation_cosine_similarity": 0.03714824095368385,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0013598236255347729,
          "encoder_gradient_l2_distance": -0.013986648991703987,
          "encoder_gradient_dot_product": 0.0010415377328172326,
          "input_gradient_cosine_similarity": 0.005942468531429768,
          "input_gradient_l2_distance": -0.010748865082859993,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.769711971300589,
        "val_r": 0.7567865532489317,
        "n_iterations": 320,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008392978459596634,
          "right_subspace_overlap_bottom_k": -0.013712020590901375,
          "interaction_matrix_overlap_top_k": 0.005573976784944534,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.06935754418373108,
          "effective_rank_mergeability_score": 0.044140227138996124,
          "stable_rank": 0.0,
          "spectral_gap": 0.032377131283283234,
          "singular_value_ratio": 0.02941538766026497,
          "layerwise_effective_rank": 0.03393636271357536,
          "layerwise_effective_rank_mergeability_score": 0.06426579505205154,
          "task_vector_cosine_similarity": 0.06937575340270996,
          "task_vector_l2_distance": -0.001691895187832415,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.084381602704525,
          "task_vector_magnitude_ratio": 0.0012477264972403646,
          "singular_value_overlap": 0.005465805996209383,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008707348257303238,
          "activation_l2_distance": 0.02093588188290596,
          "activation_cosine_similarity": 0.0296732559800148,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0017937201773747802,
          "encoder_gradient_cosine_similarity": 0.004042437300086021,
          "encoder_gradient_l2_distance": -0.013344700448215008,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0035255993716418743,
          "input_gradient_l2_distance": -0.01508785504847765,
          "input_gradient_dot_product": -0.0010589327430352569
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7432388133180653,
        "val_r": 0.7082440313059885,
        "n_iterations": 443,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009637675248086452,
          "right_subspace_overlap_bottom_k": -0.015366344712674618,
          "interaction_matrix_overlap_top_k": 0.0036534336395561695,
          "interaction_matrix_overlap_bottom_k": -0.0024863588623702526,
          "effective_rank": 0.06343119591474533,
          "effective_rank_mergeability_score": 0.0312346164137125,
          "stable_rank": 0.0015931872185319662,
          "spectral_gap": 0.026381472125649452,
          "singular_value_ratio": 0.02404179237782955,
          "layerwise_effective_rank": 0.036310821771621704,
          "layerwise_effective_rank_mergeability_score": 0.0838649794459343,
          "task_vector_cosine_similarity": 0.07798988372087479,
          "task_vector_l2_distance": -0.00239388644695282,
          "task_vector_dot_product": 0.006045778747648001,
          "weight_space_angle": 0.0884164422750473,
          "task_vector_magnitude_ratio": 0.001813146285712719,
          "singular_value_overlap": 0.011165876872837543,
          "subspace_overlap": 0.002216784516349435,
          "right_subspace_overlap": 0.003078971989452839,
          "activation_l2_distance": 0.023887399584054947,
          "activation_cosine_similarity": 0.037242159247398376,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.007796066347509623,
          "encoder_gradient_cosine_similarity": 0.004506764933466911,
          "encoder_gradient_l2_distance": -0.01661876030266285,
          "encoder_gradient_dot_product": 0.004786347039043903,
          "input_gradient_cosine_similarity": 0.004541096743196249,
          "input_gradient_l2_distance": -0.02242879383265972,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7809695131399639,
        "val_r": 0.5721181922635667,
        "n_iterations": 393,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012453481554985046,
          "right_subspace_overlap_bottom_k": -0.015779249370098114,
          "interaction_matrix_overlap_top_k": 0.0012630483834072948,
          "interaction_matrix_overlap_bottom_k": 0.0011031199246644974,
          "effective_rank": 0.06878064572811127,
          "effective_rank_mergeability_score": 0.04936038330197334,
          "stable_rank": 0.0012358356034383178,
          "spectral_gap": 0.023178022354841232,
          "singular_value_ratio": 0.022180868312716484,
          "layerwise_effective_rank": 0.03474090248346329,
          "layerwise_effective_rank_mergeability_score": 0.06030777841806412,
          "task_vector_cosine_similarity": 0.08493194729089737,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.003767920657992363,
          "weight_space_angle": 0.1044832319021225,
          "task_vector_magnitude_ratio": 0.004190361592918634,
          "singular_value_overlap": 0.0032245106995105743,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.011486532166600227,
          "activation_l2_distance": 0.02102701924741268,
          "activation_cosine_similarity": 0.027701159939169884,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0010130873415619135,
          "encoder_gradient_cosine_similarity": 0.004535524640232325,
          "encoder_gradient_l2_distance": -0.011328227818012238,
          "encoder_gradient_dot_product": 0.002676913980394602,
          "input_gradient_cosine_similarity": 0.001949070836417377,
          "input_gradient_l2_distance": -0.005787009373307228,
          "input_gradient_dot_product": -0.002177067566663027
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7575936474178476,
        "val_r": 0.68876481323963,
        "n_iterations": 243,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0028196878265589476,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.06290663033723831,
          "effective_rank_mergeability_score": 0.030593276023864746,
          "stable_rank": 0.0,
          "spectral_gap": 0.04742387309670448,
          "singular_value_ratio": 0.028729286044836044,
          "layerwise_effective_rank": 0.050136078149080276,
          "layerwise_effective_rank_mergeability_score": 0.0874861404299736,
          "task_vector_cosine_similarity": 0.06367392092943192,
          "task_vector_l2_distance": -0.005943020805716515,
          "task_vector_dot_product": -0.0012564667267724872,
          "weight_space_angle": 0.07664602994918823,
          "task_vector_magnitude_ratio": 0.013813228346407413,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.006367349531501532,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.01660252921283245,
          "activation_cosine_similarity": 0.0194159634411335,
          "activation_magnitude_ratio": -0.001308659790083766,
          "activation_dot_product": 0.008425704203546047,
          "encoder_gradient_cosine_similarity": 0.0011651107342913747,
          "encoder_gradient_l2_distance": -0.009744662791490555,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003460187930613756,
          "input_gradient_l2_distance": -0.009204111993312836,
          "input_gradient_dot_product": 0.0013533078599721193
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_r": 0.20681682351991035,
      "train_p": 1.8337289723875815e-32,
      "val_r": -0.06623537928182745,
      "val_p": 0.21121823215719754
    },
    "per_fold_stats": {
      "train_r_mean": 0.4020602173767463,
      "train_r_std": 0.11988676946900144,
      "val_r_mean": 0.3080382326484644,
      "val_r_std": 0.20502155606750072,
      "n_nonzero_mean": 24.75,
      "n_nonzero_std": 1.920286436967152
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0050026485696434975,
      "right_subspace_overlap_bottom_k": 0.005834916140884161,
      "interaction_matrix_overlap_top_k": 0.0036775744520127773,
      "interaction_matrix_overlap_bottom_k": 0.06419934332370758,
      "effective_rank": 0.026529882103204727,
      "effective_rank_mergeability_score": 0.04969625547528267,
      "stable_rank": 0.014260893687605858,
      "spectral_gap": 0.055154889822006226,
      "singular_value_ratio": 0.02664296329021454,
      "layerwise_effective_rank": 0.03246966376900673,
      "layerwise_effective_rank_mergeability_score": 0.030321979895234108,
      "task_vector_cosine_similarity": 0.033555708825588226,
      "task_vector_l2_distance": -0.004642520099878311,
      "task_vector_dot_product": 0.002283920766785741,
      "weight_space_angle": 0.06355614960193634,
      "task_vector_magnitude_ratio": 0.0023139158729463816,
      "singular_value_overlap": -0.004964123945683241,
      "subspace_overlap": 0.0398387536406517,
      "right_subspace_overlap": 0.005033909343183041,
      "activation_l2_distance": 0.009047386236488819,
      "activation_cosine_similarity": 0.006861566100269556,
      "activation_magnitude_ratio": 0.0006721236277371645,
      "activation_dot_product": 0.005115295294672251,
      "encoder_gradient_cosine_similarity": 0.008529935963451862,
      "encoder_gradient_l2_distance": -0.0012927325442433357,
      "encoder_gradient_dot_product": 0.009031449444591999,
      "input_gradient_cosine_similarity": 0.014061744324862957,
      "input_gradient_l2_distance": -0.006346783135086298,
      "input_gradient_dot_product": 0.0013193546328693628
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.00527644157409668,
      "right_subspace_overlap_bottom_k": 0.005057893227785826,
      "interaction_matrix_overlap_top_k": 0.0046028089709579945,
      "interaction_matrix_overlap_bottom_k": 0.04041263833642006,
      "effective_rank": 0.022992722690105438,
      "effective_rank_mergeability_score": 0.027269862592220306,
      "stable_rank": 0.00974889937788248,
      "spectral_gap": 0.01780964806675911,
      "singular_value_ratio": 0.023738563060760498,
      "layerwise_effective_rank": 0.02656368725001812,
      "layerwise_effective_rank_mergeability_score": 0.026137739419937134,
      "task_vector_cosine_similarity": 0.02867422066628933,
      "task_vector_l2_distance": 0.007369569037109613,
      "task_vector_dot_product": 0.003109127515926957,
      "weight_space_angle": 0.021712666377425194,
      "task_vector_magnitude_ratio": 0.003084976226091385,
      "singular_value_overlap": 0.005290892440825701,
      "subspace_overlap": 0.03355112299323082,
      "right_subspace_overlap": 0.005296109244227409,
      "activation_l2_distance": 0.009097130037844181,
      "activation_cosine_similarity": 0.0054947007447481155,
      "activation_magnitude_ratio": 0.00672015268355608,
      "activation_dot_product": 0.006461990997195244,
      "encoder_gradient_cosine_similarity": 0.009647076949477196,
      "encoder_gradient_l2_distance": 0.0035873805172741413,
      "encoder_gradient_dot_product": 0.00725163659080863,
      "input_gradient_cosine_similarity": 0.011053862050175667,
      "input_gradient_l2_distance": 0.007068573962897062,
      "input_gradient_dot_product": 0.004239276517182589
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.75,
      "right_subspace_overlap_bottom_k": 0.9,
      "interaction_matrix_overlap_top_k": 0.7,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 0.9,
      "effective_rank_mergeability_score": 1.0,
      "stable_rank": 0.95,
      "spectral_gap": 1.0,
      "singular_value_ratio": 1.0,
      "layerwise_effective_rank": 1.0,
      "layerwise_effective_rank_mergeability_score": 1.0,
      "task_vector_cosine_similarity": 1.0,
      "task_vector_l2_distance": 0.7,
      "task_vector_dot_product": 0.6,
      "weight_space_angle": 1.0,
      "task_vector_magnitude_ratio": 0.6,
      "singular_value_overlap": 0.8,
      "subspace_overlap": 1.0,
      "right_subspace_overlap": 0.7,
      "activation_l2_distance": 0.95,
      "activation_cosine_similarity": 0.85,
      "activation_magnitude_ratio": 0.7,
      "activation_dot_product": 0.85,
      "encoder_gradient_cosine_similarity": 0.9,
      "encoder_gradient_l2_distance": 0.7,
      "encoder_gradient_dot_product": 0.95,
      "input_gradient_cosine_similarity": 0.95,
      "input_gradient_l2_distance": 0.7,
      "input_gradient_dot_product": 0.65
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.3234348499457338,
        "val_r": 0.2247130145938361,
        "n_iterations": 217,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.012105781584978104,
          "interaction_matrix_overlap_top_k": 0.0030521852895617485,
          "interaction_matrix_overlap_bottom_k": 0.09157423675060272,
          "effective_rank": 0.004457312636077404,
          "effective_rank_mergeability_score": 0.029378267005085945,
          "stable_rank": 0.010411798022687435,
          "spectral_gap": 0.07126694917678833,
          "singular_value_ratio": 0.010321298614144325,
          "layerwise_effective_rank": 0.04660293832421303,
          "layerwise_effective_rank_mergeability_score": 0.002659787191078067,
          "task_vector_cosine_similarity": 0.01698037050664425,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07417549192905426,
          "task_vector_magnitude_ratio": 0.002828029217198491,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.06728126108646393,
          "right_subspace_overlap": -0.001415751175954938,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.002772153355181217,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0050691100768744946,
          "encoder_gradient_cosine_similarity": 0.0024271132424473763,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.010018312372267246,
          "input_gradient_cosine_similarity": 0.006557122804224491,
          "input_gradient_l2_distance": -0.0038260973524302244,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5063520549915409,
        "val_r": 0.4073152951056832,
        "n_iterations": 374,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.001887317281216383,
          "right_subspace_overlap_bottom_k": 0.0032892944291234016,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.02297503501176834,
          "effective_rank": 0.021457819268107414,
          "effective_rank_mergeability_score": 0.052402276545763016,
          "stable_rank": 0.03325341269373894,
          "spectral_gap": 0.07027751207351685,
          "singular_value_ratio": 0.06031401827931404,
          "layerwise_effective_rank": 0.04964178428053856,
          "layerwise_effective_rank_mergeability_score": 0.046685606241226196,
          "task_vector_cosine_similarity": 0.0724324882030487,
          "task_vector_l2_distance": -0.014132550917565823,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.07597047090530396,
          "task_vector_magnitude_ratio": 0.0012874412350356579,
          "singular_value_overlap": -0.014101849868893623,
          "subspace_overlap": 0.0036467788740992546,
          "right_subspace_overlap": 0.003374922089278698,
          "activation_l2_distance": 0.004970336798578501,
          "activation_cosine_similarity": 0.002776562701910734,
          "activation_magnitude_ratio": -0.001985767390578985,
          "activation_dot_product": -0.0013917190954089165,
          "encoder_gradient_cosine_similarity": 0.0010788694489747286,
          "encoder_gradient_l2_distance": -0.006919016595929861,
          "encoder_gradient_dot_product": 0.00308799184858799,
          "input_gradient_cosine_similarity": 0.005165811628103256,
          "input_gradient_l2_distance": -0.017339300364255905,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.3040439584951941,
        "val_r": 0.22745240994297783,
        "n_iterations": 276,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009240318089723587,
          "right_subspace_overlap_bottom_k": 0.009684229269623756,
          "interaction_matrix_overlap_top_k": 0.00604553148150444,
          "interaction_matrix_overlap_bottom_k": 0.05985346809029579,
          "effective_rank": 0.02490375190973282,
          "effective_rank_mergeability_score": 0.03555745258927345,
          "stable_rank": 0.02669820748269558,
          "spectral_gap": 0.062099020928144455,
          "singular_value_ratio": 0.014614586718380451,
          "layerwise_effective_rank": 0.001051372499205172,
          "layerwise_effective_rank_mergeability_score": 0.021604740992188454,
          "task_vector_cosine_similarity": 0.005331520456820726,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.06697136163711548,
          "task_vector_magnitude_ratio": 0.010504861362278461,
          "singular_value_overlap": -0.001542209181934595,
          "subspace_overlap": 0.061107248067855835,
          "right_subspace_overlap": 0.00856365729123354,
          "activation_l2_distance": 0.0023748399689793587,
          "activation_cosine_similarity": 0.0024366218131035566,
          "activation_magnitude_ratio": -0.001734964200295508,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.017473220825195312,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.015604173764586449,
          "input_gradient_cosine_similarity": 0.01966654136776924,
          "input_gradient_l2_distance": -0.004335665609687567,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.31016256464529135,
        "val_r": 0.31765456513106793,
        "n_iterations": 367,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008971421048045158,
          "right_subspace_overlap_bottom_k": 0.005252446513622999,
          "interaction_matrix_overlap_top_k": 0.004304743837565184,
          "interaction_matrix_overlap_bottom_k": 0.1040075346827507,
          "effective_rank": 0.0045882281847298145,
          "effective_rank_mergeability_score": 0.03175710141658783,
          "stable_rank": 0.019804328680038452,
          "spectral_gap": 0.0499516986310482,
          "singular_value_ratio": 0.004011484328657389,
          "layerwise_effective_rank": 0.013139410875737667,
          "layerwise_effective_rank_mergeability_score": 0.01739640161395073,
          "task_vector_cosine_similarity": 0.01262974925339222,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0012931261444464326,
          "weight_space_angle": 0.048817653208971024,
          "task_vector_magnitude_ratio": 0.005295718554407358,
          "singular_value_overlap": -0.004574656952172518,
          "subspace_overlap": 0.06458920985460281,
          "right_subspace_overlap": 0.009590886533260345,
          "activation_l2_distance": 0.04191824421286583,
          "activation_cosine_similarity": 0.016479773446917534,
          "activation_magnitude_ratio": 0.001886219484731555,
          "activation_dot_product": 0.01124405488371849,
          "encoder_gradient_cosine_similarity": 0.010928524658083916,
          "encoder_gradient_l2_distance": -0.0010634582722559571,
          "encoder_gradient_dot_product": 0.01319578941911459,
          "input_gradient_cosine_similarity": 0.031876157969236374,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5570360965370867,
        "val_r": 0.5838090006701524,
        "n_iterations": 760,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004903800319880247,
          "right_subspace_overlap_bottom_k": 0.0018180327024310827,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.021841906011104584,
          "effective_rank": 0.03679506108164787,
          "effective_rank_mergeability_score": 0.03914790228009224,
          "stable_rank": 0.0025956290774047375,
          "spectral_gap": 0.06471437960863113,
          "singular_value_ratio": 0.05822739377617836,
          "layerwise_effective_rank": 0.04926056042313576,
          "layerwise_effective_rank_mergeability_score": 0.051924027502536774,
          "task_vector_cosine_similarity": 0.09222477674484253,
          "task_vector_l2_distance": -0.015972480177879333,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.09814286977052689,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.013685159385204315,
          "subspace_overlap": 0.0013385923812165856,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.004427280277013779,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002715685870498419,
          "activation_dot_product": -0.0023484486155211926,
          "encoder_gradient_cosine_similarity": -0.0015439426060765982,
          "encoder_gradient_l2_distance": -0.004224705044180155,
          "encoder_gradient_dot_product": 0.0036125383339822292,
          "input_gradient_cosine_similarity": 0.0018076575361192226,
          "input_gradient_l2_distance": -0.013345361687242985,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.2970791307057157,
        "val_r": 0.46116854011954006,
        "n_iterations": 258,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0029942835681140423,
          "right_subspace_overlap_bottom_k": 0.001216050935909152,
          "interaction_matrix_overlap_top_k": 0.0018693564925342798,
          "interaction_matrix_overlap_bottom_k": 0.09757205843925476,
          "effective_rank": 0.007005484774708748,
          "effective_rank_mergeability_score": 0.05895364657044411,
          "stable_rank": 0.011580719612538815,
          "spectral_gap": 0.04870785027742386,
          "singular_value_ratio": 0.005213411524891853,
          "layerwise_effective_rank": 0.03585762530565262,
          "layerwise_effective_rank_mergeability_score": 0.004559795372188091,
          "task_vector_cosine_similarity": 0.02555685304105282,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0010621235705912113,
          "weight_space_angle": 0.05343850329518318,
          "task_vector_magnitude_ratio": 0.006027781404554844,
          "singular_value_overlap": -0.0011435332708060741,
          "subspace_overlap": 0.07622770220041275,
          "right_subspace_overlap": 0.0068550193682312965,
          "activation_l2_distance": 0.006181170232594013,
          "activation_cosine_similarity": 0.00982162356376648,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.002186410129070282,
          "encoder_gradient_cosine_similarity": 0.013340622186660767,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.003602496115490794,
          "input_gradient_cosine_similarity": 0.025860536843538284,
          "input_gradient_l2_distance": -0.003108869306743145,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.36052862462933916,
        "val_r": -0.19047123697990567,
        "n_iterations": 220,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012613439466804266,
          "right_subspace_overlap_bottom_k": 0.019421368837356567,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.10714103281497955,
          "effective_rank": 0.009106048382818699,
          "effective_rank_mergeability_score": 0.04194368049502373,
          "stable_rank": 0.016658129170536995,
          "spectral_gap": 0.03908972069621086,
          "singular_value_ratio": 0.005805380642414093,
          "layerwise_effective_rank": 0.0018089241348206997,
          "layerwise_effective_rank_mergeability_score": 0.011528149247169495,
          "task_vector_cosine_similarity": 0.00225519435480237,
          "task_vector_l2_distance": 0.0034855741541832685,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.08066590130329132,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.06282069534063339,
          "right_subspace_overlap": 0.007096030283719301,
          "activation_l2_distance": 0.0025064614601433277,
          "activation_cosine_similarity": 0.01696012355387211,
          "activation_magnitude_ratio": 0.02895294316112995,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.018304258584976196,
          "encoder_gradient_l2_distance": -0.0011679647723212838,
          "encoder_gradient_dot_product": 0.017576206475496292,
          "input_gradient_cosine_similarity": 0.019100243225693703,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": 0.001853608526289463
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.30495282656937817,
        "val_r": 0.32353188974045227,
        "n_iterations": 220,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011304913088679314,
          "right_subspace_overlap_bottom_k": 0.006661118473857641,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.13470561802387238,
          "effective_rank": 0.01803911291062832,
          "effective_rank_mergeability_score": 0.0012207827530801296,
          "stable_rank": 0.010950927622616291,
          "spectral_gap": 0.10125505179166794,
          "singular_value_ratio": 0.012847991660237312,
          "layerwise_effective_rank": 0.0029990561306476593,
          "layerwise_effective_rank_mergeability_score": 0.014093853533267975,
          "task_vector_cosine_similarity": 0.017038246616721153,
          "task_vector_l2_distance": 0.0022872621193528175,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0025441257748752832,
          "task_vector_magnitude_ratio": 0.0013816911960020661,
          "singular_value_overlap": -0.0018726969137787819,
          "subspace_overlap": 0.05444205179810524,
          "right_subspace_overlap": 0.014401545748114586,
          "activation_l2_distance": 0.015719885006546974,
          "activation_cosine_similarity": 0.009402060881257057,
          "activation_magnitude_ratio": 0.0024967254139482975,
          "activation_dot_product": 0.0010216168593615294,
          "encoder_gradient_cosine_similarity": 0.006988592445850372,
          "encoder_gradient_l2_distance": 0.007570573128759861,
          "encoder_gradient_dot_product": 0.006068970076739788,
          "input_gradient_cosine_similarity": 0.020022297278046608,
          "input_gradient_l2_distance": 0.0033267135731875896,
          "input_gradient_dot_product": 0.015221193432807922
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.2884479421618031,
        "val_r": -0.09709731957269038,
        "n_iterations": 285,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004074038937687874,
          "right_subspace_overlap_bottom_k": 0.007204233668744564,
          "interaction_matrix_overlap_top_k": 0.0028495164588093758,
          "interaction_matrix_overlap_bottom_k": 0.08317329734563828,
          "effective_rank": 0.010575196705758572,
          "effective_rank_mergeability_score": 0.05296779051423073,
          "stable_rank": 0.012971463613212109,
          "spectral_gap": 0.031121253967285156,
          "singular_value_ratio": 0.010335765779018402,
          "layerwise_effective_rank": 0.004155052825808525,
          "layerwise_effective_rank_mergeability_score": 0.018960127606987953,
          "task_vector_cosine_similarity": 0.011944541707634926,
          "task_vector_l2_distance": 0.0010641072876751423,
          "task_vector_dot_product": 0.009092269465327263,
          "weight_space_angle": 0.04467841610312462,
          "task_vector_magnitude_ratio": 0.0017658377764746547,
          "singular_value_overlap": 0.002077947836369276,
          "subspace_overlap": 0.06892240047454834,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.01937124878168106,
          "activation_cosine_similarity": 0.017238397151231766,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.004659892991185188,
          "encoder_gradient_cosine_similarity": 0.03754547983407974,
          "encoder_gradient_l2_distance": 0.0029650405049324036,
          "encoder_gradient_dot_product": 0.02316119149327278,
          "input_gradient_cosine_similarity": 0.025677356868982315,
          "input_gradient_l2_distance": 0.0011133492225781083,
          "input_gradient_dot_product": 0.009266708046197891
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.2906153479455351,
        "val_r": 0.2943712262795681,
        "n_iterations": 271,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010208917781710625,
          "right_subspace_overlap_bottom_k": 0.009297299198806286,
          "interaction_matrix_overlap_top_k": 0.015128380618989468,
          "interaction_matrix_overlap_bottom_k": 0.10255273431539536,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.036444973200559616,
          "stable_rank": 0.013604273088276386,
          "spectral_gap": 0.05436825379729271,
          "singular_value_ratio": 0.012876687571406364,
          "layerwise_effective_rank": 0.014603562653064728,
          "layerwise_effective_rank_mergeability_score": 0.007856684736907482,
          "task_vector_cosine_similarity": 0.0143578564748168,
          "task_vector_l2_distance": 0.001190589857287705,
          "task_vector_dot_product": 0.0055854180827736855,
          "weight_space_angle": 0.06998147815465927,
          "task_vector_magnitude_ratio": -0.0011208293726667762,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.07592980563640594,
          "right_subspace_overlap": 0.009888555854558945,
          "activation_l2_distance": 0.0014745327644050121,
          "activation_cosine_similarity": 0.009045174345374107,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.007947883568704128,
          "encoder_gradient_cosine_similarity": 0.0058761839754879475,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.020907077938318253,
          "input_gradient_cosine_similarity": 0.0022248949389904737,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.32453498490917926,
        "val_r": 0.4312108227310043,
        "n_iterations": 272,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009619316086173058,
          "right_subspace_overlap_bottom_k": 0.014005456119775772,
          "interaction_matrix_overlap_top_k": 0.00934008602052927,
          "interaction_matrix_overlap_bottom_k": 0.0682634636759758,
          "effective_rank": 0.010394608601927757,
          "effective_rank_mergeability_score": 0.10407387465238571,
          "stable_rank": 0.0,
          "spectral_gap": 0.03676209971308708,
          "singular_value_ratio": 0.013880248181521893,
          "layerwise_effective_rank": 0.09846631437540054,
          "layerwise_effective_rank_mergeability_score": 0.004541289061307907,
          "task_vector_cosine_similarity": 0.010602984577417374,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.004629894159734249,
          "weight_space_angle": 0.030661607161164284,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.01466003991663456,
          "right_subspace_overlap": 0.002730089705437422,
          "activation_l2_distance": 0.01087195985019207,
          "activation_cosine_similarity": 0.009480404667556286,
          "activation_magnitude_ratio": -0.0016753474483266473,
          "activation_dot_product": 0.013241962529718876,
          "encoder_gradient_cosine_similarity": 0.0014238925650715828,
          "encoder_gradient_l2_distance": -0.002332544419914484,
          "encoder_gradient_dot_product": 0.00406532222405076,
          "input_gradient_cosine_similarity": 0.03191094100475311,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": 0.0028482505585998297
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.47962457721974694,
        "val_r": 0.41575144882486964,
        "n_iterations": 404,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004349709954112768,
          "interaction_matrix_overlap_top_k": -0.0022377921268343925,
          "interaction_matrix_overlap_bottom_k": 0.02208542451262474,
          "effective_rank": 0.04822773486375809,
          "effective_rank_mergeability_score": 0.09229253232479095,
          "stable_rank": 0.022683437913656235,
          "spectral_gap": 0.051397450268268585,
          "singular_value_ratio": 0.03751422464847565,
          "layerwise_effective_rank": 0.0676909014582634,
          "layerwise_effective_rank_mergeability_score": 0.04627424478530884,
          "task_vector_cosine_similarity": 0.05156388878822327,
          "task_vector_l2_distance": -0.016707027330994606,
          "task_vector_dot_product": 0.0052054282277822495,
          "weight_space_angle": 0.06650687009096146,
          "task_vector_magnitude_ratio": 0.001068370882421732,
          "singular_value_overlap": -0.010322016663849354,
          "subspace_overlap": 0.008317001163959503,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.007107316050678492,
          "activation_cosine_similarity": 0.003972445614635944,
          "activation_magnitude_ratio": -0.0021591882687062025,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0017579493578523397,
          "encoder_gradient_l2_distance": -0.0031789850909262896,
          "encoder_gradient_dot_product": 0.0017002332024276257,
          "input_gradient_cosine_similarity": 0.00276566157117486,
          "input_gradient_l2_distance": -0.01182587817311287,
          "input_gradient_dot_product": -0.002640761900693178
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.49283417502784743,
        "val_r": 0.4724309280549316,
        "n_iterations": 423,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.025070233270525932,
          "effective_rank": 0.060015883296728134,
          "effective_rank_mergeability_score": 0.08279780298471451,
          "stable_rank": 0.03089010901749134,
          "spectral_gap": 0.06342441588640213,
          "singular_value_ratio": 0.05090634152293205,
          "layerwise_effective_rank": 0.03706544265151024,
          "layerwise_effective_rank_mergeability_score": 0.03839727118611336,
          "task_vector_cosine_similarity": 0.06508945673704147,
          "task_vector_l2_distance": -0.01259162649512291,
          "task_vector_dot_product": -0.0010337303392589092,
          "weight_space_angle": 0.06273765116930008,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.012714223936200142,
          "subspace_overlap": 0.0023911839816719294,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0075680967420339584,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003523873398080468,
          "activation_dot_product": 0.0015368795720860362,
          "encoder_gradient_cosine_similarity": 0.0011968198232352734,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.004451029933989048,
          "input_gradient_cosine_similarity": 0.006837334018200636,
          "input_gradient_l2_distance": -0.015475133433938026,
          "input_gradient_dot_product": -0.0016597347566857934
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.26786927253104853,
        "val_r": 0.43831991763755984,
        "n_iterations": 477,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012373083271086216,
          "right_subspace_overlap_bottom_k": 0.005002265330404043,
          "interaction_matrix_overlap_top_k": 0.011106531135737896,
          "interaction_matrix_overlap_bottom_k": 0.09595635533332825,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.05617320537567139,
          "stable_rank": 0.014119816944003105,
          "spectral_gap": 0.04066113010048866,
          "singular_value_ratio": 0.004337072838097811,
          "layerwise_effective_rank": 0.017435628920793533,
          "layerwise_effective_rank_mergeability_score": 0.003313993336632848,
          "task_vector_cosine_similarity": 0.0017888844013214111,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.05947111174464226,
          "task_vector_magnitude_ratio": 0.007630105130374432,
          "singular_value_overlap": -0.0028392933309078217,
          "subspace_overlap": 0.0802265852689743,
          "right_subspace_overlap": 0.00698067294433713,
          "activation_l2_distance": 0.012537820264697075,
          "activation_cosine_similarity": 0.0026464578695595264,
          "activation_magnitude_ratio": 0.0012226359685882926,
          "activation_dot_product": 0.019216204062104225,
          "encoder_gradient_cosine_similarity": 0.022978490218520164,
          "encoder_gradient_l2_distance": 0.003457120154052973,
          "encoder_gradient_dot_product": 0.014284062199294567,
          "input_gradient_cosine_similarity": 0.01740487478673458,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": 0.005060833878815174
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4751272945059014,
        "val_r": 0.5681104634664744,
        "n_iterations": 681,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0020882892422378063,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.016329409554600716,
          "effective_rank": 0.07474885135889053,
          "effective_rank_mergeability_score": 0.08317190408706665,
          "stable_rank": 0.001452677883207798,
          "spectral_gap": 0.0633162260055542,
          "singular_value_ratio": 0.05823477357625961,
          "layerwise_effective_rank": 0.058033592998981476,
          "layerwise_effective_rank_mergeability_score": 0.05667423829436302,
          "task_vector_cosine_similarity": 0.04676862433552742,
          "task_vector_l2_distance": -0.00981929711997509,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.05577229708433151,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.01072001364082098,
          "subspace_overlap": 0.007792133372277021,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.001711905817501247,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003539605997502804,
          "activation_dot_product": -0.0014568404294550419,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.004066281020641327,
          "encoder_gradient_dot_product": 0.0012040629517287016,
          "input_gradient_cosine_similarity": 0.003284706501290202,
          "input_gradient_l2_distance": -0.013846809044480324,
          "input_gradient_dot_product": -0.0012771805049851537
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5316493955534956,
        "val_r": 0.33571292161242405,
        "n_iterations": 456,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0022839016746729612,
          "interaction_matrix_overlap_top_k": 0.0012188879773020744,
          "interaction_matrix_overlap_bottom_k": 0.02012234553694725,
          "effective_rank": 0.06030718609690666,
          "effective_rank_mergeability_score": 0.07771886885166168,
          "stable_rank": 0.00970469694584608,
          "spectral_gap": 0.05812413617968559,
          "singular_value_ratio": 0.05346459522843361,
          "layerwise_effective_rank": 0.05206706374883652,
          "layerwise_effective_rank_mergeability_score": 0.04200845956802368,
          "task_vector_cosine_similarity": 0.06891856342554092,
          "task_vector_l2_distance": -0.0151622723788023,
          "task_vector_dot_product": 0.0013853204436600208,
          "weight_space_angle": 0.07160083204507828,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.006040120497345924,
          "subspace_overlap": 0.0015570592368021607,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.012850149534642696,
          "activation_cosine_similarity": 0.004282104782760143,
          "activation_magnitude_ratio": -0.0035887539852410555,
          "activation_dot_product": 0.002080171834677458,
          "encoder_gradient_cosine_similarity": 0.0010680537670850754,
          "encoder_gradient_l2_distance": -0.002811357844620943,
          "encoder_gradient_dot_product": 0.001842282246798277,
          "input_gradient_cosine_similarity": 0.003347939345985651,
          "input_gradient_l2_distance": -0.011519668623805046,
          "input_gradient_dot_product": -0.0020763122010976076
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.29248938669788566,
        "val_r": 0.2664098703647227,
        "n_iterations": 417,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014905480667948723,
          "right_subspace_overlap_bottom_k": 0.004391595255583525,
          "interaction_matrix_overlap_top_k": 0.008477793075144291,
          "interaction_matrix_overlap_bottom_k": 0.07864594459533691,
          "effective_rank": 0.0079755038022995,
          "effective_rank_mergeability_score": 0.02370840683579445,
          "stable_rank": 0.011631493456661701,
          "spectral_gap": 0.04520896077156067,
          "singular_value_ratio": 0.005626408848911524,
          "layerwise_effective_rank": 0.003824335290119052,
          "layerwise_effective_rank_mergeability_score": 0.004694455768913031,
          "task_vector_cosine_similarity": 0.0026400000788271427,
          "task_vector_l2_distance": -0.002606102265417576,
          "task_vector_dot_product": 0.002019460080191493,
          "weight_space_angle": 0.08624841272830963,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.003883832599967718,
          "subspace_overlap": 0.0998578816652298,
          "right_subspace_overlap": 0.014890080317854881,
          "activation_l2_distance": 0.0070493086241185665,
          "activation_cosine_similarity": 0.008612453937530518,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.020812060683965683,
          "encoder_gradient_cosine_similarity": 0.013568608090281487,
          "encoder_gradient_l2_distance": -0.0026981139089912176,
          "encoder_gradient_dot_product": 0.019612358883023262,
          "input_gradient_cosine_similarity": 0.01663484424352646,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": 0.002961922436952591
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.3845796235521117,
        "val_r": -0.03616753092254377,
        "n_iterations": 249,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0010657534003257751,
          "right_subspace_overlap_bottom_k": 0.007417366374284029,
          "interaction_matrix_overlap_top_k": 0.009852616116404533,
          "interaction_matrix_overlap_bottom_k": 0.11164368689060211,
          "effective_rank": 0.026476822793483734,
          "effective_rank_mergeability_score": 0.004187475424259901,
          "stable_rank": 0.028568902984261513,
          "spectral_gap": 0.03170979022979736,
          "singular_value_ratio": 0.0012004534946754575,
          "layerwise_effective_rank": 0.0035597386304289103,
          "layerwise_effective_rank_mergeability_score": 0.08677110821008682,
          "task_vector_cosine_similarity": 0.017523106187582016,
          "task_vector_l2_distance": 0.0014307107776403427,
          "task_vector_dot_product": 0.002687889849767089,
          "weight_space_angle": 0.04965782165527344,
          "task_vector_magnitude_ratio": 0.005587821360677481,
          "singular_value_overlap": -0.002252239268273115,
          "subspace_overlap": 0.04248855635523796,
          "right_subspace_overlap": 0.007257794961333275,
          "activation_l2_distance": 0.012918264605104923,
          "activation_cosine_similarity": 0.011389434337615967,
          "activation_magnitude_ratio": 0.0011371473083272576,
          "activation_dot_product": 0.006966262124478817,
          "encoder_gradient_cosine_similarity": 0.011662304401397705,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.012739129364490509,
          "input_gradient_cosine_similarity": 0.032900117337703705,
          "input_gradient_l2_distance": -0.004182205535471439,
          "input_gradient_dot_product": 0.001621114439330995
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6911544293523026,
        "val_r": 0.5001974589795519,
        "n_iterations": 359,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011462780646979809,
          "right_subspace_overlap_bottom_k": -0.0018214936135336757,
          "interaction_matrix_overlap_top_k": 0.0014494727365672588,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.05021950602531433,
          "effective_rank_mergeability_score": 0.028694629669189453,
          "stable_rank": 0.00132488994859159,
          "spectral_gap": 0.03445211425423622,
          "singular_value_ratio": 0.03769076243042946,
          "layerwise_effective_rank": 0.05404794216156006,
          "layerwise_effective_rank_mergeability_score": 0.09017971903085709,
          "task_vector_cosine_similarity": 0.06826629489660263,
          "task_vector_l2_distance": 0.001069343532435596,
          "task_vector_dot_product": 0.010312303900718689,
          "weight_space_angle": 0.09711143374443054,
          "task_vector_magnitude_ratio": 0.004021492321044207,
          "singular_value_overlap": -0.0021965072955936193,
          "subspace_overlap": 0.0010810114908963442,
          "right_subspace_overlap": 0.012345829978585243,
          "activation_l2_distance": 0.006153657101094723,
          "activation_cosine_similarity": 0.007873660884797573,
          "activation_magnitude_ratio": -0.0013300133869051933,
          "activation_dot_product": 0.007594991475343704,
          "encoder_gradient_cosine_similarity": 0.004523669369518757,
          "encoder_gradient_l2_distance": -0.009721306152641773,
          "encoder_gradient_dot_product": 0.003895784728229046,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.013196360319852829,
          "input_gradient_dot_product": -0.0030927867628633976
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5586878115587891,
        "val_r": 0.21634096718961132,
        "n_iterations": 254,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.00511967996135354,
          "interaction_matrix_overlap_top_k": 0.0010941813234239817,
          "interaction_matrix_overlap_bottom_k": 0.020473098382353783,
          "effective_rank": 0.05530351772904396,
          "effective_rank_mergeability_score": 0.06133255362510681,
          "stable_rank": 0.006312975659966469,
          "spectral_gap": 0.08518984168767929,
          "singular_value_ratio": 0.07543633133172989,
          "layerwise_effective_rank": 0.038081925362348557,
          "layerwise_effective_rank_mergeability_score": 0.036315616220235825,
          "task_vector_cosine_similarity": 0.06720072776079178,
          "task_vector_l2_distance": -0.016386637464165688,
          "task_vector_dot_product": 0.003438910935074091,
          "weight_space_angle": 0.07596874982118607,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.013472088612616062,
          "subspace_overlap": 0.0020979621913284063,
          "right_subspace_overlap": -0.001881149597465992,
          "activation_l2_distance": 0.0032352495472878218,
          "activation_cosine_similarity": 0.0020418688654899597,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.003925414755940437,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0016636503860354424,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.008189854212105274,
          "input_gradient_l2_distance": -0.019374370574951172,
          "input_gradient_dot_product": -0.0016997616039589047
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  }
}