{
  "aggregate_metrics": {
    "train_r": 0.5732672128184724,
    "train_p": 6.202093137380893e-281,
    "val_r": 0.5141345528513949,
    "val_p": 1.5158152437614106e-25
  },
  "per_fold_stats": {
    "train_r_mean": 0.725547515382024,
    "train_r_std": 0.026382606463823222,
    "val_r_mean": 0.5614779613604306,
    "val_r_std": 0.17210797669719335,
    "n_nonzero_mean": 24.65,
    "n_nonzero_std": 2.1277922830953213
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.007256903685629368,
    "right_subspace_overlap_bottom_k": -0.006256594322621822,
    "interaction_matrix_overlap_top_k": 0.0023141668643802404,
    "interaction_matrix_overlap_bottom_k": -5.2033381507499143e-05,
    "effective_rank": 0.050724614411592484,
    "effective_rank_mergeability_score": 0.03915776312351227,
    "stable_rank": 0.00378103693947196,
    "spectral_gap": 0.040649522095918655,
    "singular_value_ratio": 0.038104742765426636,
    "layerwise_effective_rank": 0.04318822920322418,
    "layerwise_effective_rank_mergeability_score": 0.06268628686666489,
    "task_vector_cosine_similarity": 0.07740236818790436,
    "task_vector_l2_distance": -0.0037744524888694286,
    "task_vector_dot_product": 0.0021373070776462555,
    "weight_space_angle": 0.09100255370140076,
    "task_vector_magnitude_ratio": 0.0020202784799039364,
    "singular_value_overlap": 0.0004897821927443147,
    "subspace_overlap": 0.0039537991397082806,
    "right_subspace_overlap": 0.006161978468298912,
    "activation_l2_distance": 0.019640948623418808,
    "activation_cosine_similarity": 0.02699042297899723,
    "activation_magnitude_ratio": -0.0006416704854927957,
    "activation_dot_product": 0.002063560765236616,
    "encoder_gradient_cosine_similarity": 0.004193493165075779,
    "encoder_gradient_l2_distance": -0.014128519222140312,
    "encoder_gradient_dot_product": 0.0024707228876650333,
    "input_gradient_cosine_similarity": 0.0035860624630004168,
    "input_gradient_l2_distance": -0.013320401310920715,
    "input_gradient_dot_product": -0.0005674147978425026
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.003232428105548024,
    "right_subspace_overlap_bottom_k": 0.0028295996598899364,
    "interaction_matrix_overlap_top_k": 0.0017639865400269628,
    "interaction_matrix_overlap_bottom_k": 0.0009884311584755778,
    "effective_rank": 0.013661222532391548,
    "effective_rank_mergeability_score": 0.013331720605492592,
    "stable_rank": 0.006728705950081348,
    "spectral_gap": 0.00991460494697094,
    "singular_value_ratio": 0.01055691484361887,
    "layerwise_effective_rank": 0.011544610373675823,
    "layerwise_effective_rank_mergeability_score": 0.015954403206706047,
    "task_vector_cosine_similarity": 0.01015794649720192,
    "task_vector_l2_distance": 0.0028690630570054054,
    "task_vector_dot_product": 0.0017767813988029957,
    "weight_space_angle": 0.012260559014976025,
    "task_vector_magnitude_ratio": 0.001797739416360855,
    "singular_value_overlap": 0.0010779222939163446,
    "subspace_overlap": 0.0030988906510174274,
    "right_subspace_overlap": 0.0036388146691024303,
    "activation_l2_distance": 0.009562560357153416,
    "activation_cosine_similarity": 0.010763346217572689,
    "activation_magnitude_ratio": 0.0013862296473234892,
    "activation_dot_product": 0.0027211711276322603,
    "encoder_gradient_cosine_similarity": 0.0016030835686251521,
    "encoder_gradient_l2_distance": 0.003162519307807088,
    "encoder_gradient_dot_product": 0.0017200745642185211,
    "input_gradient_cosine_similarity": 0.0026457614731043577,
    "input_gradient_l2_distance": 0.004842014517635107,
    "input_gradient_dot_product": 0.0013075278839096427
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.95,
    "right_subspace_overlap_bottom_k": 0.95,
    "interaction_matrix_overlap_top_k": 0.8,
    "interaction_matrix_overlap_bottom_k": 0.35,
    "effective_rank": 1.0,
    "effective_rank_mergeability_score": 1.0,
    "stable_rank": 0.75,
    "spectral_gap": 1.0,
    "singular_value_ratio": 1.0,
    "layerwise_effective_rank": 1.0,
    "layerwise_effective_rank_mergeability_score": 1.0,
    "task_vector_cosine_similarity": 1.0,
    "task_vector_l2_distance": 0.9,
    "task_vector_dot_product": 0.75,
    "weight_space_angle": 1.0,
    "task_vector_magnitude_ratio": 0.7,
    "singular_value_overlap": 0.6,
    "subspace_overlap": 0.9,
    "right_subspace_overlap": 0.9,
    "activation_l2_distance": 1.0,
    "activation_cosine_similarity": 0.95,
    "activation_magnitude_ratio": 0.3,
    "activation_dot_product": 0.65,
    "encoder_gradient_cosine_similarity": 1.0,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.8,
    "input_gradient_cosine_similarity": 0.9,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.5
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7299705056590243,
      "val_r": 0.5551635884900401,
      "n_iterations": 286,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010652112774550915,
        "right_subspace_overlap_bottom_k": -0.003294107737019658,
        "interaction_matrix_overlap_top_k": 0.002259379019960761,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.03700217977166176,
        "effective_rank_mergeability_score": 0.03944568708539009,
        "stable_rank": 0.0035182505380362272,
        "spectral_gap": 0.034511685371398926,
        "singular_value_ratio": 0.029475906863808632,
        "layerwise_effective_rank": 0.03159857913851738,
        "layerwise_effective_rank_mergeability_score": 0.03871572017669678,
        "task_vector_cosine_similarity": 0.09456640481948853,
        "task_vector_l2_distance": -0.010124141350388527,
        "task_vector_dot_product": 0.004792379215359688,
        "weight_space_angle": 0.12145605683326721,
        "task_vector_magnitude_ratio": 0.006178956013172865,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.005327718332409859,
        "right_subspace_overlap": 0.011404250748455524,
        "activation_l2_distance": 0.02828570082783699,
        "activation_cosine_similarity": 0.04101958125829697,
        "activation_magnitude_ratio": -0.004440027289092541,
        "activation_dot_product": 0.005319193471223116,
        "encoder_gradient_cosine_similarity": 0.008160467259585857,
        "encoder_gradient_l2_distance": -0.021943191066384315,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.011319334618747234,
        "input_gradient_l2_distance": -0.02481919154524803,
        "input_gradient_dot_product": 0.0026031741872429848
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7071004946409631,
      "val_r": 0.5889615569174086,
      "n_iterations": 412,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.013867753557860851,
        "right_subspace_overlap_bottom_k": -0.006684088613837957,
        "interaction_matrix_overlap_top_k": 0.0021539817098528147,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.05782417953014374,
        "effective_rank_mergeability_score": 0.04128323867917061,
        "stable_rank": 0.001700354041531682,
        "spectral_gap": 0.036437876522541046,
        "singular_value_ratio": 0.03441515937447548,
        "layerwise_effective_rank": 0.04424477368593216,
        "layerwise_effective_rank_mergeability_score": 0.06413581967353821,
        "task_vector_cosine_similarity": 0.07208438962697983,
        "task_vector_l2_distance": -0.004073963034898043,
        "task_vector_dot_product": 0.0038360124453902245,
        "weight_space_angle": 0.08899416029453278,
        "task_vector_magnitude_ratio": 0.00116393540520221,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.00506768561899662,
        "right_subspace_overlap": 0.008391750045120716,
        "activation_l2_distance": 0.023534148931503296,
        "activation_cosine_similarity": 0.031987790018320084,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.00395481800660491,
        "encoder_gradient_l2_distance": -0.014683985151350498,
        "encoder_gradient_dot_product": 0.004922904074192047,
        "input_gradient_cosine_similarity": 0.001357418135739863,
        "input_gradient_l2_distance": -0.013432914391160011,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7055792046488323,
      "val_r": 0.680066734510155,
      "n_iterations": 331,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010123279877007008,
        "right_subspace_overlap_bottom_k": -0.004662083927541971,
        "interaction_matrix_overlap_top_k": 0.002997229341417551,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.07364872843027115,
        "effective_rank_mergeability_score": 0.05758683383464813,
        "stable_rank": 0.006648491136729717,
        "spectral_gap": 0.03624473884701729,
        "singular_value_ratio": 0.03198671713471413,
        "layerwise_effective_rank": 0.029955608770251274,
        "layerwise_effective_rank_mergeability_score": 0.05991050601005554,
        "task_vector_cosine_similarity": 0.07075385749340057,
        "task_vector_l2_distance": -0.0023899273946881294,
        "task_vector_dot_product": 0.0036671538837254047,
        "weight_space_angle": 0.0811660885810852,
        "task_vector_magnitude_ratio": 0.001374998944811523,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.004944056738168001,
        "right_subspace_overlap": 0.009518186561763287,
        "activation_l2_distance": 0.018263675272464752,
        "activation_cosine_similarity": 0.027491802349686623,
        "activation_magnitude_ratio": -0.0021524359472095966,
        "activation_dot_product": 0.004190477076917887,
        "encoder_gradient_cosine_similarity": 0.0031634115148335695,
        "encoder_gradient_l2_distance": -0.011382377706468105,
        "encoder_gradient_dot_product": 0.0023106071166694164,
        "input_gradient_cosine_similarity": 0.0023047160357236862,
        "input_gradient_l2_distance": -0.013926905579864979,
        "input_gradient_dot_product": -0.0024718751665204763
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7113545088731207,
      "val_r": 0.6321037868009347,
      "n_iterations": 265,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009817564859986305,
        "right_subspace_overlap_bottom_k": -0.003275918308645487,
        "interaction_matrix_overlap_top_k": 0.0052430639043450356,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.07277730107307434,
        "effective_rank_mergeability_score": 0.055337853729724884,
        "stable_rank": 0.003879319177940488,
        "spectral_gap": 0.04953338950872421,
        "singular_value_ratio": 0.04872004687786102,
        "layerwise_effective_rank": 0.013371269218623638,
        "layerwise_effective_rank_mergeability_score": 0.043116092681884766,
        "task_vector_cosine_similarity": 0.05486813932657242,
        "task_vector_l2_distance": -0.0037829638458788395,
        "task_vector_dot_product": 0.0029809807892888784,
        "weight_space_angle": 0.07801777124404907,
        "task_vector_magnitude_ratio": 0.004383991938084364,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0026108170859515667,
        "right_subspace_overlap": 0.00773673877120018,
        "activation_l2_distance": 0.027388855814933777,
        "activation_cosine_similarity": 0.0369512103497982,
        "activation_magnitude_ratio": 0.0011216300772503018,
        "activation_dot_product": 0.004714303649961948,
        "encoder_gradient_cosine_similarity": 0.004861517809331417,
        "encoder_gradient_l2_distance": -0.017323369160294533,
        "encoder_gradient_dot_product": 0.005021573044359684,
        "input_gradient_cosine_similarity": 0.006020974833518267,
        "input_gradient_l2_distance": -0.02470904402434826,
        "input_gradient_dot_product": -0.001774105243384838
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.728181791137263,
      "val_r": 0.6920051601907778,
      "n_iterations": 328,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009020921774208546,
        "right_subspace_overlap_bottom_k": -0.006064691115170717,
        "interaction_matrix_overlap_top_k": 0.0016289276536554098,
        "interaction_matrix_overlap_bottom_k": 0.0012105291243642569,
        "effective_rank": 0.05067787319421768,
        "effective_rank_mergeability_score": 0.03619230538606644,
        "stable_rank": 0.0,
        "spectral_gap": 0.03846118226647377,
        "singular_value_ratio": 0.035251911729574203,
        "layerwise_effective_rank": 0.04365047067403793,
        "layerwise_effective_rank_mergeability_score": 0.06086773797869682,
        "task_vector_cosine_similarity": 0.0942806527018547,
        "task_vector_l2_distance": -0.006310341879725456,
        "task_vector_dot_product": 0.0015132722910493612,
        "weight_space_angle": 0.103736013174057,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.004419977776706219,
        "right_subspace_overlap": 0.0049092997796833515,
        "activation_l2_distance": 0.014453105628490448,
        "activation_cosine_similarity": 0.021731138229370117,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0033211386762559414,
        "encoder_gradient_cosine_similarity": 0.0030149894300848246,
        "encoder_gradient_l2_distance": -0.01381415594369173,
        "encoder_gradient_dot_product": 0.0019237210508435965,
        "input_gradient_cosine_similarity": 0.004849226213991642,
        "input_gradient_l2_distance": -0.013469822704792023,
        "input_gradient_dot_product": -0.0018117236904799938
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.749197238381563,
      "val_r": 0.7219357464278046,
      "n_iterations": 347,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00885577592998743,
        "right_subspace_overlap_bottom_k": -0.005592481233179569,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0012584580108523369,
        "effective_rank": 0.04768598452210426,
        "effective_rank_mergeability_score": 0.03396258130669594,
        "stable_rank": 0.001156987389549613,
        "spectral_gap": 0.06069417670369148,
        "singular_value_ratio": 0.05896078422665596,
        "layerwise_effective_rank": 0.04953683167695999,
        "layerwise_effective_rank_mergeability_score": 0.0651233047246933,
        "task_vector_cosine_similarity": 0.07261301577091217,
        "task_vector_l2_distance": -0.002041037194430828,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.08311732113361359,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0034951562993228436,
        "right_subspace_overlap": 0.0021572187542915344,
        "activation_l2_distance": 0.008105498738586903,
        "activation_cosine_similarity": 0.017522120848298073,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0034186793491244316,
        "encoder_gradient_l2_distance": -0.013241183944046497,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002440276090055704,
        "input_gradient_l2_distance": -0.006760688964277506,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7245383501916309,
      "val_r": 0.4208170732507355,
      "n_iterations": 205,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006499932613223791,
        "right_subspace_overlap_bottom_k": -0.012533307075500488,
        "interaction_matrix_overlap_top_k": 0.006639027968049049,
        "interaction_matrix_overlap_bottom_k": -0.001488225650973618,
        "effective_rank": 0.05117232725024223,
        "effective_rank_mergeability_score": 0.029254069551825523,
        "stable_rank": 0.002105854917317629,
        "spectral_gap": 0.04939967766404152,
        "singular_value_ratio": 0.04415871948003769,
        "layerwise_effective_rank": 0.04128403961658478,
        "layerwise_effective_rank_mergeability_score": 0.0727430135011673,
        "task_vector_cosine_similarity": 0.0677800104022026,
        "task_vector_l2_distance": -0.0027355521451681852,
        "task_vector_dot_product": 0.0013631765032187104,
        "weight_space_angle": 0.0762789398431778,
        "task_vector_magnitude_ratio": 0.004344502929598093,
        "singular_value_overlap": 0.0014708263333886862,
        "subspace_overlap": 0.004648478236049414,
        "right_subspace_overlap": 0.005028815474361181,
        "activation_l2_distance": 0.02196209691464901,
        "activation_cosine_similarity": 0.040095627307891846,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.0016576119232922792,
        "encoder_gradient_cosine_similarity": 0.006334634032100439,
        "encoder_gradient_l2_distance": -0.019557688385248184,
        "encoder_gradient_dot_product": 0.003772786818444729,
        "input_gradient_cosine_similarity": 0.0016023452626541257,
        "input_gradient_l2_distance": -0.011473692953586578,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6831339764476685,
      "val_r": 0.3496532596433283,
      "n_iterations": 396,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010775959119200706,
        "right_subspace_overlap_bottom_k": -0.007329413201659918,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.060134872794151306,
        "effective_rank_mergeability_score": 0.04132317379117012,
        "stable_rank": 0.0027781426906585693,
        "spectral_gap": 0.04795496165752411,
        "singular_value_ratio": 0.04665835201740265,
        "layerwise_effective_rank": 0.0365806519985199,
        "layerwise_effective_rank_mergeability_score": 0.05950561538338661,
        "task_vector_cosine_similarity": 0.07150042057037354,
        "task_vector_l2_distance": -0.005150907672941685,
        "task_vector_dot_product": 0.002233077073469758,
        "weight_space_angle": 0.07849389314651489,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0016325224423781037,
        "subspace_overlap": 0.005358985159546137,
        "right_subspace_overlap": 0.00706941494718194,
        "activation_l2_distance": 0.018950868397951126,
        "activation_cosine_similarity": 0.024815429002046585,
        "activation_magnitude_ratio": -0.0012112482218071818,
        "activation_dot_product": 0.002350347116589546,
        "encoder_gradient_cosine_similarity": 0.006919724866747856,
        "encoder_gradient_l2_distance": -0.014672772958874702,
        "encoder_gradient_dot_product": 0.0030045686289668083,
        "input_gradient_cosine_similarity": 0.0021579754538834095,
        "input_gradient_l2_distance": -0.009181132540106773,
        "input_gradient_dot_product": 0.0015578812453895807
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7258136278333361,
      "val_r": 0.193291082363055,
      "n_iterations": 201,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004283341579139233,
        "right_subspace_overlap_bottom_k": -0.00772884814068675,
        "interaction_matrix_overlap_top_k": 0.0017044155392795801,
        "interaction_matrix_overlap_bottom_k": -0.0023219771683216095,
        "effective_rank": 0.027292540296912193,
        "effective_rank_mergeability_score": 0.05023341625928879,
        "stable_rank": 0.03198331221938133,
        "spectral_gap": 0.030010459944605827,
        "singular_value_ratio": 0.029209697619080544,
        "layerwise_effective_rank": 0.041181936860084534,
        "layerwise_effective_rank_mergeability_score": 0.05997186899185181,
        "task_vector_cosine_similarity": 0.06898049265146255,
        "task_vector_l2_distance": -0.0028965198434889317,
        "task_vector_dot_product": 0.004516848362982273,
        "weight_space_angle": 0.08559219539165497,
        "task_vector_magnitude_ratio": 0.002659840974956751,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.001191380200907588,
        "right_subspace_overlap": 0.007424985058605671,
        "activation_l2_distance": 0.0222152266651392,
        "activation_cosine_similarity": 0.028552241623401642,
        "activation_magnitude_ratio": -0.0036570592783391476,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0052565596997737885,
        "encoder_gradient_l2_distance": -0.011828400194644928,
        "encoder_gradient_dot_product": 0.003923060372471809,
        "input_gradient_cosine_similarity": 0.004330417141318321,
        "input_gradient_l2_distance": -0.01604398898780346,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7108073235000623,
      "val_r": 0.48828662267240003,
      "n_iterations": 341,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009772106073796749,
        "right_subspace_overlap_bottom_k": -0.007681564893573523,
        "interaction_matrix_overlap_top_k": 0.004445794969797134,
        "interaction_matrix_overlap_bottom_k": 0.002536914311349392,
        "effective_rank": 0.044177085161209106,
        "effective_rank_mergeability_score": 0.028184935450553894,
        "stable_rank": 0.0,
        "spectral_gap": 0.05584338679909706,
        "singular_value_ratio": 0.05498843267560005,
        "layerwise_effective_rank": 0.06614251434803009,
        "layerwise_effective_rank_mergeability_score": 0.08969587087631226,
        "task_vector_cosine_similarity": 0.06498917192220688,
        "task_vector_l2_distance": -0.004360982216894627,
        "task_vector_dot_product": 0.0027566379867494106,
        "weight_space_angle": 0.08249451965093613,
        "task_vector_magnitude_ratio": 0.002895105630159378,
        "singular_value_overlap": -0.0013657500967383385,
        "subspace_overlap": 0.006597355008125305,
        "right_subspace_overlap": 0.00880658533424139,
        "activation_l2_distance": 0.0028157716151326895,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.001090307254344225,
        "encoder_gradient_cosine_similarity": 0.004044767003506422,
        "encoder_gradient_l2_distance": -0.014148646034300327,
        "encoder_gradient_dot_product": 0.00286905188113451,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.015989631414413452,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7491590790332391,
      "val_r": 0.16149619340693272,
      "n_iterations": 334,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003580225631594658,
        "right_subspace_overlap_bottom_k": -0.0037005734629929066,
        "interaction_matrix_overlap_top_k": 0.0016414023702964187,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.052388980984687805,
        "effective_rank_mergeability_score": 0.06353820860385895,
        "stable_rank": 0.0022920251358300447,
        "spectral_gap": 0.040667153894901276,
        "singular_value_ratio": 0.039712902158498764,
        "layerwise_effective_rank": 0.05258651077747345,
        "layerwise_effective_rank_mergeability_score": 0.04887818545103073,
        "task_vector_cosine_similarity": 0.08046378940343857,
        "task_vector_l2_distance": -0.00286734476685524,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.085660919547081,
        "task_vector_magnitude_ratio": 0.0021295950282365084,
        "singular_value_overlap": 0.0011859023943543434,
        "subspace_overlap": -0.0010612154146656394,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.007849869318306446,
        "activation_cosine_similarity": 0.01650463417172432,
        "activation_magnitude_ratio": -0.002494269050657749,
        "activation_dot_product": 0.0017175008542835712,
        "encoder_gradient_cosine_similarity": 0.002871408360078931,
        "encoder_gradient_l2_distance": -0.014033820480108261,
        "encoder_gradient_dot_product": 0.0011935359798371792,
        "input_gradient_cosine_similarity": 0.0023803813382983208,
        "input_gradient_l2_distance": -0.005103535018861294,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7367590044829082,
      "val_r": 0.691607793952778,
      "n_iterations": 415,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006424675229936838,
        "right_subspace_overlap_bottom_k": -0.008995573036372662,
        "interaction_matrix_overlap_top_k": 0.0024379827082157135,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.026882892474532127,
        "effective_rank_mergeability_score": 0.03828616067767143,
        "stable_rank": 0.003788462607190013,
        "spectral_gap": 0.044542767107486725,
        "singular_value_ratio": 0.03960946202278137,
        "layerwise_effective_rank": 0.034224070608615875,
        "layerwise_effective_rank_mergeability_score": 0.026538429781794548,
        "task_vector_cosine_similarity": 0.08403538167476654,
        "task_vector_l2_distance": -0.0017554882215335965,
        "task_vector_dot_product": 0.0064531187526881695,
        "weight_space_angle": 0.11107612401247025,
        "task_vector_magnitude_ratio": 0.0037926621735095978,
        "singular_value_overlap": 0.0010155412601307034,
        "subspace_overlap": 0.01168283261358738,
        "right_subspace_overlap": 0.0028327093459665775,
        "activation_l2_distance": 0.035810437053442,
        "activation_cosine_similarity": 0.039703696966171265,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.004968469496816397,
        "encoder_gradient_cosine_similarity": 0.004330002702772617,
        "encoder_gradient_l2_distance": -0.012670150958001614,
        "encoder_gradient_dot_product": 0.001106677227653563,
        "input_gradient_cosine_similarity": 0.006544434931129217,
        "input_gradient_l2_distance": -0.0149656031280756,
        "input_gradient_dot_product": -0.0014396619517356157
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7231181045808794,
      "val_r": 0.6376310909896931,
      "n_iterations": 411,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0071691726334393024,
        "right_subspace_overlap_bottom_k": -0.004026518203318119,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.049762338399887085,
        "effective_rank_mergeability_score": 0.023134469985961914,
        "stable_rank": 0.002570144599303603,
        "spectral_gap": 0.032864633947610855,
        "singular_value_ratio": 0.031697746366262436,
        "layerwise_effective_rank": 0.04698869213461876,
        "layerwise_effective_rank_mergeability_score": 0.07866466790437698,
        "task_vector_cosine_similarity": 0.07683892548084259,
        "task_vector_l2_distance": -0.0010176151990890503,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.07542300969362259,
        "task_vector_magnitude_ratio": 0.00143460463732481,
        "singular_value_overlap": 0.0015761996619403362,
        "subspace_overlap": 0.0011868771398440003,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.035300273448228836,
        "activation_cosine_similarity": 0.038404904305934906,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.005850032437592745,
        "encoder_gradient_l2_distance": -0.008640985935926437,
        "encoder_gradient_dot_product": 0.004176896996796131,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010863340459764004,
        "input_gradient_dot_product": -0.0023949421010911465
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7345959517145335,
      "val_r": 0.8346019441743311,
      "n_iterations": 422,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006611368618905544,
        "right_subspace_overlap_bottom_k": -0.007789508439600468,
        "interaction_matrix_overlap_top_k": 0.0034281667321920395,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.05076514184474945,
        "effective_rank_mergeability_score": 0.03879496827721596,
        "stable_rank": 0.0060572754591703415,
        "spectral_gap": 0.047896623611450195,
        "singular_value_ratio": 0.04877520352602005,
        "layerwise_effective_rank": 0.035315144807100296,
        "layerwise_effective_rank_mergeability_score": 0.058222390711307526,
        "task_vector_cosine_similarity": 0.08443621546030045,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.09493464976549149,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0015679971547797322,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.009885418228805065,
        "activation_l2_distance": 0.012172301299870014,
        "activation_cosine_similarity": 0.02029431238770485,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.003981086425483227,
        "encoder_gradient_cosine_similarity": 0.0028616259805858135,
        "encoder_gradient_l2_distance": -0.012313893996179104,
        "encoder_gradient_dot_product": 0.003093636129051447,
        "input_gradient_cosine_similarity": 0.0031083894427865744,
        "input_gradient_l2_distance": -0.011861108243465424,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7116389015059359,
      "val_r": 0.7562881368099804,
      "n_iterations": 254,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006249363999813795,
        "right_subspace_overlap_bottom_k": -0.008535921573638916,
        "interaction_matrix_overlap_top_k": 0.0010841813636943698,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.06465297937393188,
        "effective_rank_mergeability_score": 0.051063165068626404,
        "stable_rank": 0.00195146759506315,
        "spectral_gap": 0.032512202858924866,
        "singular_value_ratio": 0.03156299516558647,
        "layerwise_effective_rank": 0.04665611684322357,
        "layerwise_effective_rank_mergeability_score": 0.061853013932704926,
        "task_vector_cosine_similarity": 0.08450044691562653,
        "task_vector_l2_distance": -0.0025105876848101616,
        "task_vector_dot_product": 0.001296613598242402,
        "weight_space_angle": 0.09625956416130066,
        "task_vector_magnitude_ratio": 0.0017599457642063498,
        "singular_value_overlap": -0.0010646459413692355,
        "subspace_overlap": 0.003869944252073765,
        "right_subspace_overlap": 0.007312229368835688,
        "activation_l2_distance": 0.006970238406211138,
        "activation_cosine_similarity": 0.01615005172789097,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.002337832935154438,
        "encoder_gradient_cosine_similarity": 0.004626682493835688,
        "encoder_gradient_l2_distance": -0.015170182101428509,
        "encoder_gradient_dot_product": 0.002000346314162016,
        "input_gradient_cosine_similarity": 0.003516371129080653,
        "input_gradient_l2_distance": -0.015147886238992214,
        "input_gradient_dot_product": -0.0013156457571312785
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7310283359002613,
      "val_r": 0.5461072954188364,
      "n_iterations": 276,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007029427215456963,
        "right_subspace_overlap_bottom_k": -0.005796416196972132,
        "interaction_matrix_overlap_top_k": 0.004230639431625605,
        "interaction_matrix_overlap_bottom_k": -0.0010866487864404917,
        "effective_rank": 0.032814040780067444,
        "effective_rank_mergeability_score": 0.03050496242940426,
        "stable_rank": 0.0,
        "spectral_gap": 0.05485738068819046,
        "singular_value_ratio": 0.05152135342359543,
        "layerwise_effective_rank": 0.04109668731689453,
        "layerwise_effective_rank_mergeability_score": 0.05113707482814789,
        "task_vector_cosine_similarity": 0.07802028954029083,
        "task_vector_l2_distance": -0.009893644601106644,
        "task_vector_dot_product": 0.0022102310322225094,
        "weight_space_angle": 0.09446515142917633,
        "task_vector_magnitude_ratio": 0.0011394284665584564,
        "singular_value_overlap": 0.0019320063292980194,
        "subspace_overlap": 0.0011924590216949582,
        "right_subspace_overlap": 0.008616099134087563,
        "activation_l2_distance": 0.034257542341947556,
        "activation_cosine_similarity": 0.0387101024389267,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0027942790184170008,
        "encoder_gradient_l2_distance": -0.01421879231929779,
        "encoder_gradient_dot_product": 0.0021386086009442806,
        "input_gradient_cosine_similarity": 0.00272355112247169,
        "input_gradient_l2_distance": -0.01090907771140337,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6704255072323227,
      "val_r": 0.5395833185364547,
      "n_iterations": 276,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006258642300963402,
        "right_subspace_overlap_bottom_k": -0.004891207441687584,
        "interaction_matrix_overlap_top_k": 0.0016500517958775163,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.04531100019812584,
        "effective_rank_mergeability_score": 0.031877271831035614,
        "stable_rank": 0.002202631440013647,
        "spectral_gap": 0.034383270889520645,
        "singular_value_ratio": 0.0334654301404953,
        "layerwise_effective_rank": 0.04880528897047043,
        "layerwise_effective_rank_mergeability_score": 0.06560840457677841,
        "task_vector_cosine_similarity": 0.08698318898677826,
        "task_vector_l2_distance": -0.0034770960919559,
        "task_vector_dot_product": 0.0012794939102604985,
        "weight_space_angle": 0.10220761597156525,
        "task_vector_magnitude_ratio": 0.0040054405108094215,
        "singular_value_overlap": 0.0011496192310005426,
        "subspace_overlap": 0.006835200358182192,
        "right_subspace_overlap": 0.010720597580075264,
        "activation_l2_distance": 0.019971119239926338,
        "activation_cosine_similarity": 0.02650386095046997,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0014406373957172036,
        "encoder_gradient_cosine_similarity": 0.0031687559094280005,
        "encoder_gradient_l2_distance": -0.010347869247198105,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0012872666120529175,
        "input_gradient_l2_distance": -0.009889396838843822,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7396097423230633,
      "val_r": 0.5159454649370347,
      "n_iterations": 314,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012855667155236006,
        "right_subspace_overlap_bottom_k": -0.005225132219493389,
        "interaction_matrix_overlap_top_k": 0.0027609311509877443,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.04871590435504913,
        "effective_rank_mergeability_score": 0.009528874419629574,
        "stable_rank": 0.002988019958138466,
        "spectral_gap": 0.024532627314329147,
        "singular_value_ratio": 0.018939480185508728,
        "layerwise_effective_rank": 0.04204833135008812,
        "layerwise_effective_rank_mergeability_score": 0.0840551033616066,
        "task_vector_cosine_similarity": 0.0932852029800415,
        "task_vector_l2_distance": -0.0014866129495203495,
        "task_vector_dot_product": 0.0016974823083728552,
        "weight_space_angle": 0.10439832508563995,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0014498821692541242,
        "subspace_overlap": 0.009146506898105145,
        "right_subspace_overlap": 0.00539398193359375,
        "activation_l2_distance": 0.024206260219216347,
        "activation_cosine_similarity": 0.03488028794527054,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.003817114047706127,
        "encoder_gradient_l2_distance": -0.018565600737929344,
        "encoder_gradient_dot_product": 0.0057094828225672245,
        "input_gradient_cosine_similarity": 0.006263331975787878,
        "input_gradient_l2_distance": -0.015037929639220238,
        "input_gradient_dot_product": -0.001929338090121746
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.735643404448849,
      "val_r": 0.5093971085923642,
      "n_iterations": 316,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00686088390648365,
        "right_subspace_overlap_bottom_k": -0.011324544437229633,
        "interaction_matrix_overlap_top_k": 0.001978157553821802,
        "interaction_matrix_overlap_bottom_k": -0.0011497174855321646,
        "effective_rank": 0.04483836144208908,
        "effective_rank_mergeability_score": 0.025176847353577614,
        "stable_rank": 0.0,
        "spectral_gap": 0.026177864521741867,
        "singular_value_ratio": 0.022455738857388496,
        "layerwise_effective_rank": 0.06355030834674835,
        "layerwise_effective_rank_mergeability_score": 0.08990047127008438,
        "task_vector_cosine_similarity": 0.07297249883413315,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.09360288083553314,
        "task_vector_magnitude_ratio": 0.003142560599371791,
        "singular_value_overlap": 0.0023815371096134186,
        "subspace_overlap": 0.0025617722421884537,
        "right_subspace_overlap": 0.007538631092756987,
        "activation_l2_distance": 0.021655870601534843,
        "activation_cosine_similarity": 0.02583937533199787,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.00306151295080781,
        "encoder_gradient_l2_distance": -0.010373438708484173,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.003007507650181651,
        "input_gradient_l2_distance": -0.008336995728313923,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8032952551050219,
      "val_r": 0.7146162691235663,
      "n_iterations": 510,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.07596763223409653,
        "effective_rank_mergeability_score": 0.05844622105360031,
        "stable_rank": 0.0,
        "spectral_gap": 0.03546435385942459,
        "singular_value_ratio": 0.03052879497408867,
        "layerwise_effective_rank": 0.05494677647948265,
        "layerwise_effective_rank_mergeability_score": 0.0750824362039566,
        "task_vector_cosine_similarity": 0.07409486174583435,
        "task_vector_l2_distance": -0.00861432310193777,
        "task_vector_dot_product": 0.0021496654953807592,
        "weight_space_angle": 0.08267571032047272,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0015073411632329226,
        "activation_l2_distance": 0.008650130592286587,
        "activation_cosine_similarity": 0.01265023648738861,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.009678147733211517,
        "encoder_gradient_cosine_similarity": 0.0013588883448392153,
        "encoder_gradient_l2_distance": -0.01363985426723957,
        "encoder_gradient_dot_product": 0.002246994525194168,
        "input_gradient_cosine_similarity": 0.006507327780127525,
        "input_gradient_l2_distance": -0.014486150816082954,
        "input_gradient_dot_product": -0.002372058806940913
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}