{
  "aggregate_metrics": {
    "train_r": 0.5290633709942661,
    "train_p": 6.587689925154428e-232,
    "val_r": 0.4294298914784088,
    "val_p": 1.6974690095593796e-17
  },
  "per_fold_stats": {
    "train_r_mean": 0.7316460138260129,
    "train_r_std": 0.05502860076223991,
    "val_r_mean": 0.650375420419637,
    "val_r_std": 0.14850503398965997,
    "n_nonzero_mean": 15.85,
    "n_nonzero_std": 3.9404948927767944
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.005235358141362667,
    "right_subspace_overlap_bottom_k": -0.010832762345671654,
    "interaction_matrix_overlap_top_k": 0.0016651041805744171,
    "interaction_matrix_overlap_bottom_k": -0.0008830794831737876,
    "effective_rank": 0.0003325382713228464,
    "effective_rank_mergeability_score": -0.0001228251203428954,
    "stable_rank": 6.782588025089353e-05,
    "spectral_gap": -0.0005311515415087342,
    "singular_value_ratio": 0.0003939929883927107,
    "layerwise_effective_rank": -0.00048267710371874273,
    "layerwise_effective_rank_mergeability_score": 0.0003646916593424976,
    "task_vector_cosine_similarity": 7.832822302589193e-05,
    "task_vector_l2_distance": -0.0005659348680637777,
    "task_vector_dot_product": 0.0007299001445062459,
    "weight_space_angle": -0.000987150939181447,
    "task_vector_magnitude_ratio": 0.00042212969856336713,
    "singular_value_overlap": 0.004108462482690811,
    "subspace_overlap": 0.00041928552673198283,
    "right_subspace_overlap": 0.005432952661067247,
    "activation_l2_distance": -0.0009091203100979328,
    "activation_cosine_similarity": 0.0077171288430690765,
    "activation_magnitude_ratio": -0.0011999184498563409,
    "activation_dot_product": 0.0035313882399350405,
    "encoder_gradient_cosine_similarity": 0.0014940901892259717,
    "encoder_gradient_l2_distance": -0.015350237488746643,
    "encoder_gradient_dot_product": 0.0003060023591388017,
    "input_gradient_cosine_similarity": 0.00032560410909354687,
    "input_gradient_l2_distance": -0.010015105828642845,
    "input_gradient_dot_product": -0.0013603048864752054
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.0025316071696579456,
    "right_subspace_overlap_bottom_k": 0.0025025370996445417,
    "interaction_matrix_overlap_top_k": 0.002434283262118697,
    "interaction_matrix_overlap_bottom_k": 0.002186831785365939,
    "effective_rank": 0.0007700594724155962,
    "effective_rank_mergeability_score": 0.000755267683416605,
    "stable_rank": 0.0006573242135345936,
    "spectral_gap": 0.0010597172658890486,
    "singular_value_ratio": 0.0010648672468960285,
    "layerwise_effective_rank": 0.0012403368018567562,
    "layerwise_effective_rank_mergeability_score": 0.0006352490745484829,
    "task_vector_cosine_similarity": 0.00154915452003479,
    "task_vector_l2_distance": 0.0014877647627145052,
    "task_vector_dot_product": 0.002485217759385705,
    "weight_space_angle": 0.002037431811913848,
    "task_vector_magnitude_ratio": 0.0010192285990342498,
    "singular_value_overlap": 0.0018658811459317803,
    "subspace_overlap": 0.0012871354119852185,
    "right_subspace_overlap": 0.002553565427660942,
    "activation_l2_distance": 0.001669451710768044,
    "activation_cosine_similarity": 0.0034852251410484314,
    "activation_magnitude_ratio": 0.0014418908394873142,
    "activation_dot_product": 0.004725202452391386,
    "encoder_gradient_cosine_similarity": 0.0017557725077494979,
    "encoder_gradient_l2_distance": 0.004913958255201578,
    "encoder_gradient_dot_product": 0.0012090642703697085,
    "input_gradient_cosine_similarity": 0.0012937994906678796,
    "input_gradient_l2_distance": 0.005296805873513222,
    "input_gradient_dot_product": 0.0018615596927702427
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.9,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.4,
    "interaction_matrix_overlap_bottom_k": 0.5,
    "effective_rank": 0.2,
    "effective_rank_mergeability_score": 0.15,
    "stable_rank": 0.15,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.4,
    "layerwise_effective_rank": 0.4,
    "layerwise_effective_rank_mergeability_score": 0.25,
    "task_vector_cosine_similarity": 0.45,
    "task_vector_l2_distance": 0.4,
    "task_vector_dot_product": 0.55,
    "weight_space_angle": 0.6,
    "task_vector_magnitude_ratio": 0.2,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.35,
    "right_subspace_overlap": 0.95,
    "activation_l2_distance": 0.55,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.6,
    "activation_dot_product": 0.7,
    "encoder_gradient_cosine_similarity": 0.6,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.45,
    "input_gradient_cosine_similarity": 0.35,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.4
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7460757587703115,
      "val_r": 0.48473623878417865,
      "n_iterations": 227,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004939467180520296,
        "right_subspace_overlap_bottom_k": -0.007220138795673847,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0025594111066311598,
        "task_vector_dot_product": -0.002209023805335164,
        "weight_space_angle": -0.0025507966056466103,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.00348083907738328,
        "subspace_overlap": 0.003922568634152412,
        "right_subspace_overlap": 0.0050598266534507275,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.01447668019682169,
        "activation_magnitude_ratio": -0.002844018628820777,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0020093382336199284,
        "encoder_gradient_l2_distance": -0.022952958941459656,
        "encoder_gradient_dot_product": -0.00286259688436985,
        "input_gradient_cosine_similarity": -0.0028334783855825663,
        "input_gradient_l2_distance": -0.013292110525071621,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7431747476565332,
      "val_r": 0.7804530490476721,
      "n_iterations": 180,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0035942397080361843,
        "right_subspace_overlap_bottom_k": -0.00939579401165247,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.001015659305267036,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0011777296895161271,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0010044265072792768,
        "weight_space_angle": -0.0012046193005517125,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.003189152805134654,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.008194162510335445,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.008832637220621109,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.015373100526630878,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.006413559895008802,
        "input_gradient_dot_product": -0.0033504543825984
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7604816933891827,
      "val_r": 0.8110674944810811,
      "n_iterations": 218,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006120740901678801,
        "right_subspace_overlap_bottom_k": -0.01195450872182846,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.0010650078766047955,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0020519935060292482,
        "layerwise_effective_rank_mergeability_score": 0.0016661378322169185,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0020138034597039223,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0017866939306259155,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.00539473257958889,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0045649269595742226,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.007271338254213333,
        "activation_magnitude_ratio": -0.001256838208064437,
        "activation_dot_product": 0.006512367632240057,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.016992513090372086,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.013374474830925465,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.752049902992376,
      "val_r": 0.7202556824916212,
      "n_iterations": 304,
      "n_nonzero_coefficients": 10,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0054786959663033485,
        "right_subspace_overlap_bottom_k": -0.010535621084272861,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.004943337291479111,
        "subspace_overlap": -0.0020071298349648714,
        "right_subspace_overlap": 0.005949452985078096,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.007012778427451849,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0020752977579832077,
        "encoder_gradient_cosine_similarity": 0.0013209140161052346,
        "encoder_gradient_l2_distance": -0.01645980402827263,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.00861264392733574,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7349801363184286,
      "val_r": 0.7372228405363558,
      "n_iterations": 184,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009308171458542347,
        "right_subspace_overlap_bottom_k": -0.014870303682982922,
        "interaction_matrix_overlap_top_k": 0.0054614427499473095,
        "interaction_matrix_overlap_bottom_k": -0.0017879446968436241,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0012369519099593163,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.002450081519782543,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0017862844979390502,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.007453626021742821,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.008754932321608067,
        "activation_l2_distance": -0.001295741181820631,
        "activation_cosine_similarity": 0.015863271430134773,
        "activation_magnitude_ratio": 0.0011747080134227872,
        "activation_dot_product": 0.0047609745524823666,
        "encoder_gradient_cosine_similarity": -0.0014121863059699535,
        "encoder_gradient_l2_distance": -0.028998691588640213,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002215879037976265,
        "input_gradient_l2_distance": -0.02459561452269554,
        "input_gradient_dot_product": -0.0023965928703546524
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7292148630851963,
      "val_r": 0.7314106386995965,
      "n_iterations": 297,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0045795077458024025,
        "right_subspace_overlap_bottom_k": -0.005825150292366743,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.002606799826025963,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.001008512219414115,
        "singular_value_ratio": -0.001213743700645864,
        "layerwise_effective_rank": -0.0016066060634329915,
        "layerwise_effective_rank_mergeability_score": 0.0013138847425580025,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0012097735889256,
        "task_vector_dot_product": -0.0019158790819346905,
        "weight_space_angle": -0.0022879389580339193,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0015955627895891666,
        "subspace_overlap": 0.0017552158096805215,
        "right_subspace_overlap": 0.001700956141576171,
        "activation_l2_distance": -0.0027789354790002108,
        "activation_cosine_similarity": 0.005284746177494526,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.00309855118393898,
        "encoder_gradient_cosine_similarity": 0.002138867974281311,
        "encoder_gradient_l2_distance": -0.009617635048925877,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.006023216526955366,
        "input_gradient_dot_product": -0.0024902168661355972
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7590039882679394,
      "val_r": 0.6341496567882572,
      "n_iterations": 321,
      "n_nonzero_coefficients": 8,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0060069365426898,
        "right_subspace_overlap_bottom_k": -0.013125593774020672,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0010762521997094154,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0021653559524565935,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.002732814522460103,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.009675728157162666,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.014667442068457603,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005394076928496361,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6753080392378696,
      "val_r": 0.3939443361983645,
      "n_iterations": 173,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007171315606683493,
        "right_subspace_overlap_bottom_k": -0.008806966245174408,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0010602069087326527,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0010389171075075865,
        "stable_rank": 0.0,
        "spectral_gap": -0.001227633561939001,
        "singular_value_ratio": 0.001570333493873477,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0019516728352755308,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0019786013290286064,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.001015920890495181,
        "singular_value_overlap": 0.003128973999992013,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0059214564971625805,
        "activation_l2_distance": -0.002596492413431406,
        "activation_cosine_similarity": 0.006218931172043085,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.003019528230652213,
        "encoder_gradient_l2_distance": -0.014379989355802536,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.0011963710421696305,
        "input_gradient_l2_distance": -0.00852806307375431,
        "input_gradient_dot_product": -0.0023159547708928585
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.660273236056212,
      "val_r": 0.6455597208080806,
      "n_iterations": 216,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006770221516489983,
        "right_subspace_overlap_bottom_k": -0.012858601287007332,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.002035801764577627,
        "singular_value_ratio": 0.0021048691123723984,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0029965818393975496,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0017030219314619899,
        "singular_value_overlap": 0.0017089927569031715,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005365757271647453,
        "activation_l2_distance": 0.0017383540980517864,
        "activation_cosine_similarity": 0.006749924272298813,
        "activation_magnitude_ratio": -0.0027326056733727455,
        "activation_dot_product": 0.0037920381873846054,
        "encoder_gradient_cosine_similarity": 0.004246370401233435,
        "encoder_gradient_l2_distance": -0.012962661683559418,
        "encoder_gradient_dot_product": 0.002622943837195635,
        "input_gradient_cosine_similarity": 0.0026017569471150637,
        "input_gradient_l2_distance": -0.00827745534479618,
        "input_gradient_dot_product": -0.00621039979159832
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7552335115331923,
      "val_r": 0.557853500871393,
      "n_iterations": 287,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004682696424424648,
        "right_subspace_overlap_bottom_k": -0.01159114483743906,
        "interaction_matrix_overlap_top_k": 0.0011889422312378883,
        "interaction_matrix_overlap_bottom_k": 0.0010879866313189268,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.001543678343296051,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.003138749860227108,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.004656417295336723,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.0013633206253871322,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.0029800934717059135,
        "encoder_gradient_cosine_similarity": 0.0025913347490131855,
        "encoder_gradient_l2_distance": -0.00933835282921791,
        "encoder_gradient_dot_product": 0.002144918777048588,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0055945697240531445,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.756051162257753,
      "val_r": 0.26695617854928194,
      "n_iterations": 350,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004557818174362183,
        "right_subspace_overlap_bottom_k": -0.009406044147908688,
        "interaction_matrix_overlap_top_k": 0.003145844442769885,
        "interaction_matrix_overlap_bottom_k": -0.0011672705877572298,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.00141719460953027,
        "layerwise_effective_rank": 0.0014049762394279242,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0011936649680137634,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0012890321668237448,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005993725266307592,
        "subspace_overlap": 0.0010023625800386071,
        "right_subspace_overlap": 0.006631241180002689,
        "activation_l2_distance": -0.003064910415560007,
        "activation_cosine_similarity": 0.008076783269643784,
        "activation_magnitude_ratio": -0.0026194611564278603,
        "activation_dot_product": 0.0052791316993534565,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.012232553213834763,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01111050695180893,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7576353308911983,
      "val_r": 0.7356917474630699,
      "n_iterations": 357,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004123079590499401,
        "right_subspace_overlap_bottom_k": -0.008891246281564236,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.002129010856151581,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.002028773771598935,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0019540912471711636,
        "subspace_overlap": 0.0017753047868609428,
        "right_subspace_overlap": 0.006810033228248358,
        "activation_l2_distance": -0.0024834293872117996,
        "activation_cosine_similarity": 0.006169133819639683,
        "activation_magnitude_ratio": -0.0013178146909922361,
        "activation_dot_product": 0.0010433838469907641,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013001257553696632,
        "encoder_gradient_dot_product": 0.0011763419024646282,
        "input_gradient_cosine_similarity": 0.0034420976880937815,
        "input_gradient_l2_distance": -0.00807165540754795,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7489792048421116,
      "val_r": 0.7493075336029957,
      "n_iterations": 314,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0033433684147894382,
        "right_subspace_overlap_bottom_k": -0.011165331117808819,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0012483660830184817,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0015172016574069858,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.001431598560884595,
        "task_vector_cosine_similarity": 0.0013096145121380687,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0033218106254935265,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.006485395133495331,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.009267369285225868,
        "activation_magnitude_ratio": -0.001959618180990219,
        "activation_dot_product": 0.0014021615497767925,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.017170468345284462,
        "encoder_gradient_dot_product": -0.0019372347742319107,
        "input_gradient_cosine_similarity": 0.001201448030769825,
        "input_gradient_l2_distance": -0.01112083625048399,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5377582770860767,
      "val_r": 0.4545180145235257,
      "n_iterations": 262,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011149607598781586,
        "right_subspace_overlap_bottom_k": -0.00990502443164587,
        "interaction_matrix_overlap_top_k": 0.0074616242200136185,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.003157667350023985,
        "effective_rank_mergeability_score": -0.0029026686679571867,
        "stable_rank": 0.0020812556613236666,
        "spectral_gap": -0.003767079208046198,
        "singular_value_ratio": 0.003214651718735695,
        "layerwise_effective_rank": 0.001903551397845149,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.005001392215490341,
        "task_vector_l2_distance": 0.0027950459625571966,
        "task_vector_dot_product": 0.009356082417070866,
        "weight_space_angle": -0.007157469168305397,
        "task_vector_magnitude_ratio": 0.0042809690348804,
        "singular_value_overlap": 0.007266528904438019,
        "subspace_overlap": 0.0029837985057383776,
        "right_subspace_overlap": 0.012081893160939217,
        "activation_l2_distance": -0.001137584913522005,
        "activation_cosine_similarity": 0.008489669300615788,
        "activation_magnitude_ratio": -0.0047652823850512505,
        "activation_dot_product": 0.01236993819475174,
        "encoder_gradient_cosine_similarity": 0.004798866808414459,
        "encoder_gradient_l2_distance": -0.018957726657390594,
        "encoder_gradient_dot_product": 0.001275714486837387,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.014026942662894726,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7597432499781291,
      "val_r": 0.7394650596511906,
      "n_iterations": 181,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00690007209777832,
        "right_subspace_overlap_bottom_k": -0.011490773409605026,
        "interaction_matrix_overlap_top_k": 0.0010332392994314432,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0014850833686068654,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0014479949604719877,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.001054266351275146,
        "task_vector_l2_distance": 0.0010047310497611761,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0017555209342390299,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005127580836415291,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.004009398631751537,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.00920871365815401,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0017853295430541039,
        "encoder_gradient_l2_distance": -0.011040212586522102,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005136732943356037,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7640989126705746,
      "val_r": 0.8681077669167268,
      "n_iterations": 350,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0052687544375658035,
        "right_subspace_overlap_bottom_k": -0.013051792979240417,
        "interaction_matrix_overlap_top_k": 0.004647812806069851,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.003247868036851287,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0013358163414523005,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0022499042097479105,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0029793584253638983,
        "activation_l2_distance": -0.0022592961322516203,
        "activation_cosine_similarity": 0.00599423423409462,
        "activation_magnitude_ratio": -0.002724143210798502,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.014950891956686974,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.003796098753809929,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7146031115713901,
      "val_r": 0.753077431902018,
      "n_iterations": 437,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.013017037883400917,
        "interaction_matrix_overlap_top_k": 0.00455487472936511,
        "interaction_matrix_overlap_bottom_k": 0.0012555464636534452,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0023569315671920776,
        "layerwise_effective_rank_mergeability_score": 0.0015539610758423805,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.004309171810746193,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005831524264067411,
        "activation_l2_distance": 0.0021884050220251083,
        "activation_cosine_similarity": 0.009779260493814945,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0027379710227251053,
        "encoder_gradient_cosine_similarity": 0.0023660052102059126,
        "encoder_gradient_l2_distance": -0.00800544023513794,
        "encoder_gradient_dot_product": 0.0012091356329619884,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.004753232467919588,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7220802925535983,
      "val_r": 0.6434840876742607,
      "n_iterations": 271,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006509613711386919,
        "right_subspace_overlap_bottom_k": -0.01594272069633007,
        "interaction_matrix_overlap_top_k": 0.005808302666991949,
        "interaction_matrix_overlap_bottom_k": -0.003455009311437607,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0018468741327524185,
        "singular_value_ratio": 0.0012419933918863535,
        "layerwise_effective_rank": -0.0023817671462893486,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0028062118217349052,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0029173349030315876,
        "weight_space_angle": -0.003702213056385517,
        "task_vector_magnitude_ratio": 0.001442682114429772,
        "singular_value_overlap": 0.007330550812184811,
        "subspace_overlap": -0.0010464100632816553,
        "right_subspace_overlap": 0.004426212050020695,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0060499911196529865,
        "activation_magnitude_ratio": -0.0025129884015768766,
        "activation_dot_product": 0.011490955948829651,
        "encoder_gradient_cosine_similarity": 0.0021580432076007128,
        "encoder_gradient_l2_distance": -0.016636764630675316,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01774664968252182,
        "input_gradient_dot_product": -0.00476971548050642
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7351809694584512,
      "val_r": 0.5833262940307162,
      "n_iterations": 294,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0042028664611279964,
        "right_subspace_overlap_bottom_k": -0.007776312530040741,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.001080938964150846,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0010913594160228968,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0027095999103039503,
        "weight_space_angle": 0.0012956801801919937,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.002908392809331417,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.006503301206976175,
        "activation_l2_distance": -0.0016216569347307086,
        "activation_cosine_similarity": 0.007539503276348114,
        "activation_magnitude_ratio": -0.0012523403856903315,
        "activation_dot_product": 0.002856090199202299,
        "encoder_gradient_cosine_similarity": 0.004859393462538719,
        "encoder_gradient_l2_distance": -0.011652067303657532,
        "encoder_gradient_dot_product": 0.0010148773435503244,
        "input_gradient_cosine_similarity": 0.0010807502549141645,
        "input_gradient_l2_distance": -0.0064039211720228195,
        "input_gradient_dot_product": -0.00240437313914299
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8209938879037342,
      "val_r": 0.7169211353723542,
      "n_iterations": 409,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.009825140237808228,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.008854287676513195,
        "effective_rank": 0.0012290726881474257,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0018009901978075504,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0015363773563876748,
        "layerwise_effective_rank": -0.0031167762354016304,
        "layerwise_effective_rank_mergeability_score": 0.0013282508589327335,
        "task_vector_cosine_similarity": 0.0021431329660117626,
        "task_vector_l2_distance": -0.003637536196038127,
        "task_vector_dot_product": -0.00160032301209867,
        "weight_space_angle": -0.0030120969749987125,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005508167203515768,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.004871118348091841,
        "activation_cosine_similarity": 0.003745216177776456,
        "activation_magnitude_ratio": -0.0011879679514095187,
        "activation_dot_product": 0.01618899032473564,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.021614206954836845,
        "encoder_gradient_dot_product": 0.0014759463956579566,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.018029779195785522,
        "input_gradient_dot_product": -0.0032683927565813065
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}