{
  "aggregate_metrics": {
    "train_r": 0.36523958100052206,
    "train_p": 2.9692774409609538e-102,
    "val_r": 0.1133057721352425,
    "val_p": 0.03209265218512175
  },
  "per_fold_stats": {
    "train_r_mean": 0.5465391367599152,
    "train_r_std": 0.07820556430973429,
    "val_r_mean": 0.41989531015863346,
    "val_r_std": 0.1717412182174602,
    "n_nonzero_mean": 24.85,
    "n_nonzero_std": 2.4753787588973126
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0038630622439086437,
    "right_subspace_overlap_bottom_k": 0.0007589542656205595,
    "interaction_matrix_overlap_top_k": 0.0024459243286401033,
    "interaction_matrix_overlap_bottom_k": 0.011242149397730827,
    "effective_rank": 0.04197682812809944,
    "effective_rank_mergeability_score": 0.05645439028739929,
    "stable_rank": 0.010606127791106701,
    "spectral_gap": 0.054473478347063065,
    "singular_value_ratio": 0.04766102880239487,
    "layerwise_effective_rank": 0.05099276825785637,
    "layerwise_effective_rank_mergeability_score": 0.050280600786209106,
    "task_vector_cosine_similarity": 0.07598420232534409,
    "task_vector_l2_distance": -0.011571855284273624,
    "task_vector_dot_product": 0.0009202024666592479,
    "weight_space_angle": 0.08328479528427124,
    "task_vector_magnitude_ratio": 0.0009617680916562676,
    "singular_value_overlap": -0.005503048188984394,
    "subspace_overlap": 0.006451759487390518,
    "right_subspace_overlap": 0.0027673617005348206,
    "activation_l2_distance": 0.012015430256724358,
    "activation_cosine_similarity": 0.014312486164271832,
    "activation_magnitude_ratio": 0.00025082993670366704,
    "activation_dot_product": 0.004850971978157759,
    "encoder_gradient_cosine_similarity": 0.002875309204682708,
    "encoder_gradient_l2_distance": -0.011458508670330048,
    "encoder_gradient_dot_product": 0.003672781167551875,
    "input_gradient_cosine_similarity": 0.00384212052449584,
    "input_gradient_l2_distance": -0.016613174229860306,
    "input_gradient_dot_product": -0.00020923660486005247
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.0055230725556612015,
    "right_subspace_overlap_bottom_k": 0.0028261623810976744,
    "interaction_matrix_overlap_top_k": 0.003556023584678769,
    "interaction_matrix_overlap_bottom_k": 0.004581043031066656,
    "effective_rank": 0.01601855270564556,
    "effective_rank_mergeability_score": 0.01914389245212078,
    "stable_rank": 0.01204177550971508,
    "spectral_gap": 0.016313623636960983,
    "singular_value_ratio": 0.01590082049369812,
    "layerwise_effective_rank": 0.015462138690054417,
    "layerwise_effective_rank_mergeability_score": 0.01270507276058197,
    "task_vector_cosine_similarity": 0.013291682116687298,
    "task_vector_l2_distance": 0.003933359403163195,
    "task_vector_dot_product": 0.0027752683963626623,
    "weight_space_angle": 0.014463613741099834,
    "task_vector_magnitude_ratio": 0.0017036937642842531,
    "singular_value_overlap": 0.003941190429031849,
    "subspace_overlap": 0.006348214577883482,
    "right_subspace_overlap": 0.0037435314152389765,
    "activation_l2_distance": 0.010547442361712456,
    "activation_cosine_similarity": 0.008980074897408485,
    "activation_magnitude_ratio": 0.0051793912425637245,
    "activation_dot_product": 0.006403650622814894,
    "encoder_gradient_cosine_similarity": 0.00287380232475698,
    "encoder_gradient_l2_distance": 0.007537545170634985,
    "encoder_gradient_dot_product": 0.0034398019779473543,
    "input_gradient_cosine_similarity": 0.003652745857834816,
    "input_gradient_l2_distance": 0.005044944118708372,
    "input_gradient_dot_product": 0.0016669004689902067
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.7,
    "right_subspace_overlap_bottom_k": 0.55,
    "interaction_matrix_overlap_top_k": 0.8,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 1.0,
    "effective_rank_mergeability_score": 1.0,
    "stable_rank": 0.85,
    "spectral_gap": 1.0,
    "singular_value_ratio": 1.0,
    "layerwise_effective_rank": 1.0,
    "layerwise_effective_rank_mergeability_score": 1.0,
    "task_vector_cosine_similarity": 1.0,
    "task_vector_l2_distance": 0.95,
    "task_vector_dot_product": 0.7,
    "weight_space_angle": 1.0,
    "task_vector_magnitude_ratio": 0.6,
    "singular_value_overlap": 0.95,
    "subspace_overlap": 0.75,
    "right_subspace_overlap": 0.7,
    "activation_l2_distance": 0.95,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.65,
    "activation_dot_product": 0.7,
    "encoder_gradient_cosine_similarity": 0.75,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.8,
    "input_gradient_cosine_similarity": 0.9,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.6
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5953173502423217,
      "val_r": 0.5902246500404309,
      "n_iterations": 288,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025200957898050547,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0031146849505603313,
        "interaction_matrix_overlap_bottom_k": 0.014079579152166843,
        "effective_rank": 0.023750564083456993,
        "effective_rank_mergeability_score": 0.06293374300003052,
        "stable_rank": 0.026264578104019165,
        "spectral_gap": 0.07303491979837418,
        "singular_value_ratio": 0.06425982713699341,
        "layerwise_effective_rank": 0.044390711933374405,
        "layerwise_effective_rank_mergeability_score": 0.026918241754174232,
        "task_vector_cosine_similarity": 0.08394726365804672,
        "task_vector_l2_distance": -0.010754233226180077,
        "task_vector_dot_product": -0.0014231788227334619,
        "weight_space_angle": 0.08886060118675232,
        "task_vector_magnitude_ratio": 0.0017722113989293575,
        "singular_value_overlap": -0.008807219564914703,
        "subspace_overlap": 0.007012350484728813,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.010000789538025856,
        "activation_cosine_similarity": 0.0133676677942276,
        "activation_magnitude_ratio": -0.003846755251288414,
        "activation_dot_product": 0.00207308866083622,
        "encoder_gradient_cosine_similarity": 0.0012380261905491352,
        "encoder_gradient_l2_distance": -0.01643987186253071,
        "encoder_gradient_dot_product": 0.0022866218350827694,
        "input_gradient_cosine_similarity": 0.0014597040135413408,
        "input_gradient_l2_distance": -0.016159458085894585,
        "input_gradient_dot_product": -0.001888248254545033
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5595292010868732,
      "val_r": 0.30381231584422275,
      "n_iterations": 314,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.008302178233861923,
        "interaction_matrix_overlap_bottom_k": 0.012615181505680084,
        "effective_rank": 0.06409730762243271,
        "effective_rank_mergeability_score": 0.08023659884929657,
        "stable_rank": 0.014275440946221352,
        "spectral_gap": 0.041157227009534836,
        "singular_value_ratio": 0.02973439171910286,
        "layerwise_effective_rank": 0.05195464938879013,
        "layerwise_effective_rank_mergeability_score": 0.046837951987981796,
        "task_vector_cosine_similarity": 0.06441450864076614,
        "task_vector_l2_distance": -0.013728474266827106,
        "task_vector_dot_product": 0.004226164426654577,
        "weight_space_angle": 0.0747983530163765,
        "task_vector_magnitude_ratio": 0.001516458811238408,
        "singular_value_overlap": -0.0069622076116502285,
        "subspace_overlap": 0.005341010168194771,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.01732459105551243,
        "activation_cosine_similarity": 0.0135668208822608,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0029151258058845997,
        "encoder_gradient_cosine_similarity": 0.0018405200680717826,
        "encoder_gradient_l2_distance": -0.0067168413661420345,
        "encoder_gradient_dot_product": 0.0025136617477983236,
        "input_gradient_cosine_similarity": 0.0024918264243751764,
        "input_gradient_l2_distance": -0.011859682388603687,
        "input_gradient_dot_product": 0.0011655203998088837
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5482454058863735,
      "val_r": 0.508976499049505,
      "n_iterations": 287,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0012522728648036718,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.011905405670404434,
        "effective_rank": 0.05875558778643608,
        "effective_rank_mergeability_score": 0.06772689521312714,
        "stable_rank": 0.01366003230214119,
        "spectral_gap": 0.04025785252451897,
        "singular_value_ratio": 0.035588547587394714,
        "layerwise_effective_rank": 0.048263490200042725,
        "layerwise_effective_rank_mergeability_score": 0.05027084797620773,
        "task_vector_cosine_similarity": 0.08179587125778198,
        "task_vector_l2_distance": -0.010750600136816502,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.08885475248098373,
        "task_vector_magnitude_ratio": 0.0011849055299535394,
        "singular_value_overlap": -0.007253941148519516,
        "subspace_overlap": 0.0060371593572199345,
        "right_subspace_overlap": 0.002746951300650835,
        "activation_l2_distance": 0.01137627474963665,
        "activation_cosine_similarity": 0.00881096813827753,
        "activation_magnitude_ratio": -0.0012455754913389683,
        "activation_dot_product": 0.0023634061217308044,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.00934805627912283,
        "encoder_gradient_dot_product": 0.0033154580742120743,
        "input_gradient_cosine_similarity": 0.0011513640638440847,
        "input_gradient_l2_distance": -0.014175215736031532,
        "input_gradient_dot_product": -0.0011658358853310347
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4656485249871559,
      "val_r": 0.3671419282442522,
      "n_iterations": 313,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003423442132771015,
        "right_subspace_overlap_bottom_k": -0.0017544038128107786,
        "interaction_matrix_overlap_top_k": 0.0031988583505153656,
        "interaction_matrix_overlap_bottom_k": 0.010976781137287617,
        "effective_rank": 0.018223799765110016,
        "effective_rank_mergeability_score": 0.024319032207131386,
        "stable_rank": 0.0072894468903541565,
        "spectral_gap": 0.1038215160369873,
        "singular_value_ratio": 0.0963028222322464,
        "layerwise_effective_rank": 0.023858584463596344,
        "layerwise_effective_rank_mergeability_score": 0.03531908243894577,
        "task_vector_cosine_similarity": 0.071907177567482,
        "task_vector_l2_distance": -0.008784297853708267,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.07313016802072525,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0035012478474527597,
        "subspace_overlap": 0.010281178168952465,
        "right_subspace_overlap": 0.0018392736092209816,
        "activation_l2_distance": 0.020436178892850876,
        "activation_cosine_similarity": 0.021435951814055443,
        "activation_magnitude_ratio": -0.0014331999700516462,
        "activation_dot_product": 0.004747242201119661,
        "encoder_gradient_cosine_similarity": 0.0022222381085157394,
        "encoder_gradient_l2_distance": -0.00630585104227066,
        "encoder_gradient_dot_product": 0.0029894807375967503,
        "input_gradient_cosine_similarity": 0.0016304892487823963,
        "input_gradient_l2_distance": -0.015362540259957314,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5572576953135869,
      "val_r": 0.6089733540361635,
      "n_iterations": 366,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0034868025686591864,
        "right_subspace_overlap_bottom_k": 0.0010165320709347725,
        "interaction_matrix_overlap_top_k": 0.0016437303274869919,
        "interaction_matrix_overlap_bottom_k": 0.011513778008520603,
        "effective_rank": 0.04257991164922714,
        "effective_rank_mergeability_score": 0.047572024166584015,
        "stable_rank": 0.0,
        "spectral_gap": 0.05743873491883278,
        "singular_value_ratio": 0.051502250134944916,
        "layerwise_effective_rank": 0.04875225946307182,
        "layerwise_effective_rank_mergeability_score": 0.04843314737081528,
        "task_vector_cosine_similarity": 0.0979895144701004,
        "task_vector_l2_distance": -0.01660124585032463,
        "task_vector_dot_product": -0.0012658004416152835,
        "weight_space_angle": 0.10577890276908875,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008797204121947289,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005154358223080635,
        "activation_l2_distance": 0.004149764310568571,
        "activation_cosine_similarity": 0.006235101260244846,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.010143267922103405,
        "encoder_gradient_dot_product": 0.0045272731222212315,
        "input_gradient_cosine_similarity": 0.00348164071328938,
        "input_gradient_l2_distance": -0.01710568368434906,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5943621444469385,
      "val_r": 0.7021736140226598,
      "n_iterations": 212,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0038912291638553143,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.002407452091574669,
        "interaction_matrix_overlap_bottom_k": 0.012662841007113457,
        "effective_rank": 0.07260574400424957,
        "effective_rank_mergeability_score": 0.08778543770313263,
        "stable_rank": 0.010721871629357338,
        "spectral_gap": 0.04926512762904167,
        "singular_value_ratio": 0.04240847006440163,
        "layerwise_effective_rank": 0.061138950288295746,
        "layerwise_effective_rank_mergeability_score": 0.05805317685008049,
        "task_vector_cosine_similarity": 0.05333588272333145,
        "task_vector_l2_distance": -0.015426275320351124,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.059535857290029526,
        "task_vector_magnitude_ratio": 0.0011226278729736805,
        "singular_value_overlap": -0.012292437255382538,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0017763508949428797,
        "activation_l2_distance": 0.005087911617010832,
        "activation_cosine_similarity": 0.008577782660722733,
        "activation_magnitude_ratio": -0.0018134041456505656,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0013101112563163042,
        "encoder_gradient_l2_distance": -0.014692799188196659,
        "encoder_gradient_dot_product": 0.0023766455706208944,
        "input_gradient_cosine_similarity": 0.004481729585677385,
        "input_gradient_l2_distance": -0.016339702531695366,
        "input_gradient_dot_product": -0.002856561215594411
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.3762535848857412,
      "val_r": 0.20816356300317138,
      "n_iterations": 266,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.023057298734784126,
        "right_subspace_overlap_bottom_k": 0.009199309162795544,
        "interaction_matrix_overlap_top_k": 0.01197175495326519,
        "interaction_matrix_overlap_bottom_k": 0.021495604887604713,
        "effective_rank": 0.016743676736950874,
        "effective_rank_mergeability_score": 0.03112032078206539,
        "stable_rank": 0.0015190886333584785,
        "spectral_gap": 0.06994042545557022,
        "singular_value_ratio": 0.061471499502658844,
        "layerwise_effective_rank": 0.08805953711271286,
        "layerwise_effective_rank_mergeability_score": 0.08319194614887238,
        "task_vector_cosine_similarity": 0.07076606154441833,
        "task_vector_l2_distance": -0.007320062257349491,
        "task_vector_dot_product": -0.004392554517835379,
        "weight_space_angle": 0.06071916222572327,
        "task_vector_magnitude_ratio": -0.0015217752661556005,
        "singular_value_overlap": 0.005475309677422047,
        "subspace_overlap": 0.019568707793951035,
        "right_subspace_overlap": 0.015744155272841454,
        "activation_l2_distance": -0.009426357224583626,
        "activation_cosine_similarity": 0.03216629847884178,
        "activation_magnitude_ratio": 0.022027086466550827,
        "activation_dot_product": 0.027284974232316017,
        "encoder_gradient_cosine_similarity": 0.012258246541023254,
        "encoder_gradient_l2_distance": -0.03166789188981056,
        "encoder_gradient_dot_product": 0.014581955038011074,
        "input_gradient_cosine_similarity": 0.008427455089986324,
        "input_gradient_l2_distance": -0.029125196859240532,
        "input_gradient_dot_product": 0.0037570102140307426
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4733913148563366,
      "val_r": 0.25965243030263896,
      "n_iterations": 422,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0017074712086468935,
        "interaction_matrix_overlap_bottom_k": 0.01626325026154518,
        "effective_rank": 0.04960604012012482,
        "effective_rank_mergeability_score": 0.0404144786298275,
        "stable_rank": 0.006224446929991245,
        "spectral_gap": 0.057192426174879074,
        "singular_value_ratio": 0.04844551905989647,
        "layerwise_effective_rank": 0.02756277285516262,
        "layerwise_effective_rank_mergeability_score": 0.049579668790102005,
        "task_vector_cosine_similarity": 0.05588468536734581,
        "task_vector_l2_distance": -0.01814335770905018,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.07539273053407669,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008148193359375,
        "subspace_overlap": 0.015404489822685719,
        "right_subspace_overlap": 0.0028633661568164825,
        "activation_l2_distance": 0.03475545719265938,
        "activation_cosine_similarity": 0.03194809705018997,
        "activation_magnitude_ratio": -0.0016152637545019388,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.001960702706128359,
        "encoder_gradient_l2_distance": -0.0042483750730752945,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0038469666615128517,
        "input_gradient_l2_distance": -0.008417172357439995,
        "input_gradient_dot_product": 0.0015725066186860204
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5951400489285127,
      "val_r": 0.06873783397159827,
      "n_iterations": 291,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0014061240945011377,
        "interaction_matrix_overlap_bottom_k": 0.009767260402441025,
        "effective_rank": 0.04593757912516594,
        "effective_rank_mergeability_score": 0.10321585088968277,
        "stable_rank": 0.052888840436935425,
        "spectral_gap": 0.035920582711696625,
        "singular_value_ratio": 0.026761014014482498,
        "layerwise_effective_rank": 0.0459723174571991,
        "layerwise_effective_rank_mergeability_score": 0.041414760053157806,
        "task_vector_cosine_similarity": 0.06513571739196777,
        "task_vector_l2_distance": -0.011411188170313835,
        "task_vector_dot_product": 0.0010063194204121828,
        "weight_space_angle": 0.06882977485656738,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.005895076785236597,
        "subspace_overlap": 0.005305061116814613,
        "right_subspace_overlap": 0.0019032573327422142,
        "activation_l2_distance": 0.011803077533841133,
        "activation_cosine_similarity": 0.011182252317667007,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0018587163649499416,
        "encoder_gradient_cosine_similarity": 0.003757872385904193,
        "encoder_gradient_l2_distance": -0.006048898212611675,
        "encoder_gradient_dot_product": 0.0015126249054446816,
        "input_gradient_cosine_similarity": 0.0015179693000391126,
        "input_gradient_l2_distance": -0.014685166999697685,
        "input_gradient_dot_product": -0.0031341444700956345
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5391783094060172,
      "val_r": 0.3621208786054817,
      "n_iterations": 389,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.002332288771867752,
        "interaction_matrix_overlap_top_k": 0.001969018252566457,
        "interaction_matrix_overlap_bottom_k": 0.010464994236826897,
        "effective_rank": 0.05103972554206848,
        "effective_rank_mergeability_score": 0.05946480855345726,
        "stable_rank": 0.005799146834760904,
        "spectral_gap": 0.058488864451646805,
        "singular_value_ratio": 0.053060274571180344,
        "layerwise_effective_rank": 0.050077639520168304,
        "layerwise_effective_rank_mergeability_score": 0.05542491376399994,
        "task_vector_cosine_similarity": 0.07789506018161774,
        "task_vector_l2_distance": -0.011362254619598389,
        "task_vector_dot_product": 0.003313465276733041,
        "weight_space_angle": 0.08765677362680435,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.007636265829205513,
        "subspace_overlap": 0.00901875365525484,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.003397783963009715,
        "activation_cosine_similarity": 0.00203372398391366,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.002315649762749672,
        "encoder_gradient_l2_distance": -0.011320971883833408,
        "encoder_gradient_dot_product": 0.006293409038335085,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.020040806382894516,
        "input_gradient_dot_product": -0.001148010604083538
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.49474456622730234,
      "val_r": 0.23264478231888555,
      "n_iterations": 267,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.012359149754047394,
        "right_subspace_overlap_bottom_k": 0.0035777471493929625,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.009432168677449226,
        "effective_rank": 0.02883460931479931,
        "effective_rank_mergeability_score": 0.0699603259563446,
        "stable_rank": 0.009427221491932869,
        "spectral_gap": 0.048409923911094666,
        "singular_value_ratio": 0.03949495777487755,
        "layerwise_effective_rank": 0.06885069608688354,
        "layerwise_effective_rank_mergeability_score": 0.0501558855175972,
        "task_vector_cosine_similarity": 0.08359401673078537,
        "task_vector_l2_distance": -0.011444084346294403,
        "task_vector_dot_product": -0.002410072600468993,
        "weight_space_angle": 0.08678970485925674,
        "task_vector_magnitude_ratio": -0.0015386707382276654,
        "singular_value_overlap": -0.005451160483062267,
        "subspace_overlap": -0.0028661552350968122,
        "right_subspace_overlap": 0.006609418895095587,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.010923185385763645,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.014850890263915062,
        "encoder_gradient_cosine_similarity": 0.004150649532675743,
        "encoder_gradient_l2_distance": -0.024071570485830307,
        "encoder_gradient_dot_product": 0.004512233193963766,
        "input_gradient_cosine_similarity": 0.011920955032110214,
        "input_gradient_l2_distance": -0.02000797726213932,
        "input_gradient_dot_product": 0.001875182380899787
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.48163591430375274,
      "val_r": 0.4817718775473831,
      "n_iterations": 249,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004795607645064592,
        "right_subspace_overlap_bottom_k": 0.0010541209485381842,
        "interaction_matrix_overlap_top_k": 0.0027049672789871693,
        "interaction_matrix_overlap_bottom_k": 0.011322448961436749,
        "effective_rank": 0.022646130993962288,
        "effective_rank_mergeability_score": 0.06309898942708969,
        "stable_rank": 0.005814664997160435,
        "spectral_gap": 0.02992580458521843,
        "singular_value_ratio": 0.02586306631565094,
        "layerwise_effective_rank": 0.07904162257909775,
        "layerwise_effective_rank_mergeability_score": 0.03698321804404259,
        "task_vector_cosine_similarity": 0.0713673010468483,
        "task_vector_l2_distance": -0.008773203939199448,
        "task_vector_dot_product": 0.005020296201109886,
        "weight_space_angle": 0.08869940042495728,
        "task_vector_magnitude_ratio": 0.001897204201668501,
        "singular_value_overlap": -0.002339700935408473,
        "subspace_overlap": 0.019142193719744682,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.03346095606684685,
        "activation_cosine_similarity": 0.029999008402228355,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.002473745495080948,
        "encoder_gradient_cosine_similarity": 0.005201899446547031,
        "encoder_gradient_l2_distance": -0.0037606460973620415,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.00439492566511035,
        "input_gradient_l2_distance": -0.01313411258161068,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5107076584417007,
      "val_r": 0.4051411765810078,
      "n_iterations": 300,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004225574433803558,
        "right_subspace_overlap_bottom_k": 0.002637506928294897,
        "interaction_matrix_overlap_top_k": -0.0018920637667179108,
        "interaction_matrix_overlap_bottom_k": 0.015560237690806389,
        "effective_rank": 0.038339294493198395,
        "effective_rank_mergeability_score": 0.0463755801320076,
        "stable_rank": 0.0180559940636158,
        "spectral_gap": 0.06029229983687401,
        "singular_value_ratio": 0.050328582525253296,
        "layerwise_effective_rank": 0.049639031291007996,
        "layerwise_effective_rank_mergeability_score": 0.05715835094451904,
        "task_vector_cosine_similarity": 0.06956499814987183,
        "task_vector_l2_distance": -0.008387049660086632,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.06425853818655014,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008996846154332161,
        "subspace_overlap": 0.0014656217535957694,
        "right_subspace_overlap": 0.003159106243401766,
        "activation_l2_distance": 0.016356272622942924,
        "activation_cosine_similarity": 0.020247334614396095,
        "activation_magnitude_ratio": 0.002972410060465336,
        "activation_dot_product": 0.004314871039241552,
        "encoder_gradient_cosine_similarity": 0.006128590553998947,
        "encoder_gradient_l2_distance": -0.008797467686235905,
        "encoder_gradient_dot_product": 0.006410045083612204,
        "input_gradient_cosine_similarity": 0.01338145136833191,
        "input_gradient_l2_distance": -0.020828159525990486,
        "input_gradient_dot_product": -0.0027386839501559734
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5379005504275836,
      "val_r": 0.7159643017748891,
      "n_iterations": 263,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002267963718622923,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.0010001698974519968,
        "interaction_matrix_overlap_bottom_k": 0.010124221444129944,
        "effective_rank": 0.031685926020145416,
        "effective_rank_mergeability_score": 0.04161287099123001,
        "stable_rank": 0.005676928907632828,
        "spectral_gap": 0.04130346700549126,
        "singular_value_ratio": 0.03316676244139671,
        "layerwise_effective_rank": 0.04739068076014519,
        "layerwise_effective_rank_mergeability_score": 0.04887177422642708,
        "task_vector_cosine_similarity": 0.10292956233024597,
        "task_vector_l2_distance": -0.013230417855083942,
        "task_vector_dot_product": 0.006877101957798004,
        "weight_space_angle": 0.10806353390216827,
        "task_vector_magnitude_ratio": 0.0027188491076231003,
        "singular_value_overlap": -0.0031320550478994846,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.008415509015321732,
        "activation_cosine_similarity": 0.009725858457386494,
        "activation_magnitude_ratio": -0.0010418584570288658,
        "activation_dot_product": 0.005744616501033306,
        "encoder_gradient_cosine_similarity": 0.0020307262893766165,
        "encoder_gradient_l2_distance": -0.02318716235458851,
        "encoder_gradient_dot_product": 0.002912752563133836,
        "input_gradient_cosine_similarity": 0.001008749008178711,
        "input_gradient_l2_distance": -0.01246526837348938,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5004625504737237,
      "val_r": 0.595000676024466,
      "n_iterations": 320,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0019040607148781419,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.006505146156996489,
        "effective_rank": 0.04399656876921654,
        "effective_rank_mergeability_score": 0.06277819722890854,
        "stable_rank": 0.011843523010611534,
        "spectral_gap": 0.057438924908638,
        "singular_value_ratio": 0.05020638182759285,
        "layerwise_effective_rank": 0.043848950415849686,
        "layerwise_effective_rank_mergeability_score": 0.04199323058128357,
        "task_vector_cosine_similarity": 0.08282611519098282,
        "task_vector_l2_distance": -0.011097636073827744,
        "task_vector_dot_product": -0.0021572308614850044,
        "weight_space_angle": 0.09198613464832306,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008131870999932289,
        "subspace_overlap": 0.011664694175124168,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.004310870077461004,
        "activation_cosine_similarity": 0.009321966208517551,
        "activation_magnitude_ratio": -0.0022498895414173603,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011800090782344341,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0015626766253262758,
        "input_gradient_l2_distance": -0.014397269114851952,
        "input_gradient_dot_product": 0.0014506920706480742
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5849326236384357,
      "val_r": 0.42198002079176217,
      "n_iterations": 540,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.0012847259640693665,
        "interaction_matrix_overlap_bottom_k": 0.008210113272070885,
        "effective_rank": 0.038258396089076996,
        "effective_rank_mergeability_score": 0.05378538370132446,
        "stable_rank": 0.0,
        "spectral_gap": 0.04742105305194855,
        "singular_value_ratio": 0.043301042169332504,
        "layerwise_effective_rank": 0.05592276155948639,
        "layerwise_effective_rank_mergeability_score": 0.042762402445077896,
        "task_vector_cosine_similarity": 0.09313283860683441,
        "task_vector_l2_distance": -0.01409248448908329,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.09460863471031189,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0018401487031951547,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.003500357735902071,
        "activation_l2_distance": 0.025875484570860863,
        "activation_cosine_similarity": 0.02006836235523224,
        "activation_magnitude_ratio": -0.0011770774144679308,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.00943892914801836,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002288061659783125,
        "input_gradient_l2_distance": -0.011975888162851334,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5531434612041648,
      "val_r": 0.3161397253123455,
      "n_iterations": 477,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003870007349178195,
        "right_subspace_overlap_bottom_k": 0.004291201941668987,
        "interaction_matrix_overlap_top_k": 0.009897515177726746,
        "interaction_matrix_overlap_bottom_k": 0.0032850615680217743,
        "effective_rank": 0.03218454495072365,
        "effective_rank_mergeability_score": 0.04168960452079773,
        "stable_rank": 0.0014779854100197554,
        "spectral_gap": 0.06517692655324936,
        "singular_value_ratio": 0.060335155576467514,
        "layerwise_effective_rank": 0.04238898679614067,
        "layerwise_effective_rank_mergeability_score": 0.03759961202740669,
        "task_vector_cosine_similarity": 0.07645107805728912,
        "task_vector_l2_distance": -0.016583256423473358,
        "task_vector_dot_product": 0.005405594129115343,
        "weight_space_angle": 0.09934279322624207,
        "task_vector_magnitude_ratio": 0.006176697090268135,
        "singular_value_overlap": -0.0071053518913686275,
        "subspace_overlap": 0.007635423913598061,
        "right_subspace_overlap": 0.001884256023913622,
        "activation_l2_distance": 0.0068037621676921844,
        "activation_cosine_similarity": 0.0034737770911306143,
        "activation_magnitude_ratio": -0.0028906487859785557,
        "activation_dot_product": 0.0043131099082529545,
        "encoder_gradient_cosine_similarity": 0.005378323141485453,
        "encoder_gradient_l2_distance": 0.0018021846190094948,
        "encoder_gradient_dot_product": 0.009454645216464996,
        "input_gradient_cosine_similarity": 0.0021895496174693108,
        "input_gradient_l2_distance": -0.023007921874523163,
        "input_gradient_dot_product": -0.001074159168638289
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5598091344211292,
      "val_r": 0.2915949487866153,
      "n_iterations": 307,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0024166011717170477,
        "right_subspace_overlap_bottom_k": 0.0019366401247680187,
        "interaction_matrix_overlap_top_k": 0.0027126893401145935,
        "interaction_matrix_overlap_bottom_k": 0.016618739813566208,
        "effective_rank": 0.07117004692554474,
        "effective_rank_mergeability_score": 0.06455940753221512,
        "stable_rank": 0.020128922536969185,
        "spectral_gap": 0.043918658047914505,
        "singular_value_ratio": 0.03807384520769119,
        "layerwise_effective_rank": 0.03678339347243309,
        "layerwise_effective_rank_mergeability_score": 0.06786994636058807,
        "task_vector_cosine_similarity": 0.054286081343889236,
        "task_vector_l2_distance": -0.009804465807974339,
        "task_vector_dot_product": 0.0012132280971854925,
        "weight_space_angle": 0.0660819485783577,
        "task_vector_magnitude_ratio": 0.001526745967566967,
        "singular_value_overlap": -0.0015566409565508366,
        "subspace_overlap": 0.01013001799583435,
        "right_subspace_overlap": 0.0023801352363079786,
        "activation_l2_distance": 0.015345611609518528,
        "activation_cosine_similarity": 0.014648068696260452,
        "activation_magnitude_ratio": -0.0013175247004255652,
        "activation_dot_product": 0.007218101993203163,
        "encoder_gradient_cosine_similarity": 0.003258275566622615,
        "encoder_gradient_l2_distance": -0.013062011450529099,
        "encoder_gradient_dot_product": 0.002944465959444642,
        "input_gradient_cosine_similarity": 0.007815287448465824,
        "input_gradient_l2_distance": -0.0262135062366724,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7850113242421635,
      "val_r": 0.6063160330496264,
      "n_iterations": 352,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010329579003155231,
        "right_subspace_overlap_bottom_k": -0.005699553526937962,
        "interaction_matrix_overlap_top_k": 0.0020589998457580805,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.051199689507484436,
        "effective_rank_mergeability_score": 0.03961385786533356,
        "stable_rank": 0.0010544307297095656,
        "spectral_gap": 0.040577489882707596,
        "singular_value_ratio": 0.04190541431307793,
        "layerwise_effective_rank": 0.037866298109292984,
        "layerwise_effective_rank_mergeability_score": 0.05956173688173294,
        "task_vector_cosine_similarity": 0.08458662033081055,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0016937959007918835,
        "weight_space_angle": 0.10058653354644775,
        "task_vector_magnitude_ratio": 0.003351234830915928,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0038946918211877346,
        "right_subspace_overlap": 0.007433086633682251,
        "activation_l2_distance": 0.014256340451538563,
        "activation_cosine_similarity": 0.016378581523895264,
        "activation_magnitude_ratio": -0.0013516999315470457,
        "activation_dot_product": 0.006108683068305254,
        "encoder_gradient_cosine_similarity": 0.004454353358596563,
        "encoder_gradient_l2_distance": -0.011696399189531803,
        "encoder_gradient_dot_product": 0.0021869074553251266,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.012609098106622696,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.61811137177849,
      "val_r": 0.35137559386556255,
      "n_iterations": 456,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.001286168466322124,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.012040154077112675,
        "effective_rank": 0.03788142278790474,
        "effective_rank_mergeability_score": 0.04082424193620682,
        "stable_rank": 0.0,
        "spectral_gap": 0.06848742067813873,
        "singular_value_ratio": 0.06101091951131821,
        "layerwise_effective_rank": 0.06809207051992416,
        "layerwise_effective_rank_mergeability_score": 0.06721214205026627,
        "task_vector_cosine_similarity": 0.07787375897169113,
        "task_vector_l2_distance": -0.013742499984800816,
        "task_vector_dot_product": 0.0012969211675226688,
        "weight_space_angle": 0.08172136545181274,
        "task_vector_magnitude_ratio": 0.001028873142786324,
        "singular_value_overlap": -0.0076887174509465694,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0016468387329950929,
        "activation_l2_distance": 0.0065783304162323475,
        "activation_cosine_similarity": 0.0021388756576925516,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.010752868838608265,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008225261233747005,
        "encoder_gradient_dot_product": 0.00463744206354022,
        "input_gradient_cosine_similarity": 0.003791617229580879,
        "input_gradient_l2_distance": -0.014353667385876179,
        "input_gradient_dot_product": 0.0
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}