{
  "aggregate_metrics": {
    "train_r": 0.3969919351551527,
    "train_p": 4.2744540672952456e-122,
    "val_r": 0.06638532008320312,
    "val_p": 0.21018420497155335
  },
  "per_fold_stats": {
    "train_r_mean": 0.5886771611431418,
    "train_r_std": 0.06504344261757135,
    "val_r_mean": 0.45068477523106826,
    "val_r_std": 0.17596868409316313,
    "n_nonzero_mean": 19.85,
    "n_nonzero_std": 3.380458548777074
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.003782773856073618,
    "right_subspace_overlap_bottom_k": -0.0016126602422446012,
    "interaction_matrix_overlap_top_k": 3.919284790754318e-05,
    "interaction_matrix_overlap_bottom_k": 0.02263762429356575,
    "effective_rank": -0.0009269095025956631,
    "effective_rank_mergeability_score": 0.0011344959493726492,
    "stable_rank": -0.0008139209821820259,
    "spectral_gap": 0.0002752138243522495,
    "singular_value_ratio": -0.00040968164103105664,
    "layerwise_effective_rank": -7.422269118251279e-05,
    "layerwise_effective_rank_mergeability_score": 7.365470810327679e-05,
    "task_vector_cosine_similarity": -0.001376676606014371,
    "task_vector_l2_distance": -0.021419819444417953,
    "task_vector_dot_product": -0.0008720580372028053,
    "weight_space_angle": 0.0009181160712614655,
    "task_vector_magnitude_ratio": -0.004384725354611874,
    "singular_value_overlap": -0.015078742988407612,
    "subspace_overlap": 0.0030640901532024145,
    "right_subspace_overlap": 0.003953299019485712,
    "activation_l2_distance": -0.0007296672556549311,
    "activation_cosine_similarity": 0.004410469904541969,
    "activation_magnitude_ratio": -0.003674296196550131,
    "activation_dot_product": 0.0031240207608789206,
    "encoder_gradient_cosine_similarity": 0.0013526377733796835,
    "encoder_gradient_l2_distance": -0.026707783341407776,
    "encoder_gradient_dot_product": 0.0014674466801807284,
    "input_gradient_cosine_similarity": 0.0016204711282625794,
    "input_gradient_l2_distance": -0.026874344795942307,
    "input_gradient_dot_product": -0.00783727876842022
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.004989170003682375,
    "right_subspace_overlap_bottom_k": 0.008167548105120659,
    "interaction_matrix_overlap_top_k": 0.0024676055181771517,
    "interaction_matrix_overlap_bottom_k": 0.008478006348013878,
    "effective_rank": 0.0013631018809974194,
    "effective_rank_mergeability_score": 0.0015160468174144626,
    "stable_rank": 0.0012111476389691234,
    "spectral_gap": 0.00091951759532094,
    "singular_value_ratio": 0.0009574048453941941,
    "layerwise_effective_rank": 0.001077749882824719,
    "layerwise_effective_rank_mergeability_score": 0.0016378131695091724,
    "task_vector_cosine_similarity": 0.002594121266156435,
    "task_vector_l2_distance": 0.011569597758352757,
    "task_vector_dot_product": 0.003976170904934406,
    "weight_space_angle": 0.002751634456217289,
    "task_vector_magnitude_ratio": 0.0018921077717095613,
    "singular_value_overlap": 0.007941373623907566,
    "subspace_overlap": 0.004105299711227417,
    "right_subspace_overlap": 0.005735222715884447,
    "activation_l2_distance": 0.0030209971591830254,
    "activation_cosine_similarity": 0.0052911462262272835,
    "activation_magnitude_ratio": 0.0022261522244662046,
    "activation_dot_product": 0.004497924819588661,
    "encoder_gradient_cosine_similarity": 0.0013251072959974408,
    "encoder_gradient_l2_distance": 0.013947958126664162,
    "encoder_gradient_dot_product": 0.001985466806218028,
    "input_gradient_cosine_similarity": 0.0017180655850097537,
    "input_gradient_l2_distance": 0.01668107695877552,
    "input_gradient_dot_product": 0.005649831146001816
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.8,
    "right_subspace_overlap_bottom_k": 0.85,
    "interaction_matrix_overlap_top_k": 0.5,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 0.4,
    "effective_rank_mergeability_score": 0.55,
    "stable_rank": 0.5,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.35,
    "layerwise_effective_rank": 0.4,
    "layerwise_effective_rank_mergeability_score": 0.35,
    "task_vector_cosine_similarity": 0.6,
    "task_vector_l2_distance": 0.95,
    "task_vector_dot_product": 0.6,
    "weight_space_angle": 0.65,
    "task_vector_magnitude_ratio": 0.95,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.7,
    "right_subspace_overlap": 0.65,
    "activation_l2_distance": 0.75,
    "activation_cosine_similarity": 0.8,
    "activation_magnitude_ratio": 0.9,
    "activation_dot_product": 0.8,
    "encoder_gradient_cosine_similarity": 0.6,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.45,
    "input_gradient_cosine_similarity": 0.55,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.9
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.62598268311578,
      "val_r": 0.6069644376601067,
      "n_iterations": 482,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0027112921234220266,
        "right_subspace_overlap_bottom_k": 0.006611906923353672,
        "interaction_matrix_overlap_top_k": -0.0019699796102941036,
        "interaction_matrix_overlap_bottom_k": 0.032874200493097305,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0010580765083432198,
        "layerwise_effective_rank": 0.0028221013490110636,
        "layerwise_effective_rank_mergeability_score": -0.0039050057530403137,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0321345254778862,
        "task_vector_dot_product": -0.003933998756110668,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.00610487861558795,
        "singular_value_overlap": -0.029399026185274124,
        "subspace_overlap": 0.015052501112222672,
        "right_subspace_overlap": 0.0014592737425118685,
        "activation_l2_distance": -0.0012064268812537193,
        "activation_cosine_similarity": 0.010025318711996078,
        "activation_magnitude_ratio": -0.010392112657427788,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.034717585891485214,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.004944451153278351,
        "input_gradient_l2_distance": -0.03056325763463974,
        "input_gradient_dot_product": -0.007859572768211365
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.47742064573700466,
      "val_r": 0.4149946628671065,
      "n_iterations": 317,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00605149008333683,
        "right_subspace_overlap_bottom_k": -0.010352012701332569,
        "interaction_matrix_overlap_top_k": 0.0016768991481512785,
        "interaction_matrix_overlap_bottom_k": 0.024332385510206223,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0014189973007887602,
        "spectral_gap": -0.001624859170988202,
        "singular_value_ratio": 0.0017392014851793647,
        "layerwise_effective_rank": 0.0014829867286607623,
        "layerwise_effective_rank_mergeability_score": -0.001912758918479085,
        "task_vector_cosine_similarity": 0.0010974827455356717,
        "task_vector_l2_distance": -0.00920994020998478,
        "task_vector_dot_product": 0.0022897357121109962,
        "weight_space_angle": -0.0028311586938798428,
        "task_vector_magnitude_ratio": -0.004225633107125759,
        "singular_value_overlap": -0.00555286044254899,
        "subspace_overlap": 0.0026813976000994444,
        "right_subspace_overlap": 0.004424413666129112,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.003307162318378687,
        "activation_magnitude_ratio": -0.0015295286430045962,
        "activation_dot_product": 0.004668941721320152,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.014745364896953106,
        "encoder_gradient_dot_product": 0.003107246942818165,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01559995487332344,
        "input_gradient_dot_product": -0.0049713049083948135
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.550082604806365,
      "val_r": 0.5444917628831509,
      "n_iterations": 215,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00864087138324976,
        "right_subspace_overlap_bottom_k": -0.008983196690678596,
        "interaction_matrix_overlap_top_k": 0.0025953773874789476,
        "interaction_matrix_overlap_bottom_k": 0.016862036660313606,
        "effective_rank": -0.002775118686258793,
        "effective_rank_mergeability_score": 0.002072329632937908,
        "stable_rank": -0.001963934162631631,
        "spectral_gap": 0.0015397162642329931,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0015531667741015553,
        "layerwise_effective_rank_mergeability_score": 0.0011188734788447618,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012248340994119644,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.002720718737691641,
        "task_vector_magnitude_ratio": -0.006185466889292002,
        "singular_value_overlap": -0.014468288980424404,
        "subspace_overlap": 0.002102792728692293,
        "right_subspace_overlap": 0.002890111645683646,
        "activation_l2_distance": -0.00113798794336617,
        "activation_cosine_similarity": 0.0050964439287781715,
        "activation_magnitude_ratio": -0.005145775619894266,
        "activation_dot_product": 0.0027657360769808292,
        "encoder_gradient_cosine_similarity": 0.0020676911808550358,
        "encoder_gradient_l2_distance": -0.01917426474392414,
        "encoder_gradient_dot_product": 0.003126688301563263,
        "input_gradient_cosine_similarity": 0.0014000269584357738,
        "input_gradient_l2_distance": -0.024122724309563637,
        "input_gradient_dot_product": -0.01518973521888256
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5654733255226047,
      "val_r": 0.41536706901372233,
      "n_iterations": 276,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004074949771165848,
        "right_subspace_overlap_bottom_k": -0.008789895102381706,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.02106073684990406,
        "effective_rank": -0.0014471448957920074,
        "effective_rank_mergeability_score": 0.0014554124791175127,
        "stable_rank": -0.001483917934820056,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0011165683390572667,
        "task_vector_l2_distance": -0.01214651484042406,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.006253329571336508,
        "singular_value_overlap": -0.010230659507215023,
        "subspace_overlap": 0.0023111216723918915,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0012222264194861054,
        "activation_cosine_similarity": 0.0022414447739720345,
        "activation_magnitude_ratio": -0.0024976427666842937,
        "activation_dot_product": 0.0032684565521776676,
        "encoder_gradient_cosine_similarity": 0.001224359730258584,
        "encoder_gradient_l2_distance": -0.011838630773127079,
        "encoder_gradient_dot_product": 0.003973703365772963,
        "input_gradient_cosine_similarity": 0.0017384011298418045,
        "input_gradient_l2_distance": -0.01396102923899889,
        "input_gradient_dot_product": -0.0072121829725801945
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6342907731030996,
      "val_r": 0.7332804981536657,
      "n_iterations": 405,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.00399859668686986,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.033627402037382126,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0014466664288192987,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0011358840856701136,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02765839174389839,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010326531482860446,
        "task_vector_magnitude_ratio": -0.003355965716764331,
        "singular_value_overlap": -0.018375828862190247,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0011152717052027583,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.004530394449830055,
        "activation_dot_product": 0.0022279543336480856,
        "encoder_gradient_cosine_similarity": 0.0013564021792262793,
        "encoder_gradient_l2_distance": -0.01761046051979065,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002695862203836441,
        "input_gradient_l2_distance": -0.025880247354507446,
        "input_gradient_dot_product": -0.0023263334296643734
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6109649631453478,
      "val_r": 0.6620668002364513,
      "n_iterations": 317,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0010259830160066485,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.02442559041082859,
        "effective_rank": -0.0015273533063009381,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0017164999153465033,
        "task_vector_l2_distance": -0.022187545895576477,
        "task_vector_dot_product": 0.0046730050817132,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0061234538443386555,
        "singular_value_overlap": -0.0149494968354702,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0013467057142406702,
        "activation_cosine_similarity": 0.0020077144727110863,
        "activation_magnitude_ratio": -0.0038837238680571318,
        "activation_dot_product": 0.002789819613099098,
        "encoder_gradient_cosine_similarity": 0.003128728596493602,
        "encoder_gradient_l2_distance": -0.022205332294106483,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.00277901953086257,
        "input_gradient_l2_distance": -0.01142074353992939,
        "input_gradient_dot_product": -0.006130892783403397
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5941591344957584,
      "val_r": 0.1420182043761619,
      "n_iterations": 271,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0018623759970068932,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.014939460903406143,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0010115024633705616,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0017795951571315527,
        "task_vector_l2_distance": -0.015300845727324486,
        "task_vector_dot_product": -0.0034842314198613167,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004405296873301268,
        "singular_value_overlap": -0.011105028912425041,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0012988531962037086,
        "activation_cosine_similarity": 0.0026525547727942467,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0020921325776726007,
        "encoder_gradient_l2_distance": -0.02470073103904724,
        "encoder_gradient_dot_product": 0.0031359673012048006,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0186931099742651,
        "input_gradient_dot_product": -0.0061933910474181175
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5456735748148034,
      "val_r": 0.218234676468107,
      "n_iterations": 296,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025540830101817846,
        "right_subspace_overlap_bottom_k": -0.006310112774372101,
        "interaction_matrix_overlap_top_k": -0.0020702520851045847,
        "interaction_matrix_overlap_bottom_k": 0.02584431879222393,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0010806478094309568,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02205166406929493,
        "task_vector_dot_product": -0.0010230811312794685,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.005647765006870031,
        "singular_value_overlap": -0.016316015273332596,
        "subspace_overlap": 0.006132957059890032,
        "right_subspace_overlap": 0.004088551737368107,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.004580298438668251,
        "activation_magnitude_ratio": -0.005903948098421097,
        "activation_dot_product": 0.0010341686429455876,
        "encoder_gradient_cosine_similarity": 0.0020937081426382065,
        "encoder_gradient_l2_distance": -0.024023281410336494,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.013134424574673176,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5832961659278566,
      "val_r": 0.46817225310998656,
      "n_iterations": 367,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.017862267792224884,
        "right_subspace_overlap_bottom_k": 0.015222576446831226,
        "interaction_matrix_overlap_top_k": 0.0023496723733842373,
        "interaction_matrix_overlap_bottom_k": 0.025218866765499115,
        "effective_rank": -0.005202149040997028,
        "effective_rank_mergeability_score": 0.006594863720238209,
        "stable_rank": -0.0037083192728459835,
        "spectral_gap": 0.001671244390308857,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0011602991726249456,
        "layerwise_effective_rank_mergeability_score": 0.003534168004989624,
        "task_vector_cosine_similarity": -0.009298569522798061,
        "task_vector_l2_distance": -0.05171538516879082,
        "task_vector_dot_product": -0.013468698598444462,
        "weight_space_angle": 0.009384207427501678,
        "task_vector_magnitude_ratio": -0.003887744853273034,
        "singular_value_overlap": -0.036215849220752716,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.015501661226153374,
        "activation_l2_distance": -0.01001013908535242,
        "activation_cosine_similarity": 0.017028484493494034,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.009890276938676834,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.06874821335077286,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.07933884114027023,
        "input_gradient_dot_product": -0.019205957651138306
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5982035854472662,
      "val_r": 0.11118263810488499,
      "n_iterations": 216,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012849525082856417,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.02554757334291935,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0012429719790816307,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0017955484800040722,
        "task_vector_l2_distance": -0.02140290103852749,
        "task_vector_dot_product": 0.00208811042830348,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0028038639575242996,
        "singular_value_overlap": -0.014742684550583363,
        "subspace_overlap": 0.007869618944823742,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.00716578122228384,
        "activation_magnitude_ratio": -0.002429869258776307,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0035320979077368975,
        "encoder_gradient_l2_distance": -0.017343884333968163,
        "encoder_gradient_dot_product": 0.0022991334553807974,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.024021346122026443,
        "input_gradient_dot_product": -0.005260368809103966
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5700026263246705,
      "val_r": 0.19174402064582424,
      "n_iterations": 285,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.008211788721382618,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.028891686350107193,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0015946872299537063,
        "stable_rank": -0.0015866563189774752,
        "spectral_gap": 0.0011684262426570058,
        "singular_value_ratio": -0.001028523431159556,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0344122014939785,
        "task_vector_dot_product": 0.0020368006080389023,
        "weight_space_angle": 0.0016669894102960825,
        "task_vector_magnitude_ratio": -0.003190940711647272,
        "singular_value_overlap": -0.01802612841129303,
        "subspace_overlap": 0.0023875765036791563,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0011961404234170914,
        "activation_cosine_similarity": 0.002780165756121278,
        "activation_magnitude_ratio": -0.004539423156529665,
        "activation_dot_product": 0.009351343847811222,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.038478750735521317,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.019502807408571243,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5396948308400396,
      "val_r": 0.4691565843375923,
      "n_iterations": 208,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0020308338571339846,
        "right_subspace_overlap_bottom_k": -0.008749177679419518,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.018698707222938538,
        "effective_rank": -0.0026335171423852444,
        "effective_rank_mergeability_score": 0.0027776637580245733,
        "stable_rank": -0.0027884971350431442,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.001917990273796022,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.004837851971387863,
        "task_vector_l2_distance": -0.012224910780787468,
        "task_vector_dot_product": -0.00366635131649673,
        "weight_space_angle": 0.0042332373559474945,
        "task_vector_magnitude_ratio": -0.0062951561994850636,
        "singular_value_overlap": -0.015345431864261627,
        "subspace_overlap": 0.007730948273092508,
        "right_subspace_overlap": 0.009389771148562431,
        "activation_l2_distance": -0.004846248310059309,
        "activation_cosine_similarity": 0.005613371264189482,
        "activation_magnitude_ratio": -0.004692621063441038,
        "activation_dot_product": 0.0019461135379970074,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.022736918181180954,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0030732606537640095,
        "input_gradient_l2_distance": -0.026746651157736778,
        "input_gradient_dot_product": -0.010087172500789165
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5672930912602308,
      "val_r": 0.4907708629962491,
      "n_iterations": 217,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.0034816686529666185,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.027981339022517204,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.020368337631225586,
        "task_vector_dot_product": 0.005801868159323931,
        "weight_space_angle": -0.0021740305237472057,
        "task_vector_magnitude_ratio": -0.005218622274696827,
        "singular_value_overlap": -0.013299915008246899,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0022318821866065264,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0018159919418394566,
        "activation_dot_product": 0.006954758893698454,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.021638624370098114,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0028000171296298504,
        "input_gradient_l2_distance": -0.017894292250275612,
        "input_gradient_dot_product": -0.007077984511852264
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5510972676849942,
      "val_r": 0.6379396901828287,
      "n_iterations": 343,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01172013022005558,
        "right_subspace_overlap_bottom_k": -0.005743416491895914,
        "interaction_matrix_overlap_top_k": 0.0048704142682254314,
        "interaction_matrix_overlap_bottom_k": 0.022783061489462852,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.001069835969246924,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0014590146020054817,
        "layerwise_effective_rank_mergeability_score": -0.0023767086677253246,
        "task_vector_cosine_similarity": -0.0011444611009210348,
        "task_vector_l2_distance": -0.020671773701906204,
        "task_vector_dot_product": -0.004782233387231827,
        "weight_space_angle": 0.0012193178990855813,
        "task_vector_magnitude_ratio": -0.002111252164468169,
        "singular_value_overlap": -0.022601371631026268,
        "subspace_overlap": 0.008383545093238354,
        "right_subspace_overlap": 0.011000371538102627,
        "activation_l2_distance": -0.004465809091925621,
        "activation_cosine_similarity": 0.009507899172604084,
        "activation_magnitude_ratio": -0.002973764669150114,
        "activation_dot_product": 0.0012340706307440996,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.04150902107357979,
        "encoder_gradient_dot_product": 0.007696888875216246,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.04768839851021767,
        "input_gradient_dot_product": -0.023274550214409828
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4866480605935888,
      "val_r": 0.6126121041482812,
      "n_iterations": 234,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.008123998530209064,
        "interaction_matrix_overlap_top_k": -0.0023063826374709606,
        "interaction_matrix_overlap_bottom_k": 0.011876455508172512,
        "effective_rank": -0.001768458285368979,
        "effective_rank_mergeability_score": 0.0018348186276853085,
        "stable_rank": -0.0023255026899278164,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01133954431861639,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0031460258178412914,
        "task_vector_magnitude_ratio": -0.004816416185349226,
        "singular_value_overlap": -0.009605800732970238,
        "subspace_overlap": 0.0013536268379539251,
        "right_subspace_overlap": 0.0041817910969257355,
        "activation_l2_distance": -0.0010227428283542395,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.004670524969696999,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0011449818266555667,
        "encoder_gradient_l2_distance": -0.013578797690570354,
        "encoder_gradient_dot_product": 0.0021319000516086817,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.015407631173729897,
        "input_gradient_dot_product": -0.004800369497388601
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.607790473972281,
      "val_r": 0.3177408248671441,
      "n_iterations": 255,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004240983631461859,
        "right_subspace_overlap_bottom_k": -0.005693979095667601,
        "interaction_matrix_overlap_top_k": 0.0018480815924704075,
        "interaction_matrix_overlap_bottom_k": 0.014391524717211723,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0011983360163867474,
        "stable_rank": -0.0012794057838618755,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.013590481132268906,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010090830037370324,
        "task_vector_magnitude_ratio": -0.006317033898085356,
        "singular_value_overlap": -0.0036585612688213587,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.00545478006824851,
        "activation_l2_distance": 0.0023327814415097237,
        "activation_cosine_similarity": 0.004443441983312368,
        "activation_magnitude_ratio": -0.0027804579585790634,
        "activation_dot_product": 0.0019350413931533694,
        "encoder_gradient_cosine_similarity": 0.0010693459771573544,
        "encoder_gradient_l2_distance": -0.015038993209600449,
        "encoder_gradient_dot_product": 0.0023017143830657005,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0157734677195549,
        "input_gradient_dot_product": -0.0087199155241251
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6142691436932504,
      "val_r": 0.5047744565517832,
      "n_iterations": 256,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025929659605026245,
        "right_subspace_overlap_bottom_k": -0.0020835930481553078,
        "interaction_matrix_overlap_top_k": 0.0017343799117952585,
        "interaction_matrix_overlap_bottom_k": 0.020968738943338394,
        "effective_rank": -0.0014915346400812268,
        "effective_rank_mergeability_score": 0.001078072702512145,
        "stable_rank": -0.0015496821142733097,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0030157282017171383,
        "task_vector_l2_distance": -0.020308734849095345,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0037698366213589907,
        "task_vector_magnitude_ratio": -0.0023042752873152494,
        "singular_value_overlap": -0.011441349051892757,
        "subspace_overlap": 0.0028176300693303347,
        "right_subspace_overlap": 0.002299138344824314,
        "activation_l2_distance": 0.004637942183762789,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0035954974591732025,
        "activation_dot_product": 0.011127224192023277,
        "encoder_gradient_cosine_similarity": 0.0023109051398932934,
        "encoder_gradient_l2_distance": -0.015150452964007854,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.004774636588990688,
        "input_gradient_l2_distance": -0.01519726775586605,
        "input_gradient_dot_product": -0.0064687873236835
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6008037845467854,
      "val_r": 0.3883841107661064,
      "n_iterations": 226,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0018182151252403855,
        "right_subspace_overlap_bottom_k": 0.0169275663793087,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0400463230907917,
        "effective_rank": -0.0016929141711443663,
        "effective_rank_mergeability_score": 0.0013940958306193352,
        "stable_rank": 0.0,
        "spectral_gap": 0.001270742155611515,
        "singular_value_ratio": -0.0025280455593019724,
        "layerwise_effective_rank": -0.0014480819227173924,
        "layerwise_effective_rank_mergeability_score": 0.0013060690835118294,
        "task_vector_cosine_similarity": -0.0010366698261350393,
        "task_vector_l2_distance": -0.037593405693769455,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0021712842863053083,
        "task_vector_magnitude_ratio": -0.0014855992048978806,
        "singular_value_overlap": -0.014400534331798553,
        "subspace_overlap": 0.0010845991782844067,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0014314244035631418,
        "activation_cosine_similarity": 0.006204295437783003,
        "activation_magnitude_ratio": -0.004362908191978931,
        "activation_dot_product": 0.006908752024173737,
        "encoder_gradient_cosine_similarity": 0.0029922088142484426,
        "encoder_gradient_l2_distance": -0.032044339925050735,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.001054086023941636,
        "input_gradient_l2_distance": -0.05690222233533859,
        "input_gradient_dot_product": -0.0035247216001152992
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7985743096227778,
      "val_r": 0.6485117998611863,
      "n_iterations": 211,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011859321966767311,
        "right_subspace_overlap_bottom_k": -0.01314103975892067,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0020063607953488827,
        "layerwise_effective_rank_mergeability_score": 0.003708456875756383,
        "task_vector_cosine_similarity": -0.005639017093926668,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.003972087521106005,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0011898300144821405,
        "subspace_overlap": -0.003443934489041567,
        "right_subspace_overlap": 0.02028021402657032,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.014819180592894554,
        "activation_magnitude_ratio": -0.002555566607043147,
        "activation_dot_product": 0.007341211196035147,
        "encoder_gradient_cosine_similarity": 0.004040193278342485,
        "encoder_gradient_l2_distance": -0.050453417003154755,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.00401134230196476,
        "input_gradient_l2_distance": -0.02723843976855278,
        "input_gradient_dot_product": -0.0104000149294734
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6518221782083343,
      "val_r": 0.43528804739102533,
      "n_iterations": 295,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0026232823729515076,
        "right_subspace_overlap_bottom_k": 0.00622364180162549,
        "interaction_matrix_overlap_top_k": -0.007944352924823761,
        "interaction_matrix_overlap_bottom_k": 0.022382063791155815,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0025488429237157106,
        "singular_value_ratio": -0.0022643140982836485,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.002749495906755328,
        "task_vector_l2_distance": -0.03183097764849663,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.00264327647164464,
        "task_vector_magnitude_ratio": -0.006961815524846315,
        "singular_value_overlap": -0.020650213584303856,
        "subspace_overlap": 0.004817422479391098,
        "right_subspace_overlap": -0.0030193733982741833,
        "activation_l2_distance": -0.0023108285386115313,
        "activation_cosine_similarity": 0.005067398771643639,
        "activation_magnitude_ratio": -0.005186174996197224,
        "activation_dot_product": 0.008817099034786224,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.02841861918568611,
        "encoder_gradient_dot_product": 0.0015756909269839525,
        "input_gradient_cosine_similarity": 0.0031383181922137737,
        "input_gradient_l2_distance": -0.038400039076805115,
        "input_gradient_dot_product": -0.00804232619702816
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.3,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}