{
  "aggregate_metrics": {
    "train_r": 0.45862220809299836,
    "train_p": 2.342416506584294e-167,
    "val_r": 0.3428637702189011,
    "val_p": 2.5969614126138596e-11
  },
  "per_fold_stats": {
    "train_r_mean": 0.720340186386959,
    "train_r_std": 0.06599608304768316,
    "val_r_mean": 0.5779734530769707,
    "val_r_std": 0.19911802713444862,
    "n_nonzero_mean": 18.15,
    "n_nonzero_std": 2.5937424698685874
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.004708465188741684,
    "right_subspace_overlap_bottom_k": -0.008010061457753181,
    "interaction_matrix_overlap_top_k": 0.0015117996372282505,
    "interaction_matrix_overlap_bottom_k": -0.00019290500495117158,
    "effective_rank": -0.000283978006336838,
    "effective_rank_mergeability_score": 0.0006323595298454165,
    "stable_rank": -0.0003956049622502178,
    "spectral_gap": 0.0002330624556634575,
    "singular_value_ratio": -0.0003000728029292077,
    "layerwise_effective_rank": -0.000856732833199203,
    "layerwise_effective_rank_mergeability_score": 0.000911047391127795,
    "task_vector_cosine_similarity": -0.0006947992369532585,
    "task_vector_l2_distance": -0.004098940175026655,
    "task_vector_dot_product": -0.0013496583560481668,
    "weight_space_angle": 0.000530845602042973,
    "task_vector_magnitude_ratio": -5.2877825510222465e-05,
    "singular_value_overlap": 0.0009850380010902882,
    "subspace_overlap": 0.00040016035200096667,
    "right_subspace_overlap": 0.004668528214097023,
    "activation_l2_distance": -0.0023866959381848574,
    "activation_cosine_similarity": 0.009782802313566208,
    "activation_magnitude_ratio": -0.0016007922822609544,
    "activation_dot_product": 0.0029884621035307646,
    "encoder_gradient_cosine_similarity": 0.0016119983047246933,
    "encoder_gradient_l2_distance": -0.025692543014883995,
    "encoder_gradient_dot_product": 0.0006849066121503711,
    "input_gradient_cosine_similarity": 0.0008259260794147849,
    "input_gradient_l2_distance": -0.02054845727980137,
    "input_gradient_dot_product": -0.0035039230715483427
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.003134737489745021,
    "right_subspace_overlap_bottom_k": 0.003873331705108285,
    "interaction_matrix_overlap_top_k": 0.0022193919867277145,
    "interaction_matrix_overlap_bottom_k": 0.001780700869858265,
    "effective_rank": 0.0006924796616658568,
    "effective_rank_mergeability_score": 0.0010346906492486596,
    "stable_rank": 0.0009219464845955372,
    "spectral_gap": 0.0005715602310374379,
    "singular_value_ratio": 0.0006091052200645208,
    "layerwise_effective_rank": 0.0012683514505624771,
    "layerwise_effective_rank_mergeability_score": 0.0011349187698215246,
    "task_vector_cosine_similarity": 0.0021343242842704058,
    "task_vector_l2_distance": 0.0030055013485252857,
    "task_vector_dot_product": 0.001533003174699843,
    "weight_space_angle": 0.002132633700966835,
    "task_vector_magnitude_ratio": 0.0008232959662564099,
    "singular_value_overlap": 0.0026589324697852135,
    "subspace_overlap": 0.0018979668384417892,
    "right_subspace_overlap": 0.003097441280260682,
    "activation_l2_distance": 0.003351302118971944,
    "activation_cosine_similarity": 0.005046244245022535,
    "activation_magnitude_ratio": 0.0023664399050176144,
    "activation_dot_product": 0.0052276779897511005,
    "encoder_gradient_cosine_similarity": 0.0020647828932851553,
    "encoder_gradient_l2_distance": 0.011126135475933552,
    "encoder_gradient_dot_product": 0.0010174321942031384,
    "input_gradient_cosine_similarity": 0.0015294657787308097,
    "input_gradient_l2_distance": 0.01357677485793829,
    "input_gradient_dot_product": 0.002385731553658843
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.9,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.6,
    "interaction_matrix_overlap_bottom_k": 0.75,
    "effective_rank": 0.15,
    "effective_rank_mergeability_score": 0.35,
    "stable_rank": 0.35,
    "spectral_gap": 0.15,
    "singular_value_ratio": 0.2,
    "layerwise_effective_rank": 0.4,
    "layerwise_effective_rank_mergeability_score": 0.5,
    "task_vector_cosine_similarity": 0.6,
    "task_vector_l2_distance": 0.9,
    "task_vector_dot_product": 0.6,
    "weight_space_angle": 0.55,
    "task_vector_magnitude_ratio": 0.35,
    "singular_value_overlap": 0.4,
    "subspace_overlap": 0.7,
    "right_subspace_overlap": 0.9,
    "activation_l2_distance": 0.75,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.9,
    "activation_dot_product": 0.75,
    "encoder_gradient_cosine_similarity": 0.75,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.45,
    "input_gradient_cosine_similarity": 0.4,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.8
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7142320952584036,
      "val_r": 0.5745901561715565,
      "n_iterations": 184,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0015505764167755842,
        "right_subspace_overlap_bottom_k": -0.0030455198138952255,
        "interaction_matrix_overlap_top_k": -0.001096482272259891,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.001764769316650927,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.001219011377543211,
        "task_vector_l2_distance": -0.006922009866684675,
        "task_vector_dot_product": -0.0011440652888268232,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0018811884801834822,
        "singular_value_overlap": -0.0024822596460580826,
        "subspace_overlap": 0.0026371534913778305,
        "right_subspace_overlap": 0.0035960637032985687,
        "activation_l2_distance": -0.010428403504192829,
        "activation_cosine_similarity": 0.011254296638071537,
        "activation_magnitude_ratio": -0.002598159946501255,
        "activation_dot_product": 0.0019810758531093597,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.03631575033068657,
        "encoder_gradient_dot_product": 0.0016058655455708504,
        "input_gradient_cosine_similarity": 0.002502165036275983,
        "input_gradient_l2_distance": -0.0267636738717556,
        "input_gradient_dot_product": -0.005458910018205643
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7120543569915314,
      "val_r": 0.7345470694528385,
      "n_iterations": 201,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.0017782171489670873,
        "interaction_matrix_overlap_top_k": 0.0013067340478301048,
        "interaction_matrix_overlap_bottom_k": -0.001181404571980238,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0013212535995990038,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0017322173807770014,
        "layerwise_effective_rank": -0.0010333836544305086,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0020167632028460503,
        "task_vector_dot_product": -0.002237907610833645,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0014868632424622774,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.002249185461550951,
        "right_subspace_overlap": 0.0026235952973365784,
        "activation_l2_distance": 0.00240729539655149,
        "activation_cosine_similarity": 0.012551973573863506,
        "activation_magnitude_ratio": -0.001923061441630125,
        "activation_dot_product": 0.0022060764022171497,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.023044977337121964,
        "encoder_gradient_dot_product": -0.001074282918125391,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010508600622415543,
        "input_gradient_dot_product": -0.006413630209863186
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7490220919379982,
      "val_r": 0.7453313871292506,
      "n_iterations": 352,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002335015218704939,
        "right_subspace_overlap_bottom_k": -0.004927630536258221,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.0016286910977214575,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0015210808487609029,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010510787833482027,
        "task_vector_cosine_similarity": -0.0012538013979792595,
        "task_vector_l2_distance": -0.0029613724909722805,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0015555165009573102,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005444171838462353,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.012263309210538864,
        "activation_magnitude_ratio": -0.0015438786940649152,
        "activation_dot_product": -0.0010850277030840516,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.022303704172372818,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0025980209466069937,
        "input_gradient_l2_distance": -0.012941693887114525,
        "input_gradient_dot_product": -0.0022370892111212015
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6963257341040913,
      "val_r": 0.6990494955784806,
      "n_iterations": 362,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007211118936538696,
        "right_subspace_overlap_bottom_k": -0.01310938410460949,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.0029290392994880676,
        "effective_rank": -0.002138542477041483,
        "effective_rank_mergeability_score": 0.002165574347600341,
        "stable_rank": -0.002230934565886855,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.001130574382841587,
        "layerwise_effective_rank": -0.002937863813713193,
        "layerwise_effective_rank_mergeability_score": 0.003198445774614811,
        "task_vector_cosine_similarity": -0.00263264705426991,
        "task_vector_l2_distance": -0.006533414125442505,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0024168952368199825,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0010653652716428041,
        "subspace_overlap": -0.0025370363146066666,
        "right_subspace_overlap": 0.0065771122463047504,
        "activation_l2_distance": -0.0015108167426660657,
        "activation_cosine_similarity": 0.011037271469831467,
        "activation_magnitude_ratio": -0.00744458707049489,
        "activation_dot_product": 0.018945403397083282,
        "encoder_gradient_cosine_similarity": -0.0021738128270953894,
        "encoder_gradient_l2_distance": -0.03698243945837021,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.04434309899806976,
        "input_gradient_dot_product": -0.004918564576655626
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7372174208162828,
      "val_r": 0.7753947697783279,
      "n_iterations": 346,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005462018772959709,
        "right_subspace_overlap_bottom_k": -0.007268066518008709,
        "interaction_matrix_overlap_top_k": -0.0012512210523709655,
        "interaction_matrix_overlap_bottom_k": 0.003868637839332223,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.003752325428649783,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.004096112214028835,
        "activation_l2_distance": -0.004041851498186588,
        "activation_cosine_similarity": 0.00587376207113266,
        "activation_magnitude_ratio": -0.0038540896493941545,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0013166820863261819,
        "encoder_gradient_l2_distance": -0.014740494079887867,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0013467947719618678,
        "input_gradient_l2_distance": -0.01183545682579279,
        "input_gradient_dot_product": -0.0019522984512150288
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7429031056975902,
      "val_r": 0.7079855365335811,
      "n_iterations": 184,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003172781551256776,
        "right_subspace_overlap_bottom_k": -0.005626234225928783,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.001131538301706314,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0010951189324259758,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0014780198689550161,
        "layerwise_effective_rank": -0.001374860992655158,
        "layerwise_effective_rank_mergeability_score": 0.001274349633604288,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0031330029014497995,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0013606806751340628,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.003626270452514291,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.003600532654672861,
        "activation_cosine_similarity": 0.007075885310769081,
        "activation_magnitude_ratio": -0.0022692426573485136,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0028929715044796467,
        "encoder_gradient_l2_distance": -0.011354279704391956,
        "encoder_gradient_dot_product": 0.0014043329283595085,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.008439039811491966,
        "input_gradient_dot_product": -0.0027027695905417204
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.711639841025607,
      "val_r": 0.44336522999881833,
      "n_iterations": 258,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010054366663098335,
        "right_subspace_overlap_bottom_k": -0.01615528203547001,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.0015504604671150446,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.001319420407526195,
        "stable_rank": -0.001600738032720983,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0035055375192314386,
        "task_vector_l2_distance": -0.007660426199436188,
        "task_vector_dot_product": -0.0012952093966305256,
        "weight_space_angle": -0.0039044786244630814,
        "task_vector_magnitude_ratio": -0.0011620367877185345,
        "singular_value_overlap": 0.010733304545283318,
        "subspace_overlap": 0.004490875173360109,
        "right_subspace_overlap": 0.011563366279006004,
        "activation_l2_distance": -0.006445854436606169,
        "activation_cosine_similarity": 0.021804848685860634,
        "activation_magnitude_ratio": 0.005524040199816227,
        "activation_dot_product": 0.007254992611706257,
        "encoder_gradient_cosine_similarity": 0.005949615966528654,
        "encoder_gradient_l2_distance": -0.05869036540389061,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.059116534888744354,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6906306037295854,
      "val_r": 0.28008712394749946,
      "n_iterations": 182,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010399539023637772,
        "right_subspace_overlap_bottom_k": -0.008144683204591274,
        "interaction_matrix_overlap_top_k": 0.0018154419958591461,
        "interaction_matrix_overlap_bottom_k": 0.001551143010146916,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0011272861156612635,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0013704168377444148,
        "task_vector_l2_distance": -0.006208081729710102,
        "task_vector_dot_product": -0.0026863226667046547,
        "weight_space_angle": 0.0032166303135454655,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0010546661214902997,
        "right_subspace_overlap": 0.007008115760982037,
        "activation_l2_distance": -0.0035006124526262283,
        "activation_cosine_similarity": 0.010846312157809734,
        "activation_magnitude_ratio": -0.0015101071912795305,
        "activation_dot_product": 0.0024909661151468754,
        "encoder_gradient_cosine_similarity": 0.003228895366191864,
        "encoder_gradient_l2_distance": -0.026546437293291092,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.017432304099202156,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7421264779881397,
      "val_r": 0.32514149979641216,
      "n_iterations": 245,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006884252652525902,
        "right_subspace_overlap_bottom_k": -0.0129082715138793,
        "interaction_matrix_overlap_top_k": 0.00552317826077342,
        "interaction_matrix_overlap_bottom_k": -0.0013613314367830753,
        "effective_rank": -0.0021951664239168167,
        "effective_rank_mergeability_score": 0.004040190484374762,
        "stable_rank": -0.0022860351018607616,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0036802974063903093,
        "layerwise_effective_rank_mergeability_score": 0.0033415481448173523,
        "task_vector_cosine_similarity": -0.004138464108109474,
        "task_vector_l2_distance": -0.0038520931266248226,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0033449125476181507,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0010621591936796904,
        "right_subspace_overlap": 0.006382728461176157,
        "activation_l2_distance": -0.004896563943475485,
        "activation_cosine_similarity": 0.014415232464671135,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.003159543266519904,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.033173829317092896,
        "encoder_gradient_dot_product": 0.002110685920342803,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03022642992436886,
        "input_gradient_dot_product": -0.007203240878880024
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7092050424315637,
      "val_r": 0.6619421841626209,
      "n_iterations": 204,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007671755738556385,
        "right_subspace_overlap_bottom_k": -0.011548801325261593,
        "interaction_matrix_overlap_top_k": 0.007027201354503632,
        "interaction_matrix_overlap_bottom_k": -0.0028668236918747425,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0012139265891164541,
        "stable_rank": -0.001110621728003025,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0016721533611416817,
        "task_vector_cosine_similarity": -0.0033443481661379337,
        "task_vector_l2_distance": -0.009238621219992638,
        "task_vector_dot_product": -0.0028063426725566387,
        "weight_space_angle": 0.005879449192434549,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0018323555123060942,
        "right_subspace_overlap": 0.004517781548202038,
        "activation_l2_distance": 0.0015341260004788637,
        "activation_cosine_similarity": -0.002358352765440941,
        "activation_magnitude_ratio": -0.0017736625159159303,
        "activation_dot_product": -0.003683757269755006,
        "encoder_gradient_cosine_similarity": 0.0012695660116150975,
        "encoder_gradient_l2_distance": -0.03571387007832527,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.00220216391608119,
        "input_gradient_l2_distance": -0.036335378885269165,
        "input_gradient_dot_product": -0.0038228286430239677
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7548584089287705,
      "val_r": 0.15509635174227562,
      "n_iterations": 209,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005043752957135439,
        "right_subspace_overlap_bottom_k": -0.004038091283291578,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.001514483941718936,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0011927869636565447,
        "task_vector_l2_distance": -0.002915172139182687,
        "task_vector_dot_product": -0.0035294590052217245,
        "weight_space_angle": -0.0012348243035376072,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0022567424457520247,
        "activation_cosine_similarity": 0.010790357366204262,
        "activation_magnitude_ratio": -0.003243571612983942,
        "activation_dot_product": 0.0010443661594763398,
        "encoder_gradient_cosine_similarity": 0.0032466158736497164,
        "encoder_gradient_l2_distance": -0.01851687766611576,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005240581929683685,
        "input_gradient_dot_product": -0.0028288690373301506
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7370003410753476,
      "val_r": 0.7195878714971773,
      "n_iterations": 402,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005679874215275049,
        "right_subspace_overlap_bottom_k": -0.0073757171630859375,
        "interaction_matrix_overlap_top_k": 0.0013404058991000056,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010896155145019293,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.001202290179207921,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.002638746751472354,
        "right_subspace_overlap": 0.0017428849823772907,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.011738738045096397,
        "activation_magnitude_ratio": -0.0023257285356521606,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.001752082840539515,
        "encoder_gradient_l2_distance": -0.024661622941493988,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.014047395437955856,
        "input_gradient_dot_product": -0.00256907707080245
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7191416390116987,
      "val_r": 0.7624549183763883,
      "n_iterations": 209,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0014541004784405231,
        "right_subspace_overlap_bottom_k": -0.00716800382360816,
        "interaction_matrix_overlap_top_k": 0.00117532501462847,
        "interaction_matrix_overlap_bottom_k": -0.002325912471860647,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0020177909173071384,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.004068927839398384,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0017483500996604562,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0015317999059334397,
        "right_subspace_overlap": 0.004004692658782005,
        "activation_l2_distance": -0.005424811039119959,
        "activation_cosine_similarity": 0.011370365507900715,
        "activation_magnitude_ratio": -0.0010379136074334383,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.005966357886791229,
        "encoder_gradient_l2_distance": -0.025538237765431404,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.004050276707857847,
        "input_gradient_l2_distance": -0.020463602617383003,
        "input_gradient_dot_product": -0.007505952846258879
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.712521014522835,
      "val_r": 0.7548653927281552,
      "n_iterations": 286,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005539420526474714,
        "right_subspace_overlap_bottom_k": -0.0058557442389428616,
        "interaction_matrix_overlap_top_k": 0.003372043138369918,
        "interaction_matrix_overlap_bottom_k": -0.0024496472906321287,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0015103832120075822,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0013504627859219909,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.001185794360935688,
        "singular_value_overlap": 0.0026224192697554827,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.004216058179736137,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.01045199204236269,
        "activation_magnitude_ratio": -0.0017180072609335184,
        "activation_dot_product": 0.003187564667314291,
        "encoder_gradient_cosine_similarity": 0.0029253684915602207,
        "encoder_gradient_l2_distance": -0.015568162314593792,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.009246883913874626,
        "input_gradient_dot_product": -0.0041497377678751945
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7308353472578193,
      "val_r": 0.7465830213193351,
      "n_iterations": 314,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0019079695921391249,
        "right_subspace_overlap_bottom_k": -0.010504363104701042,
        "interaction_matrix_overlap_top_k": 0.003439404536038637,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.001291878055781126,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.004172000102698803,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0016610368620604277,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.00198942213319242,
        "right_subspace_overlap": 0.00525627238675952,
        "activation_l2_distance": -0.004582843277603388,
        "activation_cosine_similarity": 0.016771679744124413,
        "activation_magnitude_ratio": -0.0016637388616800308,
        "activation_dot_product": -0.0019748916383832693,
        "encoder_gradient_cosine_similarity": 0.0013073517475277185,
        "encoder_gradient_l2_distance": -0.029658062383532524,
        "encoder_gradient_dot_product": 0.002269571181386709,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.026318933814764023,
        "input_gradient_dot_product": -0.0034264251589775085
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7578084573307552,
      "val_r": 0.2713992810916517,
      "n_iterations": 254,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003711894853040576,
        "right_subspace_overlap_bottom_k": -0.006183141376823187,
        "interaction_matrix_overlap_top_k": 0.0029463947284966707,
        "interaction_matrix_overlap_bottom_k": 0.001910249819047749,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0010449578985571861,
        "task_vector_l2_distance": -0.0031339118722826242,
        "task_vector_dot_product": -0.0033547827042639256,
        "weight_space_angle": 0.0026013997849076986,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.004189696162939072,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0050026290118694305,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.00552396010607481,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0015798253007233143,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.015431406907737255,
        "encoder_gradient_dot_product": 0.0021611482370644808,
        "input_gradient_cosine_similarity": 0.0021344893611967564,
        "input_gradient_l2_distance": -0.007154466118663549,
        "input_gradient_dot_product": -0.006301587913185358
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7498605563649172,
      "val_r": 0.7163676589405585,
      "n_iterations": 239,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00916201714426279,
        "right_subspace_overlap_bottom_k": -0.007592316251248121,
        "interaction_matrix_overlap_top_k": 0.004637566860765219,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.001154064666479826,
        "layerwise_effective_rank_mergeability_score": 0.0010019266046583652,
        "task_vector_cosine_similarity": -0.001023646560497582,
        "task_vector_l2_distance": -0.006232148967683315,
        "task_vector_dot_product": -0.0033140024170279503,
        "weight_space_angle": 0.001857350580394268,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0012373242061585188,
        "right_subspace_overlap": 0.004218777641654015,
        "activation_l2_distance": -0.0025808727368712425,
        "activation_cosine_similarity": 0.005291348788887262,
        "activation_magnitude_ratio": -0.0015171397244557738,
        "activation_dot_product": 0.006660662591457367,
        "encoder_gradient_cosine_similarity": 0.002311134710907936,
        "encoder_gradient_l2_distance": -0.021714840084314346,
        "encoder_gradient_dot_product": 0.002462234813719988,
        "input_gradient_cosine_similarity": 0.0038369635585695505,
        "input_gradient_l2_distance": -0.018113460391759872,
        "input_gradient_dot_product": -0.0058984821662306786
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.45753214345728044,
      "val_r": 0.32041893222130086,
      "n_iterations": 409,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.009452849626541138,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.001109507866203785,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0014869080623611808,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003928965888917446,
        "layerwise_effective_rank_mergeability_score": 0.0012053628452122211,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0027589979581534863,
        "task_vector_dot_product": -0.0032498687505722046,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0011452873004600406,
        "singular_value_overlap": -0.0011619104770943522,
        "subspace_overlap": -0.0012793560745194554,
        "right_subspace_overlap": 0.0028976015746593475,
        "activation_l2_distance": 0.0036557884886860847,
        "activation_cosine_similarity": 0.004957815166562796,
        "activation_magnitude_ratio": -0.003330943640321493,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.001994813559576869,
        "encoder_gradient_l2_distance": -0.008795679546892643,
        "encoder_gradient_dot_product": 0.0010355694685131311,
        "input_gradient_cosine_similarity": 0.002251974307000637,
        "input_gradient_l2_distance": -0.0066670202650129795,
        "input_gradient_dot_product": -0.0026889946311712265
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7787317134713179,
      "val_r": 0.4828688427270315,
      "n_iterations": 500,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005563536658883095,
        "right_subspace_overlap_bottom_k": -0.014120806939899921,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0013496499741449952,
        "effective_rank": -0.0013458512257784605,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0019460555631667376,
        "layerwise_effective_rank_mergeability_score": 0.003236202523112297,
        "task_vector_cosine_similarity": -0.0065154219046235085,
        "task_vector_l2_distance": -0.0026554642245173454,
        "task_vector_dot_product": -0.0013378177536651492,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0031786286272108555,
        "subspace_overlap": -0.0012030813377350569,
        "right_subspace_overlap": 0.012472288683056831,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.010225385427474976,
        "activation_magnitude_ratio": -0.0010984826367348433,
        "activation_dot_product": 0.00400898139923811,
        "encoder_gradient_cosine_similarity": 0.0018792040646076202,
        "encoder_gradient_l2_distance": -0.02201945148408413,
        "encoder_gradient_dot_product": 0.0017230070661753416,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01877264678478241,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8031573363376444,
      "val_r": 0.6823923383461539,
      "n_iterations": 242,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0013653264613822103,
        "right_subspace_overlap_bottom_k": -0.003398091997951269,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0011565500171855092,
        "singular_value_ratio": -0.0016606446588411927,
        "layerwise_effective_rank": -0.001079166424460709,
        "layerwise_effective_rank_mergeability_score": 0.0011502656852826476,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009282066486775875,
        "task_vector_dot_product": -0.0033878525719046593,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0015326421707868576,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0017503122799098492,
        "activation_l2_distance": -0.006061220541596413,
        "activation_cosine_similarity": 0.003769893432036042,
        "activation_magnitude_ratio": 0.0013124305987730622,
        "activation_dot_product": 0.013993466272950172,
        "encoder_gradient_cosine_similarity": -0.0016268800245597959,
        "encoder_gradient_l2_distance": -0.03308041766285896,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.027001911774277687,
        "input_gradient_dot_product": 0.0
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.0,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}