{
  "aggregate_metrics": {
    "train_r": 0.4557282076370771,
    "train_p": 5.146595948054024e-165,
    "val_r": 0.27141243516009533,
    "val_p": 1.831946481750803e-07
  },
  "per_fold_stats": {
    "train_r_mean": 0.6957871077210825,
    "train_r_std": 0.05831337519053379,
    "val_r_mean": 0.5691189262549902,
    "val_r_std": 0.20546519629445137,
    "n_nonzero_mean": 17.45,
    "n_nonzero_std": 4.421255477802657
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.003440088825300336,
    "right_subspace_overlap_bottom_k": -0.0050061726942658424,
    "interaction_matrix_overlap_top_k": 0.0010014972649514675,
    "interaction_matrix_overlap_bottom_k": -0.0007062021177262068,
    "effective_rank": -0.000304471148410812,
    "effective_rank_mergeability_score": 0.0004592047189362347,
    "stable_rank": -0.00028873616247437894,
    "spectral_gap": 6.75459232297726e-05,
    "singular_value_ratio": 5.198568760533817e-05,
    "layerwise_effective_rank": -0.0002172522945329547,
    "layerwise_effective_rank_mergeability_score": 0.00032226656912826,
    "task_vector_cosine_similarity": 0.0005429887096397579,
    "task_vector_l2_distance": -0.0026038421783596277,
    "task_vector_dot_product": -0.0002590496151242405,
    "weight_space_angle": -0.00027257512556388974,
    "task_vector_magnitude_ratio": -0.00022580446966458112,
    "singular_value_overlap": 0.00038106634747236967,
    "subspace_overlap": 0.0008056505466811359,
    "right_subspace_overlap": 0.003626534715294838,
    "activation_l2_distance": -0.0009883544407784939,
    "activation_cosine_similarity": 0.006743554025888443,
    "activation_magnitude_ratio": -0.002331316005438566,
    "activation_dot_product": 0.0033116801641881466,
    "encoder_gradient_cosine_similarity": 0.0012028670171275735,
    "encoder_gradient_l2_distance": -0.017865829169750214,
    "encoder_gradient_dot_product": 0.0008291208068840206,
    "input_gradient_cosine_similarity": 0.00033528837957419455,
    "input_gradient_l2_distance": -0.013992691412568092,
    "input_gradient_dot_product": -0.00273820455186069
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.003366546705365181,
    "right_subspace_overlap_bottom_k": 0.0034015981946140528,
    "interaction_matrix_overlap_top_k": 0.002616550074890256,
    "interaction_matrix_overlap_bottom_k": 0.002596808597445488,
    "effective_rank": 0.0007320456206798553,
    "effective_rank_mergeability_score": 0.0008119079866446555,
    "stable_rank": 0.0009456192492507398,
    "spectral_gap": 0.000740517454687506,
    "singular_value_ratio": 0.0007013955037109554,
    "layerwise_effective_rank": 0.0006724948179908097,
    "layerwise_effective_rank_mergeability_score": 0.0010542802046984434,
    "task_vector_cosine_similarity": 0.002149622654542327,
    "task_vector_l2_distance": 0.0028996088076382875,
    "task_vector_dot_product": 0.0017304944340139627,
    "weight_space_angle": 0.0016133935423567891,
    "task_vector_magnitude_ratio": 0.0007149576558731496,
    "singular_value_overlap": 0.0019878160674124956,
    "subspace_overlap": 0.001510938978753984,
    "right_subspace_overlap": 0.0025084505323320627,
    "activation_l2_distance": 0.002454506466165185,
    "activation_cosine_similarity": 0.0028035962022840977,
    "activation_magnitude_ratio": 0.002009281422942877,
    "activation_dot_product": 0.004021612927317619,
    "encoder_gradient_cosine_similarity": 0.0013135728659108281,
    "encoder_gradient_l2_distance": 0.007353480905294418,
    "encoder_gradient_dot_product": 0.0018998866435140371,
    "input_gradient_cosine_similarity": 0.0012890950310975313,
    "input_gradient_l2_distance": 0.009620732627809048,
    "input_gradient_dot_product": 0.0019144000252708793
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.9,
    "right_subspace_overlap_bottom_k": 0.9,
    "interaction_matrix_overlap_top_k": 0.6,
    "interaction_matrix_overlap_bottom_k": 0.5,
    "effective_rank": 0.3,
    "effective_rank_mergeability_score": 0.4,
    "stable_rank": 0.35,
    "spectral_gap": 0.3,
    "singular_value_ratio": 0.2,
    "layerwise_effective_rank": 0.25,
    "layerwise_effective_rank_mergeability_score": 0.55,
    "task_vector_cosine_similarity": 0.5,
    "task_vector_l2_distance": 0.75,
    "task_vector_dot_product": 0.6,
    "weight_space_angle": 0.55,
    "task_vector_magnitude_ratio": 0.25,
    "singular_value_overlap": 0.5,
    "subspace_overlap": 0.5,
    "right_subspace_overlap": 0.8,
    "activation_l2_distance": 0.65,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.9,
    "activation_dot_product": 0.8,
    "encoder_gradient_cosine_similarity": 0.55,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.6,
    "input_gradient_cosine_similarity": 0.45,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.8
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6751808718075067,
      "val_r": 0.49944589229558206,
      "n_iterations": 431,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025672190822660923,
        "right_subspace_overlap_bottom_k": -0.004424589686095715,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.004327862523496151,
        "effective_rank": -0.001693223835900426,
        "effective_rank_mergeability_score": 0.0017097459640353918,
        "stable_rank": -0.002491241553798318,
        "spectral_gap": 0.00107980752363801,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0014363229274749756,
        "layerwise_effective_rank_mergeability_score": 0.0013544013490900397,
        "task_vector_cosine_similarity": -0.0029177742544561625,
        "task_vector_l2_distance": -0.0014760743360966444,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0014968104660511017,
        "singular_value_overlap": -0.0017919163219630718,
        "subspace_overlap": 0.0016147292917594314,
        "right_subspace_overlap": 0.005554453935474157,
        "activation_l2_distance": -0.004002803470939398,
        "activation_cosine_similarity": 0.010354415513575077,
        "activation_magnitude_ratio": -0.005333344452083111,
        "activation_dot_product": 0.00646579172462225,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.021622436121106148,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0010755958501249552,
        "input_gradient_l2_distance": -0.016613027080893517,
        "input_gradient_dot_product": -0.003777311183512211
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6523009254648608,
      "val_r": 0.7668672322617485,
      "n_iterations": 235,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003196500241756439,
        "right_subspace_overlap_bottom_k": -0.008264994248747826,
        "interaction_matrix_overlap_top_k": 0.0018034807872027159,
        "interaction_matrix_overlap_bottom_k": -0.003135697916150093,
        "effective_rank": -0.001204678788781166,
        "effective_rank_mergeability_score": 0.0010354924015700817,
        "stable_rank": -0.0018009106861427426,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0017501703696325421,
        "task_vector_cosine_similarity": 0.0028765557799488306,
        "task_vector_l2_distance": -0.0025726810563355684,
        "task_vector_dot_product": -0.002684379927814007,
        "weight_space_angle": -0.0024477653205394745,
        "task_vector_magnitude_ratio": -0.00180247169919312,
        "singular_value_overlap": 0.0019575273618102074,
        "subspace_overlap": 0.0016402511391788721,
        "right_subspace_overlap": 0.004735142923891544,
        "activation_l2_distance": -0.0011884174309670925,
        "activation_cosine_similarity": 0.007294060196727514,
        "activation_magnitude_ratio": -0.001830513821914792,
        "activation_dot_product": 0.0036640085745602846,
        "encoder_gradient_cosine_similarity": 0.0037540942430496216,
        "encoder_gradient_l2_distance": -0.013581927865743637,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.009771141223609447,
        "input_gradient_dot_product": -0.0032579628750681877
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6981424638340211,
      "val_r": 0.5699977630067239,
      "n_iterations": 318,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0035384423099458218,
        "right_subspace_overlap_bottom_k": 0.0010973610915243626,
        "interaction_matrix_overlap_top_k": 0.005608427803963423,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0024944706819951534,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.007876494899392128,
        "task_vector_dot_product": 0.0010652844794094563,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.003963980358093977,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.007403814233839512,
        "activation_cosine_similarity": 0.007718449924141169,
        "activation_magnitude_ratio": -0.0043665384873747826,
        "activation_dot_product": 0.003104198258370161,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.024386253207921982,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.025219334289431572,
        "input_gradient_dot_product": -0.004597917664796114
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.707829840427302,
      "val_r": 0.6803638852613404,
      "n_iterations": 215,
      "n_nonzero_coefficients": 11,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.005078287795186043,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.004851364530622959,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0011941168922930956,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0057020848616957664,
        "activation_l2_distance": -0.004324705805629492,
        "activation_cosine_similarity": 0.003336439374834299,
        "activation_magnitude_ratio": -0.005221642088145018,
        "activation_dot_product": 0.0020045058336108923,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.016678979620337486,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010981264524161816,
        "input_gradient_dot_product": -0.003616458736360073
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7392049587558165,
      "val_r": 0.7625057246300342,
      "n_iterations": 269,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0030598281882703304,
        "right_subspace_overlap_bottom_k": -0.004729042761027813,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.003025238635018468,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010302374139428139,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.003345282981172204,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.007183391135185957,
        "activation_magnitude_ratio": -0.0019618412479758263,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0016503450460731983,
        "encoder_gradient_l2_distance": -0.01239387970417738,
        "encoder_gradient_dot_product": 0.0013179467059671879,
        "input_gradient_cosine_similarity": 0.0016065954696387053,
        "input_gradient_l2_distance": -0.007284520659595728,
        "input_gradient_dot_product": -0.0010038388427346945
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.734189566816991,
      "val_r": 0.6805387466685138,
      "n_iterations": 321,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0026339853648096323,
        "right_subspace_overlap_bottom_k": -0.0031394255347549915,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.0014572555664926767,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0034291697666049004,
        "task_vector_l2_distance": -0.0018916005501523614,
        "task_vector_dot_product": -0.0014147722395136952,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0038300324231386185,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.007418851833790541,
        "activation_magnitude_ratio": -0.001773237599991262,
        "activation_dot_product": 0.0016644243150949478,
        "encoder_gradient_cosine_similarity": 0.003746610600501299,
        "encoder_gradient_l2_distance": -0.016680167987942696,
        "encoder_gradient_dot_product": -0.0010169411543756723,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005629167892038822,
        "input_gradient_dot_product": -0.004283955320715904
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7230455940979084,
      "val_r": 0.43167183079772586,
      "n_iterations": 296,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0013963145902380347,
        "right_subspace_overlap_bottom_k": -0.008785824291408062,
        "interaction_matrix_overlap_top_k": 0.004383638501167297,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.00226769526489079,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0039834375493228436,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.006239918991923332,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.004281810950487852,
        "encoder_gradient_cosine_similarity": 0.002381074707955122,
        "encoder_gradient_l2_distance": -0.018038146197795868,
        "encoder_gradient_dot_product": 0.0011047270381823182,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01172672864049673,
        "input_gradient_dot_product": -0.005479619838297367
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7000514136652616,
      "val_r": 0.3475733195475303,
      "n_iterations": 172,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00679611274972558,
        "right_subspace_overlap_bottom_k": -0.005937065929174423,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0015233473386615515,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0012474264949560165,
        "task_vector_cosine_similarity": 0.0016595146153122187,
        "task_vector_l2_distance": -0.003619971452280879,
        "task_vector_dot_product": -0.0013320611324161291,
        "weight_space_angle": -0.002174416556954384,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0011156618129462004,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0031381254084408283,
        "activation_l2_distance": -0.0014928552554920316,
        "activation_cosine_similarity": 0.006923635955899954,
        "activation_magnitude_ratio": -0.0033061360009014606,
        "activation_dot_product": 0.0028029230888932943,
        "encoder_gradient_cosine_similarity": 0.003511369926854968,
        "encoder_gradient_l2_distance": -0.01663525402545929,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0030393118504434824,
        "input_gradient_l2_distance": -0.007450274657458067,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7477814025903287,
      "val_r": 0.30367445539356297,
      "n_iterations": 390,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003220587968826294,
        "right_subspace_overlap_bottom_k": -0.005581643432378769,
        "interaction_matrix_overlap_top_k": -0.0010975683107972145,
        "interaction_matrix_overlap_bottom_k": -0.001751987379975617,
        "effective_rank": -0.001155761070549488,
        "effective_rank_mergeability_score": 0.0014504431746900082,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0013425133656710386,
        "layerwise_effective_rank_mergeability_score": 0.0014553675428032875,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.002216313499957323,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0016438813181594014,
        "right_subspace_overlap": 0.0051809451542794704,
        "activation_l2_distance": 0.0011379660572856665,
        "activation_cosine_similarity": 0.009228291921317577,
        "activation_magnitude_ratio": -0.0012883724411949515,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0010366030037403107,
        "encoder_gradient_l2_distance": -0.010172666050493717,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.008675183169543743,
        "input_gradient_dot_product": -0.0017569898627698421
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6938580959412699,
      "val_r": 0.7043212314075438,
      "n_iterations": 222,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0012786410516127944,
        "right_subspace_overlap_bottom_k": -0.0035034161992371082,
        "interaction_matrix_overlap_top_k": -0.0015837126411497593,
        "interaction_matrix_overlap_bottom_k": 0.001765172346495092,
        "effective_rank": -0.001883053919300437,
        "effective_rank_mergeability_score": 0.0013651323970407248,
        "stable_rank": -0.0011614777613431215,
        "spectral_gap": 0.0011344450758770108,
        "singular_value_ratio": -0.0013207989977672696,
        "layerwise_effective_rank": -0.0017019128426909447,
        "layerwise_effective_rank_mergeability_score": 0.0014913998311385512,
        "task_vector_cosine_similarity": 0.0027351034805178642,
        "task_vector_l2_distance": -0.008962634950876236,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001160198706202209,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.002384900813922286,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0013440256007015705,
        "activation_cosine_similarity": -0.0018559497548267245,
        "activation_magnitude_ratio": -0.0025113809388130903,
        "activation_dot_product": -0.0038332203403115273,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.03735797852277756,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.04122008755803108,
        "input_gradient_dot_product": -0.003994918428361416
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7445281900081,
      "val_r": 0.18662460953836524,
      "n_iterations": 336,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006351863034069538,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.0017060277750715613,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0012379365507513285,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0023220940493047237,
        "task_vector_dot_product": -0.0012786962324753404,
        "weight_space_angle": 0.0012027223128825426,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.00809512846171856,
        "activation_magnitude_ratio": -0.0030076720286160707,
        "activation_dot_product": 0.0027556123677641153,
        "encoder_gradient_cosine_similarity": 0.0010740343714132905,
        "encoder_gradient_l2_distance": -0.011272636242210865,
        "encoder_gradient_dot_product": 0.0013759947614744306,
        "input_gradient_cosine_similarity": -0.0010545694967731833,
        "input_gradient_l2_distance": -0.010413240641355515,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7193196148634391,
      "val_r": 0.7269676833640235,
      "n_iterations": 193,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0069041806273162365,
        "right_subspace_overlap_bottom_k": -0.01211527455598116,
        "interaction_matrix_overlap_top_k": -0.0029375525191426277,
        "interaction_matrix_overlap_bottom_k": 0.0033826425205916166,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0022828057408332825,
        "stable_rank": -0.0013878633035346866,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0012611030833795667,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0011086361482739449,
        "task_vector_cosine_similarity": -0.004908127710223198,
        "task_vector_l2_distance": -0.0023788828402757645,
        "task_vector_dot_product": -0.0048544742166996,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0017876101192086935,
        "right_subspace_overlap": 0.006671993061900139,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.005095062777400017,
        "activation_magnitude_ratio": -0.001706290990114212,
        "activation_dot_product": 0.005331417080014944,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.025983154773712158,
        "encoder_gradient_dot_product": 0.0020847967825829983,
        "input_gradient_cosine_similarity": 0.002179676666855812,
        "input_gradient_l2_distance": -0.019747115671634674,
        "input_gradient_dot_product": -0.001707881805486977
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6799764310852981,
      "val_r": 0.6902299819946306,
      "n_iterations": 371,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003484461922198534,
        "right_subspace_overlap_bottom_k": -0.0012703543761745095,
        "interaction_matrix_overlap_top_k": 0.001583591802045703,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0012171610724180937,
        "spectral_gap": -0.0011857720091938972,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0034941029734909534,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.002938436344265938,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0020507159642875195,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0067823040299117565,
        "activation_magnitude_ratio": -0.0024041070137172937,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0022900807671248913,
        "encoder_gradient_l2_distance": -0.00898075383156538,
        "encoder_gradient_dot_product": 0.0014265691861510277,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.007580230478197336,
        "input_gradient_dot_product": -0.006430169567465782
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6918910299495051,
      "val_r": 0.8174873576775264,
      "n_iterations": 196,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0035765215288847685,
        "right_subspace_overlap_bottom_k": -0.00514595303684473,
        "interaction_matrix_overlap_top_k": 0.00259309820830822,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010708445915952325,
        "task_vector_cosine_similarity": -0.0016587870195508003,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0030622752383351326,
        "weight_space_angle": -0.0026638733688741922,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0032850601710379124,
        "right_subspace_overlap": 0.0057960692793130875,
        "activation_l2_distance": 0.0012127060908824205,
        "activation_cosine_similarity": 0.007573112845420837,
        "activation_magnitude_ratio": -0.0026986622251570225,
        "activation_dot_product": 0.005990568082779646,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.01301355380564928,
        "encoder_gradient_dot_product": 0.0029994247015565634,
        "input_gradient_cosine_similarity": -0.0010608816519379616,
        "input_gradient_l2_distance": -0.007627448998391628,
        "input_gradient_dot_product": -0.003416722873225808
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7131918990910228,
      "val_r": 0.7602928224069363,
      "n_iterations": 229,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007285463623702526,
        "right_subspace_overlap_bottom_k": -0.010764535516500473,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0020739075262099504,
        "effective_rank": -0.00137255375739187,
        "effective_rank_mergeability_score": 0.0012108972296118736,
        "stable_rank": -0.0017082509584724903,
        "spectral_gap": 0.0013152729952707887,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0012005874887108803,
        "layerwise_effective_rank_mergeability_score": 0.0016788970679044724,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.007203814573585987,
        "task_vector_dot_product": -0.0018934332765638828,
        "weight_space_angle": 0.0010044934460893273,
        "task_vector_magnitude_ratio": -0.0015125605277717113,
        "singular_value_overlap": 0.003323872108012438,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0028109815903007984,
        "activation_l2_distance": -0.0019388552755117416,
        "activation_cosine_similarity": 0.012181789614260197,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.01060065720230341,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.02994215115904808,
        "encoder_gradient_dot_product": -0.0017253069672733545,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.02955150231719017,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7708659963260581,
      "val_r": 0.592085037019595,
      "n_iterations": 179,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0032670414075255394,
        "right_subspace_overlap_bottom_k": -0.004316915757954121,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010233053471893072,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0032553640194237232,
        "task_vector_dot_product": 0.001515815150924027,
        "weight_space_angle": 0.0032347054220736027,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0027554333209991455,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0014116273960098624,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0064491992816329,
        "activation_magnitude_ratio": -0.003111689817160368,
        "activation_dot_product": -0.0015807503368705511,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.01448154728859663,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005288081709295511,
        "input_gradient_dot_product": -0.0015081650344654918
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5455857302253044,
      "val_r": 0.4726432499224851,
      "n_iterations": 201,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00335569866001606,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0055658211931586266,
        "interaction_matrix_overlap_bottom_k": -0.003311408683657646,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0015578599413856864,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0018213354051113129,
        "layerwise_effective_rank": 0.001336290966719389,
        "layerwise_effective_rank_mergeability_score": -0.0010233742650598288,
        "task_vector_cosine_similarity": 0.0021887437906116247,
        "task_vector_l2_distance": 0.0012354664504528046,
        "task_vector_dot_product": -0.0010640054242685437,
        "weight_space_angle": -0.002476703841239214,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0021821341942995787,
        "subspace_overlap": 0.0010532417800277472,
        "right_subspace_overlap": 0.008825995028018951,
        "activation_l2_distance": 0.0011721453629434109,
        "activation_cosine_similarity": 0.007468619849532843,
        "activation_magnitude_ratio": -0.0010720170103013515,
        "activation_dot_product": 0.001404851209372282,
        "encoder_gradient_cosine_similarity": 0.001569579471834004,
        "encoder_gradient_l2_distance": -0.011827435344457626,
        "encoder_gradient_dot_product": 0.0026839652564376593,
        "input_gradient_cosine_similarity": -0.0028626464772969484,
        "input_gradient_l2_distance": -0.0057301209308207035,
        "input_gradient_dot_product": -0.0015687095001339912
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.70880387071522,
      "val_r": 0.6054197223259259,
      "n_iterations": 310,
      "n_nonzero_coefficients": 10,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.005379674956202507,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.003551453584805131,
        "right_subspace_overlap": 0.0025671774055808783,
        "activation_l2_distance": -0.003254314884543419,
        "activation_cosine_similarity": 0.006335408426821232,
        "activation_magnitude_ratio": -0.0016083703376352787,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.001407048781402409,
        "encoder_gradient_l2_distance": -0.016341913491487503,
        "encoder_gradient_dot_product": 0.0017864448018372059,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.016049081459641457,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5363578103008338,
      "val_r": 0.05767565927696462,
      "n_iterations": 298,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.012629088014364243,
        "right_subspace_overlap_bottom_k": -0.004195877816528082,
        "interaction_matrix_overlap_top_k": 0.006825210060924292,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0012198486365377903,
        "effective_rank_mergeability_score": -0.0011083590798079967,
        "stable_rank": 0.0,
        "spectral_gap": -0.002073877491056919,
        "singular_value_ratio": 0.0018002804135903716,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.003961273469030857,
        "task_vector_l2_distance": 0.0012741864193230867,
        "task_vector_dot_product": 0.002435526344925165,
        "weight_space_angle": -0.0014387787086889148,
        "task_vector_magnitude_ratio": 0.0014559519477188587,
        "singular_value_overlap": 0.004275579005479813,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.006926624104380608,
        "activation_l2_distance": 0.0030929800122976303,
        "activation_cosine_similarity": 0.007941313087940216,
        "activation_magnitude_ratio": 0.0028223046101629734,
        "activation_dot_product": 0.008697658777236938,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011129229329526424,
        "encoder_gradient_dot_product": -0.0022540760692209005,
        "input_gradient_cosine_similarity": 0.001599338254891336,
        "input_gradient_l2_distance": -0.005997458938509226,
        "input_gradient_dot_product": -0.003991913050413132
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7336364484556026,
      "val_r": 0.7259923203030438,
      "n_iterations": 193,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0031828908249735832,
        "right_subspace_overlap_bottom_k": -0.00858792569488287,
        "interaction_matrix_overlap_top_k": -0.0010084602981805801,
        "interaction_matrix_overlap_bottom_k": -0.008884900249540806,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.001081042573787272,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.005150286015123129,
        "task_vector_dot_product": 0.001261929515749216,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.005039219278842211,
        "subspace_overlap": -0.0012368771713227034,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0041211433708667755,
        "activation_cosine_similarity": 0.003107630182057619,
        "activation_magnitude_ratio": -0.006246805656701326,
        "activation_dot_product": 0.0128791444003582,
        "encoder_gradient_cosine_similarity": 0.0016364981420338154,
        "encoder_gradient_l2_distance": -0.026796510443091393,
        "encoder_gradient_dot_product": 0.006798870861530304,
        "input_gradient_cosine_similarity": 0.002183347474783659,
        "input_gradient_l2_distance": -0.02729879505932331,
        "input_gradient_dot_product": -0.004371557384729385
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}