{
  "weight_avg": {
    "aggregate_metrics": {
      "train_r": 0.4557282076370771,
      "train_p": 5.146595948054024e-165,
      "val_r": 0.27141243516009533,
      "val_p": 1.831946481750803e-07
    },
    "per_fold_stats": {
      "train_r_mean": 0.6957871077210825,
      "train_r_std": 0.05831337519053379,
      "val_r_mean": 0.5691189262549902,
      "val_r_std": 0.20546519629445137,
      "n_nonzero_mean": 17.45,
      "n_nonzero_std": 4.421255477802657
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.003440088825300336,
      "right_subspace_overlap_bottom_k": -0.0050061726942658424,
      "interaction_matrix_overlap_top_k": 0.0010014972649514675,
      "interaction_matrix_overlap_bottom_k": -0.0007062021177262068,
      "effective_rank": -0.000304471148410812,
      "effective_rank_mergeability_score": 0.0004592047189362347,
      "stable_rank": -0.00028873616247437894,
      "spectral_gap": 6.75459232297726e-05,
      "singular_value_ratio": 5.198568760533817e-05,
      "layerwise_effective_rank": -0.0002172522945329547,
      "layerwise_effective_rank_mergeability_score": 0.00032226656912826,
      "task_vector_cosine_similarity": 0.0005429887096397579,
      "task_vector_l2_distance": -0.0026038421783596277,
      "task_vector_dot_product": -0.0002590496151242405,
      "weight_space_angle": -0.00027257512556388974,
      "task_vector_magnitude_ratio": -0.00022580446966458112,
      "singular_value_overlap": 0.00038106634747236967,
      "subspace_overlap": 0.0008056505466811359,
      "right_subspace_overlap": 0.003626534715294838,
      "activation_l2_distance": -0.0009883544407784939,
      "activation_cosine_similarity": 0.006743554025888443,
      "activation_magnitude_ratio": -0.002331316005438566,
      "activation_dot_product": 0.0033116801641881466,
      "encoder_gradient_cosine_similarity": 0.0012028670171275735,
      "encoder_gradient_l2_distance": -0.017865829169750214,
      "encoder_gradient_dot_product": 0.0008291208068840206,
      "input_gradient_cosine_similarity": 0.00033528837957419455,
      "input_gradient_l2_distance": -0.013992691412568092,
      "input_gradient_dot_product": -0.00273820455186069
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.003366546705365181,
      "right_subspace_overlap_bottom_k": 0.0034015981946140528,
      "interaction_matrix_overlap_top_k": 0.002616550074890256,
      "interaction_matrix_overlap_bottom_k": 0.002596808597445488,
      "effective_rank": 0.0007320456206798553,
      "effective_rank_mergeability_score": 0.0008119079866446555,
      "stable_rank": 0.0009456192492507398,
      "spectral_gap": 0.000740517454687506,
      "singular_value_ratio": 0.0007013955037109554,
      "layerwise_effective_rank": 0.0006724948179908097,
      "layerwise_effective_rank_mergeability_score": 0.0010542802046984434,
      "task_vector_cosine_similarity": 0.002149622654542327,
      "task_vector_l2_distance": 0.0028996088076382875,
      "task_vector_dot_product": 0.0017304944340139627,
      "weight_space_angle": 0.0016133935423567891,
      "task_vector_magnitude_ratio": 0.0007149576558731496,
      "singular_value_overlap": 0.0019878160674124956,
      "subspace_overlap": 0.001510938978753984,
      "right_subspace_overlap": 0.0025084505323320627,
      "activation_l2_distance": 0.002454506466165185,
      "activation_cosine_similarity": 0.0028035962022840977,
      "activation_magnitude_ratio": 0.002009281422942877,
      "activation_dot_product": 0.004021612927317619,
      "encoder_gradient_cosine_similarity": 0.0013135728659108281,
      "encoder_gradient_l2_distance": 0.007353480905294418,
      "encoder_gradient_dot_product": 0.0018998866435140371,
      "input_gradient_cosine_similarity": 0.0012890950310975313,
      "input_gradient_l2_distance": 0.009620732627809048,
      "input_gradient_dot_product": 0.0019144000252708793
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.9,
      "right_subspace_overlap_bottom_k": 0.9,
      "interaction_matrix_overlap_top_k": 0.6,
      "interaction_matrix_overlap_bottom_k": 0.5,
      "effective_rank": 0.3,
      "effective_rank_mergeability_score": 0.4,
      "stable_rank": 0.35,
      "spectral_gap": 0.3,
      "singular_value_ratio": 0.2,
      "layerwise_effective_rank": 0.25,
      "layerwise_effective_rank_mergeability_score": 0.55,
      "task_vector_cosine_similarity": 0.5,
      "task_vector_l2_distance": 0.75,
      "task_vector_dot_product": 0.6,
      "weight_space_angle": 0.55,
      "task_vector_magnitude_ratio": 0.25,
      "singular_value_overlap": 0.5,
      "subspace_overlap": 0.5,
      "right_subspace_overlap": 0.8,
      "activation_l2_distance": 0.65,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.9,
      "activation_dot_product": 0.8,
      "encoder_gradient_cosine_similarity": 0.55,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.6,
      "input_gradient_cosine_similarity": 0.45,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.8
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6751808718075067,
        "val_r": 0.49944589229558206,
        "n_iterations": 431,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025672190822660923,
          "right_subspace_overlap_bottom_k": -0.004424589686095715,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.004327862523496151,
          "effective_rank": -0.001693223835900426,
          "effective_rank_mergeability_score": 0.0017097459640353918,
          "stable_rank": -0.002491241553798318,
          "spectral_gap": 0.00107980752363801,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0014363229274749756,
          "layerwise_effective_rank_mergeability_score": 0.0013544013490900397,
          "task_vector_cosine_similarity": -0.0029177742544561625,
          "task_vector_l2_distance": -0.0014760743360966444,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0014968104660511017,
          "singular_value_overlap": -0.0017919163219630718,
          "subspace_overlap": 0.0016147292917594314,
          "right_subspace_overlap": 0.005554453935474157,
          "activation_l2_distance": -0.004002803470939398,
          "activation_cosine_similarity": 0.010354415513575077,
          "activation_magnitude_ratio": -0.005333344452083111,
          "activation_dot_product": 0.00646579172462225,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.021622436121106148,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0010755958501249552,
          "input_gradient_l2_distance": -0.016613027080893517,
          "input_gradient_dot_product": -0.003777311183512211
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6523009254648608,
        "val_r": 0.7668672322617485,
        "n_iterations": 235,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003196500241756439,
          "right_subspace_overlap_bottom_k": -0.008264994248747826,
          "interaction_matrix_overlap_top_k": 0.0018034807872027159,
          "interaction_matrix_overlap_bottom_k": -0.003135697916150093,
          "effective_rank": -0.001204678788781166,
          "effective_rank_mergeability_score": 0.0010354924015700817,
          "stable_rank": -0.0018009106861427426,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0017501703696325421,
          "task_vector_cosine_similarity": 0.0028765557799488306,
          "task_vector_l2_distance": -0.0025726810563355684,
          "task_vector_dot_product": -0.002684379927814007,
          "weight_space_angle": -0.0024477653205394745,
          "task_vector_magnitude_ratio": -0.00180247169919312,
          "singular_value_overlap": 0.0019575273618102074,
          "subspace_overlap": 0.0016402511391788721,
          "right_subspace_overlap": 0.004735142923891544,
          "activation_l2_distance": -0.0011884174309670925,
          "activation_cosine_similarity": 0.007294060196727514,
          "activation_magnitude_ratio": -0.001830513821914792,
          "activation_dot_product": 0.0036640085745602846,
          "encoder_gradient_cosine_similarity": 0.0037540942430496216,
          "encoder_gradient_l2_distance": -0.013581927865743637,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.009771141223609447,
          "input_gradient_dot_product": -0.0032579628750681877
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6981424638340211,
        "val_r": 0.5699977630067239,
        "n_iterations": 318,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0035384423099458218,
          "right_subspace_overlap_bottom_k": 0.0010973610915243626,
          "interaction_matrix_overlap_top_k": 0.005608427803963423,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0024944706819951534,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.007876494899392128,
          "task_vector_dot_product": 0.0010652844794094563,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.003963980358093977,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.007403814233839512,
          "activation_cosine_similarity": 0.007718449924141169,
          "activation_magnitude_ratio": -0.0043665384873747826,
          "activation_dot_product": 0.003104198258370161,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.024386253207921982,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.025219334289431572,
          "input_gradient_dot_product": -0.004597917664796114
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.707829840427302,
        "val_r": 0.6803638852613404,
        "n_iterations": 215,
        "n_nonzero_coefficients": 11,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.005078287795186043,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.004851364530622959,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0011941168922930956,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0057020848616957664,
          "activation_l2_distance": -0.004324705805629492,
          "activation_cosine_similarity": 0.003336439374834299,
          "activation_magnitude_ratio": -0.005221642088145018,
          "activation_dot_product": 0.0020045058336108923,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.016678979620337486,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010981264524161816,
          "input_gradient_dot_product": -0.003616458736360073
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7392049587558165,
        "val_r": 0.7625057246300342,
        "n_iterations": 269,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0030598281882703304,
          "right_subspace_overlap_bottom_k": -0.004729042761027813,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.003025238635018468,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010302374139428139,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.003345282981172204,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.007183391135185957,
          "activation_magnitude_ratio": -0.0019618412479758263,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0016503450460731983,
          "encoder_gradient_l2_distance": -0.01239387970417738,
          "encoder_gradient_dot_product": 0.0013179467059671879,
          "input_gradient_cosine_similarity": 0.0016065954696387053,
          "input_gradient_l2_distance": -0.007284520659595728,
          "input_gradient_dot_product": -0.0010038388427346945
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.734189566816991,
        "val_r": 0.6805387466685138,
        "n_iterations": 321,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0026339853648096323,
          "right_subspace_overlap_bottom_k": -0.0031394255347549915,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0014572555664926767,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0034291697666049004,
          "task_vector_l2_distance": -0.0018916005501523614,
          "task_vector_dot_product": -0.0014147722395136952,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0038300324231386185,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.007418851833790541,
          "activation_magnitude_ratio": -0.001773237599991262,
          "activation_dot_product": 0.0016644243150949478,
          "encoder_gradient_cosine_similarity": 0.003746610600501299,
          "encoder_gradient_l2_distance": -0.016680167987942696,
          "encoder_gradient_dot_product": -0.0010169411543756723,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005629167892038822,
          "input_gradient_dot_product": -0.004283955320715904
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7230455940979084,
        "val_r": 0.43167183079772586,
        "n_iterations": 296,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0013963145902380347,
          "right_subspace_overlap_bottom_k": -0.008785824291408062,
          "interaction_matrix_overlap_top_k": 0.004383638501167297,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.00226769526489079,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0039834375493228436,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.006239918991923332,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.004281810950487852,
          "encoder_gradient_cosine_similarity": 0.002381074707955122,
          "encoder_gradient_l2_distance": -0.018038146197795868,
          "encoder_gradient_dot_product": 0.0011047270381823182,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01172672864049673,
          "input_gradient_dot_product": -0.005479619838297367
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7000514136652616,
        "val_r": 0.3475733195475303,
        "n_iterations": 172,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00679611274972558,
          "right_subspace_overlap_bottom_k": -0.005937065929174423,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0015233473386615515,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0012474264949560165,
          "task_vector_cosine_similarity": 0.0016595146153122187,
          "task_vector_l2_distance": -0.003619971452280879,
          "task_vector_dot_product": -0.0013320611324161291,
          "weight_space_angle": -0.002174416556954384,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0011156618129462004,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0031381254084408283,
          "activation_l2_distance": -0.0014928552554920316,
          "activation_cosine_similarity": 0.006923635955899954,
          "activation_magnitude_ratio": -0.0033061360009014606,
          "activation_dot_product": 0.0028029230888932943,
          "encoder_gradient_cosine_similarity": 0.003511369926854968,
          "encoder_gradient_l2_distance": -0.01663525402545929,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0030393118504434824,
          "input_gradient_l2_distance": -0.007450274657458067,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7477814025903287,
        "val_r": 0.30367445539356297,
        "n_iterations": 390,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003220587968826294,
          "right_subspace_overlap_bottom_k": -0.005581643432378769,
          "interaction_matrix_overlap_top_k": -0.0010975683107972145,
          "interaction_matrix_overlap_bottom_k": -0.001751987379975617,
          "effective_rank": -0.001155761070549488,
          "effective_rank_mergeability_score": 0.0014504431746900082,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0013425133656710386,
          "layerwise_effective_rank_mergeability_score": 0.0014553675428032875,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.002216313499957323,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0016438813181594014,
          "right_subspace_overlap": 0.0051809451542794704,
          "activation_l2_distance": 0.0011379660572856665,
          "activation_cosine_similarity": 0.009228291921317577,
          "activation_magnitude_ratio": -0.0012883724411949515,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0010366030037403107,
          "encoder_gradient_l2_distance": -0.010172666050493717,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008675183169543743,
          "input_gradient_dot_product": -0.0017569898627698421
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6938580959412699,
        "val_r": 0.7043212314075438,
        "n_iterations": 222,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0012786410516127944,
          "right_subspace_overlap_bottom_k": -0.0035034161992371082,
          "interaction_matrix_overlap_top_k": -0.0015837126411497593,
          "interaction_matrix_overlap_bottom_k": 0.001765172346495092,
          "effective_rank": -0.001883053919300437,
          "effective_rank_mergeability_score": 0.0013651323970407248,
          "stable_rank": -0.0011614777613431215,
          "spectral_gap": 0.0011344450758770108,
          "singular_value_ratio": -0.0013207989977672696,
          "layerwise_effective_rank": -0.0017019128426909447,
          "layerwise_effective_rank_mergeability_score": 0.0014913998311385512,
          "task_vector_cosine_similarity": 0.0027351034805178642,
          "task_vector_l2_distance": -0.008962634950876236,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001160198706202209,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.002384900813922286,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0013440256007015705,
          "activation_cosine_similarity": -0.0018559497548267245,
          "activation_magnitude_ratio": -0.0025113809388130903,
          "activation_dot_product": -0.0038332203403115273,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03735797852277756,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.04122008755803108,
          "input_gradient_dot_product": -0.003994918428361416
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7445281900081,
        "val_r": 0.18662460953836524,
        "n_iterations": 336,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006351863034069538,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.0017060277750715613,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0012379365507513285,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0023220940493047237,
          "task_vector_dot_product": -0.0012786962324753404,
          "weight_space_angle": 0.0012027223128825426,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.00809512846171856,
          "activation_magnitude_ratio": -0.0030076720286160707,
          "activation_dot_product": 0.0027556123677641153,
          "encoder_gradient_cosine_similarity": 0.0010740343714132905,
          "encoder_gradient_l2_distance": -0.011272636242210865,
          "encoder_gradient_dot_product": 0.0013759947614744306,
          "input_gradient_cosine_similarity": -0.0010545694967731833,
          "input_gradient_l2_distance": -0.010413240641355515,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7193196148634391,
        "val_r": 0.7269676833640235,
        "n_iterations": 193,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0069041806273162365,
          "right_subspace_overlap_bottom_k": -0.01211527455598116,
          "interaction_matrix_overlap_top_k": -0.0029375525191426277,
          "interaction_matrix_overlap_bottom_k": 0.0033826425205916166,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0022828057408332825,
          "stable_rank": -0.0013878633035346866,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0012611030833795667,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0011086361482739449,
          "task_vector_cosine_similarity": -0.004908127710223198,
          "task_vector_l2_distance": -0.0023788828402757645,
          "task_vector_dot_product": -0.0048544742166996,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0017876101192086935,
          "right_subspace_overlap": 0.006671993061900139,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.005095062777400017,
          "activation_magnitude_ratio": -0.001706290990114212,
          "activation_dot_product": 0.005331417080014944,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.025983154773712158,
          "encoder_gradient_dot_product": 0.0020847967825829983,
          "input_gradient_cosine_similarity": 0.002179676666855812,
          "input_gradient_l2_distance": -0.019747115671634674,
          "input_gradient_dot_product": -0.001707881805486977
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6799764310852981,
        "val_r": 0.6902299819946306,
        "n_iterations": 371,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003484461922198534,
          "right_subspace_overlap_bottom_k": -0.0012703543761745095,
          "interaction_matrix_overlap_top_k": 0.001583591802045703,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0012171610724180937,
          "spectral_gap": -0.0011857720091938972,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0034941029734909534,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.002938436344265938,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0020507159642875195,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0067823040299117565,
          "activation_magnitude_ratio": -0.0024041070137172937,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0022900807671248913,
          "encoder_gradient_l2_distance": -0.00898075383156538,
          "encoder_gradient_dot_product": 0.0014265691861510277,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.007580230478197336,
          "input_gradient_dot_product": -0.006430169567465782
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6918910299495051,
        "val_r": 0.8174873576775264,
        "n_iterations": 196,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0035765215288847685,
          "right_subspace_overlap_bottom_k": -0.00514595303684473,
          "interaction_matrix_overlap_top_k": 0.00259309820830822,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010708445915952325,
          "task_vector_cosine_similarity": -0.0016587870195508003,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0030622752383351326,
          "weight_space_angle": -0.0026638733688741922,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0032850601710379124,
          "right_subspace_overlap": 0.0057960692793130875,
          "activation_l2_distance": 0.0012127060908824205,
          "activation_cosine_similarity": 0.007573112845420837,
          "activation_magnitude_ratio": -0.0026986622251570225,
          "activation_dot_product": 0.005990568082779646,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.01301355380564928,
          "encoder_gradient_dot_product": 0.0029994247015565634,
          "input_gradient_cosine_similarity": -0.0010608816519379616,
          "input_gradient_l2_distance": -0.007627448998391628,
          "input_gradient_dot_product": -0.003416722873225808
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7131918990910228,
        "val_r": 0.7602928224069363,
        "n_iterations": 229,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007285463623702526,
          "right_subspace_overlap_bottom_k": -0.010764535516500473,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0020739075262099504,
          "effective_rank": -0.00137255375739187,
          "effective_rank_mergeability_score": 0.0012108972296118736,
          "stable_rank": -0.0017082509584724903,
          "spectral_gap": 0.0013152729952707887,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0012005874887108803,
          "layerwise_effective_rank_mergeability_score": 0.0016788970679044724,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.007203814573585987,
          "task_vector_dot_product": -0.0018934332765638828,
          "weight_space_angle": 0.0010044934460893273,
          "task_vector_magnitude_ratio": -0.0015125605277717113,
          "singular_value_overlap": 0.003323872108012438,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0028109815903007984,
          "activation_l2_distance": -0.0019388552755117416,
          "activation_cosine_similarity": 0.012181789614260197,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.01060065720230341,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.02994215115904808,
          "encoder_gradient_dot_product": -0.0017253069672733545,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.02955150231719017,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7708659963260581,
        "val_r": 0.592085037019595,
        "n_iterations": 179,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0032670414075255394,
          "right_subspace_overlap_bottom_k": -0.004316915757954121,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010233053471893072,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0032553640194237232,
          "task_vector_dot_product": 0.001515815150924027,
          "weight_space_angle": 0.0032347054220736027,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0027554333209991455,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0014116273960098624,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0064491992816329,
          "activation_magnitude_ratio": -0.003111689817160368,
          "activation_dot_product": -0.0015807503368705511,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.01448154728859663,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005288081709295511,
          "input_gradient_dot_product": -0.0015081650344654918
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5455857302253044,
        "val_r": 0.4726432499224851,
        "n_iterations": 201,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00335569866001606,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0055658211931586266,
          "interaction_matrix_overlap_bottom_k": -0.003311408683657646,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0015578599413856864,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0018213354051113129,
          "layerwise_effective_rank": 0.001336290966719389,
          "layerwise_effective_rank_mergeability_score": -0.0010233742650598288,
          "task_vector_cosine_similarity": 0.0021887437906116247,
          "task_vector_l2_distance": 0.0012354664504528046,
          "task_vector_dot_product": -0.0010640054242685437,
          "weight_space_angle": -0.002476703841239214,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0021821341942995787,
          "subspace_overlap": 0.0010532417800277472,
          "right_subspace_overlap": 0.008825995028018951,
          "activation_l2_distance": 0.0011721453629434109,
          "activation_cosine_similarity": 0.007468619849532843,
          "activation_magnitude_ratio": -0.0010720170103013515,
          "activation_dot_product": 0.001404851209372282,
          "encoder_gradient_cosine_similarity": 0.001569579471834004,
          "encoder_gradient_l2_distance": -0.011827435344457626,
          "encoder_gradient_dot_product": 0.0026839652564376593,
          "input_gradient_cosine_similarity": -0.0028626464772969484,
          "input_gradient_l2_distance": -0.0057301209308207035,
          "input_gradient_dot_product": -0.0015687095001339912
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.70880387071522,
        "val_r": 0.6054197223259259,
        "n_iterations": 310,
        "n_nonzero_coefficients": 10,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.005379674956202507,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.003551453584805131,
          "right_subspace_overlap": 0.0025671774055808783,
          "activation_l2_distance": -0.003254314884543419,
          "activation_cosine_similarity": 0.006335408426821232,
          "activation_magnitude_ratio": -0.0016083703376352787,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.001407048781402409,
          "encoder_gradient_l2_distance": -0.016341913491487503,
          "encoder_gradient_dot_product": 0.0017864448018372059,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.016049081459641457,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5363578103008338,
        "val_r": 0.05767565927696462,
        "n_iterations": 298,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012629088014364243,
          "right_subspace_overlap_bottom_k": -0.004195877816528082,
          "interaction_matrix_overlap_top_k": 0.006825210060924292,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0012198486365377903,
          "effective_rank_mergeability_score": -0.0011083590798079967,
          "stable_rank": 0.0,
          "spectral_gap": -0.002073877491056919,
          "singular_value_ratio": 0.0018002804135903716,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.003961273469030857,
          "task_vector_l2_distance": 0.0012741864193230867,
          "task_vector_dot_product": 0.002435526344925165,
          "weight_space_angle": -0.0014387787086889148,
          "task_vector_magnitude_ratio": 0.0014559519477188587,
          "singular_value_overlap": 0.004275579005479813,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006926624104380608,
          "activation_l2_distance": 0.0030929800122976303,
          "activation_cosine_similarity": 0.007941313087940216,
          "activation_magnitude_ratio": 0.0028223046101629734,
          "activation_dot_product": 0.008697658777236938,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011129229329526424,
          "encoder_gradient_dot_product": -0.0022540760692209005,
          "input_gradient_cosine_similarity": 0.001599338254891336,
          "input_gradient_l2_distance": -0.005997458938509226,
          "input_gradient_dot_product": -0.003991913050413132
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7336364484556026,
        "val_r": 0.7259923203030438,
        "n_iterations": 193,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0031828908249735832,
          "right_subspace_overlap_bottom_k": -0.00858792569488287,
          "interaction_matrix_overlap_top_k": -0.0010084602981805801,
          "interaction_matrix_overlap_bottom_k": -0.008884900249540806,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.001081042573787272,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.005150286015123129,
          "task_vector_dot_product": 0.001261929515749216,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.005039219278842211,
          "subspace_overlap": -0.0012368771713227034,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0041211433708667755,
          "activation_cosine_similarity": 0.003107630182057619,
          "activation_magnitude_ratio": -0.006246805656701326,
          "activation_dot_product": 0.0128791444003582,
          "encoder_gradient_cosine_similarity": 0.0016364981420338154,
          "encoder_gradient_l2_distance": -0.026796510443091393,
          "encoder_gradient_dot_product": 0.006798870861530304,
          "input_gradient_cosine_similarity": 0.002183347474783659,
          "input_gradient_l2_distance": -0.02729879505932331,
          "input_gradient_dot_product": -0.004371557384729385
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_r": 0.4076342900004527,
      "train_p": 2.988332951371494e-129,
      "val_r": 0.02161719615394042,
      "val_p": 0.6835425789417914
    },
    "per_fold_stats": {
      "train_r_mean": 0.5605880627094761,
      "train_r_std": 0.06690443177279888,
      "val_r_mean": 0.48507219615164,
      "val_r_std": 0.1431777763376688,
      "n_nonzero_mean": 17.2,
      "n_nonzero_std": 3.4727510708370675
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0024517152924090624,
      "right_subspace_overlap_bottom_k": 0.0011023199185729027,
      "interaction_matrix_overlap_top_k": 0.0005715301958844066,
      "interaction_matrix_overlap_bottom_k": 0.00665674451738596,
      "effective_rank": -0.0003917944268323481,
      "effective_rank_mergeability_score": 0.0006482239114120603,
      "stable_rank": -0.000497723463922739,
      "spectral_gap": 0.0009271434391848743,
      "singular_value_ratio": -0.0005744005320593715,
      "layerwise_effective_rank": -0.0003914072585757822,
      "layerwise_effective_rank_mergeability_score": 0.00028989012935198843,
      "task_vector_cosine_similarity": 6.849004421383142e-07,
      "task_vector_l2_distance": -0.010161987505853176,
      "task_vector_dot_product": 0.0001600960677023977,
      "weight_space_angle": 0.0002686892985366285,
      "task_vector_magnitude_ratio": -0.0011814769823104143,
      "singular_value_overlap": -0.0070360624231398106,
      "subspace_overlap": 0.0006428906926885247,
      "right_subspace_overlap": 0.0022568649146705866,
      "activation_l2_distance": -0.0019223010167479515,
      "activation_cosine_similarity": 0.0023802744690328836,
      "activation_magnitude_ratio": -0.0020703317131847143,
      "activation_dot_product": 0.0019410375971347094,
      "encoder_gradient_cosine_similarity": 0.000936667260248214,
      "encoder_gradient_l2_distance": -0.01443017739802599,
      "encoder_gradient_dot_product": 0.0009406910394318402,
      "input_gradient_cosine_similarity": 0.00030315364710986614,
      "input_gradient_l2_distance": -0.01589168794453144,
      "input_gradient_dot_product": -0.0022949837148189545
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.003450439078733325,
      "right_subspace_overlap_bottom_k": 0.003987317439168692,
      "interaction_matrix_overlap_top_k": 0.0013945965329185128,
      "interaction_matrix_overlap_bottom_k": 0.003686317475512624,
      "effective_rank": 0.0007770971860736609,
      "effective_rank_mergeability_score": 0.001033373293466866,
      "stable_rank": 0.0007990191224962473,
      "spectral_gap": 0.001166299101896584,
      "singular_value_ratio": 0.000983147881925106,
      "layerwise_effective_rank": 0.0007139832014217973,
      "layerwise_effective_rank_mergeability_score": 0.0006005637696944177,
      "task_vector_cosine_similarity": 0.0018047416815534234,
      "task_vector_l2_distance": 0.00466288672760129,
      "task_vector_dot_product": 0.001785371219739318,
      "weight_space_angle": 0.0017509470926597714,
      "task_vector_magnitude_ratio": 0.0009245088440366089,
      "singular_value_overlap": 0.0033157519064843655,
      "subspace_overlap": 0.0017471250612288713,
      "right_subspace_overlap": 0.0024133932311087847,
      "activation_l2_distance": 0.00220052944496274,
      "activation_cosine_similarity": 0.00226463726721704,
      "activation_magnitude_ratio": 0.0017515908693894744,
      "activation_dot_product": 0.003333326196298003,
      "encoder_gradient_cosine_similarity": 0.0014453900512307882,
      "encoder_gradient_l2_distance": 0.005029983352869749,
      "encoder_gradient_dot_product": 0.00113813322968781,
      "input_gradient_cosine_similarity": 0.0010957496706396341,
      "input_gradient_l2_distance": 0.006893472280353308,
      "input_gradient_dot_product": 0.0019585806876420975
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.55,
      "right_subspace_overlap_bottom_k": 0.7,
      "interaction_matrix_overlap_top_k": 0.35,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.35,
      "effective_rank_mergeability_score": 0.35,
      "stable_rank": 0.3,
      "spectral_gap": 0.55,
      "singular_value_ratio": 0.4,
      "layerwise_effective_rank": 0.25,
      "layerwise_effective_rank_mergeability_score": 0.2,
      "task_vector_cosine_similarity": 0.3,
      "task_vector_l2_distance": 0.9,
      "task_vector_dot_product": 0.5,
      "weight_space_angle": 0.5,
      "task_vector_magnitude_ratio": 0.7,
      "singular_value_overlap": 0.95,
      "subspace_overlap": 0.55,
      "right_subspace_overlap": 0.8,
      "activation_l2_distance": 0.7,
      "activation_cosine_similarity": 0.8,
      "activation_magnitude_ratio": 0.75,
      "activation_dot_product": 0.6,
      "encoder_gradient_cosine_similarity": 0.6,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.6,
      "input_gradient_cosine_similarity": 0.3,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.65
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5873199214786576,
        "val_r": 0.6469197090989678,
        "n_iterations": 340,
        "n_nonzero_coefficients": 10,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.013768425211310387,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.011165727861225605,
          "task_vector_dot_product": 0.0017798678018152714,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.007848395965993404,
          "subspace_overlap": 0.002525290008634329,
          "right_subspace_overlap": 0.0018686328548938036,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0027649058029055595,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011905275285243988,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.011340068653225899,
          "input_gradient_dot_product": -0.004528702702373266
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5164957390027166,
        "val_r": 0.5212738097592381,
        "n_iterations": 384,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007465125061571598,
          "right_subspace_overlap_bottom_k": -0.002267077099531889,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.00591712212190032,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.002855525352060795,
          "singular_value_ratio": -0.0010507404804229736,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0017936022486537695,
          "task_vector_l2_distance": -0.00986732728779316,
          "task_vector_dot_product": -0.004076141864061356,
          "weight_space_angle": 0.0022398349829018116,
          "task_vector_magnitude_ratio": -0.0017085947329178452,
          "singular_value_overlap": -0.011377790942788124,
          "subspace_overlap": -0.003499262034893036,
          "right_subspace_overlap": 0.0022040512412786484,
          "activation_l2_distance": -0.003984573297202587,
          "activation_cosine_similarity": 0.006113119889050722,
          "activation_magnitude_ratio": -0.00485537713393569,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.0011986595345661044,
          "encoder_gradient_l2_distance": -0.02789941243827343,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0338900201022625,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.564702564886449,
        "val_r": 0.5404793484185039,
        "n_iterations": 293,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0036848075687885284,
          "right_subspace_overlap_bottom_k": 0.002193686319515109,
          "interaction_matrix_overlap_top_k": 0.0026576484087854624,
          "interaction_matrix_overlap_bottom_k": 0.006104892585426569,
          "effective_rank": -0.0012347509618848562,
          "effective_rank_mergeability_score": 0.001390696270391345,
          "stable_rank": -0.0022632889449596405,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0014813675079494715,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010040554217994213,
          "task_vector_dot_product": -0.0010371205862611532,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0019250897457823157,
          "singular_value_overlap": -0.009513987228274345,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.001571783795952797,
          "activation_l2_distance": -0.003888342995196581,
          "activation_cosine_similarity": 0.001911381259560585,
          "activation_magnitude_ratio": -0.005120354704558849,
          "activation_dot_product": 0.0016503814840689301,
          "encoder_gradient_cosine_similarity": 0.0017462018877267838,
          "encoder_gradient_l2_distance": -0.011465143412351608,
          "encoder_gradient_dot_product": 0.0017742780037224293,
          "input_gradient_cosine_similarity": 0.002087798435240984,
          "input_gradient_l2_distance": -0.013237693347036839,
          "input_gradient_dot_product": -0.0031177345663309097
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5830747535856372,
        "val_r": 0.4988095791707083,
        "n_iterations": 266,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006084047723561525,
          "right_subspace_overlap_bottom_k": 0.004276257008314133,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.00792190432548523,
          "effective_rank": -0.0012014805106446147,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0014958708779886365,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0011044745333492756,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012623465619981289,
          "task_vector_dot_product": 0.0014510734472423792,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001044062664732337,
          "singular_value_overlap": -0.009201682172715664,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.002054906217381358,
          "activation_l2_distance": 0.0011141751892864704,
          "activation_cosine_similarity": 0.002508314559236169,
          "activation_magnitude_ratio": -0.0034801550209522247,
          "activation_dot_product": 0.002027785172685981,
          "encoder_gradient_cosine_similarity": 0.0016397279687225819,
          "encoder_gradient_l2_distance": -0.014073065482079983,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.018065812066197395,
          "input_gradient_dot_product": -0.004868708085268736
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5933284082436407,
        "val_r": 0.48976277040506294,
        "n_iterations": 320,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0019200219539925456,
          "right_subspace_overlap_bottom_k": 0.006012754514813423,
          "interaction_matrix_overlap_top_k": -0.001369044533930719,
          "interaction_matrix_overlap_bottom_k": 0.014687025919556618,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.020057756453752518,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.001723847002722323,
          "task_vector_magnitude_ratio": -0.0016636487562209368,
          "singular_value_overlap": -0.013547364622354507,
          "subspace_overlap": -0.0014261328615248203,
          "right_subspace_overlap": -0.002058687387034297,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.00554652139544487,
          "activation_dot_product": 0.0014314533909782767,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011591996066272259,
          "encoder_gradient_dot_product": 0.002637523226439953,
          "input_gradient_cosine_similarity": 0.0029455730691552162,
          "input_gradient_l2_distance": -0.0193453598767519,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5849186696456639,
        "val_r": 0.7238606087084734,
        "n_iterations": 246,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0028339065611362457,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.009383495897054672,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0013326520565897226,
          "singular_value_ratio": -0.0016376555431634188,
          "layerwise_effective_rank": -0.0014425343833863735,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.014650802128016949,
          "task_vector_dot_product": 0.0019338539568707347,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001100885565392673,
          "singular_value_overlap": -0.010236764326691628,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0030682003125548363,
          "activation_l2_distance": -0.005278217606246471,
          "activation_cosine_similarity": 0.0019160587107762694,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.016366202384233475,
          "encoder_gradient_dot_product": 0.002147065242752433,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.016764679923653603,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.564865782564603,
        "val_r": 0.286499298896675,
        "n_iterations": 301,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.002277478575706482,
          "interaction_matrix_overlap_bottom_k": 0.0072657265700399876,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0012388823088258505,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0017248571384698153,
          "task_vector_l2_distance": -0.006494789384305477,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0014637152198702097,
          "singular_value_overlap": -0.002996477298438549,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0011333914007991552,
          "activation_l2_distance": -0.0013374215923249722,
          "activation_cosine_similarity": 0.0026028817519545555,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0011137713445350528,
          "encoder_gradient_l2_distance": -0.010992911644279957,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.007690551690757275,
          "input_gradient_dot_product": -0.001456861151382327
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4543204630275329,
        "val_r": 0.29625210436222593,
        "n_iterations": 320,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.006601434201002121,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.006429703906178474,
          "effective_rank": 0.001144637819379568,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0010338732972741127,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012374759651720524,
          "task_vector_dot_product": 0.001852322369813919,
          "weight_space_angle": 0.0010183167178183794,
          "task_vector_magnitude_ratio": -0.0011693473206833005,
          "singular_value_overlap": -0.004788472317159176,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0015948107466101646,
          "activation_cosine_similarity": -0.0016025581862777472,
          "activation_magnitude_ratio": -0.0023082029074430466,
          "activation_dot_product": 0.003692477708682418,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.012560774572193623,
          "encoder_gradient_dot_product": 0.0013028817484155297,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005592679139226675,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5733315384742722,
        "val_r": 0.5542828075704419,
        "n_iterations": 248,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0042280880734324455,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.007078502792865038,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0022616686765104532,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012212523259222507,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010921789798885584,
          "task_vector_magnitude_ratio": -0.0010941758519038558,
          "singular_value_overlap": -0.0057786074467003345,
          "subspace_overlap": 0.0012766649015247822,
          "right_subspace_overlap": 0.001687570009380579,
          "activation_l2_distance": -0.002693211892619729,
          "activation_cosine_similarity": 0.0023438623175024986,
          "activation_magnitude_ratio": -0.0016914841253310442,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011467237025499344,
          "encoder_gradient_dot_product": 0.0017061287071555853,
          "input_gradient_cosine_similarity": 0.001667299889959395,
          "input_gradient_l2_distance": -0.014964237809181213,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5563973412857499,
        "val_r": 0.4481628938128986,
        "n_iterations": 281,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0027557010762393475,
          "right_subspace_overlap_bottom_k": 0.0010383558692410588,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.00681322580203414,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0010617355583235621,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010676106438040733,
          "task_vector_dot_product": -0.002779340837150812,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0014437673380598426,
          "singular_value_overlap": -0.009828702546656132,
          "subspace_overlap": 0.0013421783223748207,
          "right_subspace_overlap": 0.0035419510677456856,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0010780820157378912,
          "activation_magnitude_ratio": -0.0013866735389456153,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.02108681946992874,
          "encoder_gradient_dot_product": 0.0010548296850174665,
          "input_gradient_cosine_similarity": 0.0010276816319674253,
          "input_gradient_l2_distance": -0.026212627068161964,
          "input_gradient_dot_product": -0.0016966145485639572
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.46574721809474734,
        "val_r": 0.2356411157044241,
        "n_iterations": 182,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0028347643092274666,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.006359940394759178,
          "effective_rank": -0.0019187191501259804,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0022496175952255726,
          "singular_value_ratio": -0.001438220962882042,
          "layerwise_effective_rank": -0.0012421014253050089,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.00793678592890501,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010529900901019573,
          "task_vector_magnitude_ratio": -0.001514430157840252,
          "singular_value_overlap": -0.0031352443620562553,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0014916106592863798,
          "activation_l2_distance": -0.003680958179756999,
          "activation_cosine_similarity": 0.0014167793560773134,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0017778455512598157,
          "encoder_gradient_cosine_similarity": -0.0011461273534223437,
          "encoder_gradient_l2_distance": -0.008166652172803879,
          "encoder_gradient_dot_product": 0.0020675905980169773,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005293450318276882,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5502957500580045,
        "val_r": 0.5046937481153649,
        "n_iterations": 383,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0027888319455087185,
          "right_subspace_overlap_bottom_k": -0.0015926191117614508,
          "interaction_matrix_overlap_top_k": -0.0010699727572500706,
          "interaction_matrix_overlap_bottom_k": 0.0064287325367331505,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0014674321282655,
          "spectral_gap": 0.0021199905313551426,
          "singular_value_ratio": -0.0014083784772083163,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0020560859702527523,
          "task_vector_l2_distance": -0.006613853387534618,
          "task_vector_dot_product": -0.002286122180521488,
          "weight_space_angle": 0.003128283191472292,
          "task_vector_magnitude_ratio": -0.0015112558612599969,
          "singular_value_overlap": -0.006815006956458092,
          "subspace_overlap": 0.004512857645750046,
          "right_subspace_overlap": 0.001353265717625618,
          "activation_l2_distance": -0.0013487073592841625,
          "activation_cosine_similarity": 0.003192978911101818,
          "activation_magnitude_ratio": -0.0011467286385595798,
          "activation_dot_product": 0.0014781320933252573,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014505538158118725,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.014006896875798702,
          "input_gradient_dot_product": -0.0033537759445607662
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.45220454570206337,
        "val_r": 0.3779973450048288,
        "n_iterations": 234,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0014720647595822811,
          "interaction_matrix_overlap_bottom_k": 0.003175221849232912,
          "effective_rank": -0.001534485025331378,
          "effective_rank_mergeability_score": 0.0038375570438802242,
          "stable_rank": 0.0,
          "spectral_gap": 0.0019733719527721405,
          "singular_value_ratio": -0.002880288753658533,
          "layerwise_effective_rank": -0.0022758152335882187,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.005375674460083246,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0024997477885335684,
          "weight_space_angle": -0.0058027044869959354,
          "task_vector_magnitude_ratio": -0.0033239852637052536,
          "singular_value_overlap": -0.007441715802997351,
          "subspace_overlap": 0.002215270884335041,
          "right_subspace_overlap": 0.003722522174939513,
          "activation_l2_distance": -0.005921541713178158,
          "activation_cosine_similarity": 0.0070512136444449425,
          "activation_magnitude_ratio": -0.0018164190696552396,
          "activation_dot_product": 0.004188144579529762,
          "encoder_gradient_cosine_similarity": 0.004165479447692633,
          "encoder_gradient_l2_distance": -0.017367620021104813,
          "encoder_gradient_dot_product": 0.0024083489552140236,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.018774284049868584,
          "input_gradient_dot_product": -0.005179013591259718
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5763953381915536,
        "val_r": 0.7279711791167848,
        "n_iterations": 292,
        "n_nonzero_coefficients": 11,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0028394286055117846,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.007163072936236858,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012238183990120888,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.001018791226670146,
          "layerwise_effective_rank_mergeability_score": 0.0012049797223880887,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01023052353411913,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.005628833081573248,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.003900852520018816,
          "encoder_gradient_cosine_similarity": 0.002098141238093376,
          "encoder_gradient_l2_distance": -0.011542834341526031,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.011953148059546947,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5124438908853232,
        "val_r": 0.5937393119347972,
        "n_iterations": 250,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0038059097714722157,
          "right_subspace_overlap_bottom_k": -0.0011719728354364634,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.005063754040747881,
          "effective_rank": -0.0013785870978608727,
          "effective_rank_mergeability_score": 0.0019493956351652741,
          "stable_rank": -0.0022022516932338476,
          "spectral_gap": 0.0020132786594331264,
          "singular_value_ratio": -0.0016690475167706609,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.013565653003752232,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.002406755927950144,
          "singular_value_overlap": -0.0076529295183718204,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0028076551388949156,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.00471105333417654,
          "activation_magnitude_ratio": -0.0019074635347351432,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013818087056279182,
          "encoder_gradient_dot_product": 0.0026323425117880106,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01746547222137451,
          "input_gradient_dot_product": -0.004698914475739002
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5457654205902205,
        "val_r": 0.33988524412527676,
        "n_iterations": 267,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011357590556144714,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.004005898255854845,
          "interaction_matrix_overlap_bottom_k": 0.0017089378088712692,
          "effective_rank": -0.0017125033773481846,
          "effective_rank_mergeability_score": 0.001278341980651021,
          "stable_rank": 0.0,
          "spectral_gap": 0.0018580014584586024,
          "singular_value_ratio": -0.00243755173869431,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01010213978588581,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0022598279174417257,
          "singular_value_overlap": -0.0030868700705468655,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006810326594859362,
          "activation_l2_distance": -0.0016392710385844111,
          "activation_cosine_similarity": 0.004275770392268896,
          "activation_magnitude_ratio": -0.0010565274860709906,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.004173284862190485,
          "encoder_gradient_l2_distance": -0.013950249180197716,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01194679830223322,
          "input_gradient_dot_product": -0.004802321549504995
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.557201682215107,
        "val_r": 0.3590863912756767,
        "n_iterations": 211,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.001235250849276781,
          "right_subspace_overlap_bottom_k": 0.005669973324984312,
          "interaction_matrix_overlap_top_k": 0.0034565303940325975,
          "interaction_matrix_overlap_bottom_k": 0.001392120961099863,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.011323951184749603,
          "task_vector_dot_product": 0.003863781224936247,
          "weight_space_angle": -0.0019522388465702534,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008655470795929432,
          "subspace_overlap": 0.001963779330253601,
          "right_subspace_overlap": 0.00544344587251544,
          "activation_l2_distance": -0.002442318247631192,
          "activation_cosine_similarity": 0.001610838109627366,
          "activation_magnitude_ratio": -0.0036900269333273172,
          "activation_dot_product": 0.0027053379453718662,
          "encoder_gradient_cosine_similarity": 0.0023907003924250603,
          "encoder_gradient_l2_distance": -0.011878348886966705,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.013555453158915043,
          "input_gradient_dot_product": -0.004454921931028366
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5828547140466014,
        "val_r": 0.3989728569330687,
        "n_iterations": 367,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.010127485729753971,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.001703982474282384,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.00689023407176137,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.003411875804886222,
          "subspace_overlap": 0.0015527609502896667,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0011071815388277173,
          "activation_dot_product": -0.0014217328280210495,
          "encoder_gradient_cosine_similarity": 0.0011261459439992905,
          "encoder_gradient_l2_distance": -0.005775080528110266,
          "encoder_gradient_dot_product": 0.001344044809229672,
          "input_gradient_cosine_similarity": 0.0011158839333802462,
          "input_gradient_l2_distance": -0.011656379327178001,
          "input_gradient_dot_product": -0.002736027119681239
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7753170930563794,
        "val_r": 0.7094007403953708,
        "n_iterations": 197,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008937631733715534,
          "right_subspace_overlap_bottom_k": -0.012247536331415176,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.001444084569811821,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.001093695405870676,
          "spectral_gap": -0.0013174507766962051,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0018489026697352529,
          "layerwise_effective_rank_mergeability_score": 0.0020069805905222893,
          "task_vector_cosine_similarity": -0.004826750140637159,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0013016783632338047,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0011288031237199903,
          "right_subspace_overlap": 0.008436672389507294,
          "activation_l2_distance": -0.004564887378364801,
          "activation_cosine_similarity": 0.002239333000034094,
          "activation_magnitude_ratio": -0.0035286126658320427,
          "activation_dot_product": 0.01487582828849554,
          "encoder_gradient_cosine_similarity": 0.001352954306639731,
          "encoder_gradient_l2_distance": -0.022100983187556267,
          "encoder_gradient_dot_product": 0.0013398559531196952,
          "input_gradient_cosine_similarity": -0.0027811636682599783,
          "input_gradient_l2_distance": -0.020100565627217293,
          "input_gradient_dot_product": -0.002661824692040682
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6147804191546016,
        "val_r": 0.447753060224011,
        "n_iterations": 341,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.003636380657553673,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.007789672818034887,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.001007936429232359,
          "stable_rank": 0.0,
          "spectral_gap": 0.002900276333093643,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.001589604769833386,
          "task_vector_l2_distance": -0.016412781551480293,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0015716003254055977,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.009775055572390556,
          "subspace_overlap": 0.0035232086665928364,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.004375554155558348,
          "activation_cosine_similarity": 0.006236382760107517,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0025142482481896877,
          "encoder_gradient_cosine_similarity": 0.001271725632250309,
          "encoder_gradient_l2_distance": -0.020089320838451385,
          "encoder_gradient_dot_product": -0.0016010728431865573,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.025977591052651405,
          "input_gradient_dot_product": -0.0023442537058144808
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_r": 0.5290633709942661,
      "train_p": 6.587689925154428e-232,
      "val_r": 0.4294298914784088,
      "val_p": 1.6974690095593796e-17
    },
    "per_fold_stats": {
      "train_r_mean": 0.7316460138260129,
      "train_r_std": 0.05502860076223991,
      "val_r_mean": 0.650375420419637,
      "val_r_std": 0.14850503398965997,
      "n_nonzero_mean": 15.85,
      "n_nonzero_std": 3.9404948927767944
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.005235358141362667,
      "right_subspace_overlap_bottom_k": -0.010832762345671654,
      "interaction_matrix_overlap_top_k": 0.0016651041805744171,
      "interaction_matrix_overlap_bottom_k": -0.0008830794831737876,
      "effective_rank": 0.0003325382713228464,
      "effective_rank_mergeability_score": -0.0001228251203428954,
      "stable_rank": 6.782588025089353e-05,
      "spectral_gap": -0.0005311515415087342,
      "singular_value_ratio": 0.0003939929883927107,
      "layerwise_effective_rank": -0.00048267710371874273,
      "layerwise_effective_rank_mergeability_score": 0.0003646916593424976,
      "task_vector_cosine_similarity": 7.832822302589193e-05,
      "task_vector_l2_distance": -0.0005659348680637777,
      "task_vector_dot_product": 0.0007299001445062459,
      "weight_space_angle": -0.000987150939181447,
      "task_vector_magnitude_ratio": 0.00042212969856336713,
      "singular_value_overlap": 0.004108462482690811,
      "subspace_overlap": 0.00041928552673198283,
      "right_subspace_overlap": 0.005432952661067247,
      "activation_l2_distance": -0.0009091203100979328,
      "activation_cosine_similarity": 0.0077171288430690765,
      "activation_magnitude_ratio": -0.0011999184498563409,
      "activation_dot_product": 0.0035313882399350405,
      "encoder_gradient_cosine_similarity": 0.0014940901892259717,
      "encoder_gradient_l2_distance": -0.015350237488746643,
      "encoder_gradient_dot_product": 0.0003060023591388017,
      "input_gradient_cosine_similarity": 0.00032560410909354687,
      "input_gradient_l2_distance": -0.010015105828642845,
      "input_gradient_dot_product": -0.0013603048864752054
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.0025316071696579456,
      "right_subspace_overlap_bottom_k": 0.0025025370996445417,
      "interaction_matrix_overlap_top_k": 0.002434283262118697,
      "interaction_matrix_overlap_bottom_k": 0.002186831785365939,
      "effective_rank": 0.0007700594724155962,
      "effective_rank_mergeability_score": 0.000755267683416605,
      "stable_rank": 0.0006573242135345936,
      "spectral_gap": 0.0010597172658890486,
      "singular_value_ratio": 0.0010648672468960285,
      "layerwise_effective_rank": 0.0012403368018567562,
      "layerwise_effective_rank_mergeability_score": 0.0006352490745484829,
      "task_vector_cosine_similarity": 0.00154915452003479,
      "task_vector_l2_distance": 0.0014877647627145052,
      "task_vector_dot_product": 0.002485217759385705,
      "weight_space_angle": 0.002037431811913848,
      "task_vector_magnitude_ratio": 0.0010192285990342498,
      "singular_value_overlap": 0.0018658811459317803,
      "subspace_overlap": 0.0012871354119852185,
      "right_subspace_overlap": 0.002553565427660942,
      "activation_l2_distance": 0.001669451710768044,
      "activation_cosine_similarity": 0.0034852251410484314,
      "activation_magnitude_ratio": 0.0014418908394873142,
      "activation_dot_product": 0.004725202452391386,
      "encoder_gradient_cosine_similarity": 0.0017557725077494979,
      "encoder_gradient_l2_distance": 0.004913958255201578,
      "encoder_gradient_dot_product": 0.0012090642703697085,
      "input_gradient_cosine_similarity": 0.0012937994906678796,
      "input_gradient_l2_distance": 0.005296805873513222,
      "input_gradient_dot_product": 0.0018615596927702427
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.9,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.4,
      "interaction_matrix_overlap_bottom_k": 0.5,
      "effective_rank": 0.2,
      "effective_rank_mergeability_score": 0.15,
      "stable_rank": 0.15,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.4,
      "layerwise_effective_rank": 0.4,
      "layerwise_effective_rank_mergeability_score": 0.25,
      "task_vector_cosine_similarity": 0.45,
      "task_vector_l2_distance": 0.4,
      "task_vector_dot_product": 0.55,
      "weight_space_angle": 0.6,
      "task_vector_magnitude_ratio": 0.2,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.35,
      "right_subspace_overlap": 0.95,
      "activation_l2_distance": 0.55,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.6,
      "activation_dot_product": 0.7,
      "encoder_gradient_cosine_similarity": 0.6,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.45,
      "input_gradient_cosine_similarity": 0.35,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.4
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7460757587703115,
        "val_r": 0.48473623878417865,
        "n_iterations": 227,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004939467180520296,
          "right_subspace_overlap_bottom_k": -0.007220138795673847,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0025594111066311598,
          "task_vector_dot_product": -0.002209023805335164,
          "weight_space_angle": -0.0025507966056466103,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.00348083907738328,
          "subspace_overlap": 0.003922568634152412,
          "right_subspace_overlap": 0.0050598266534507275,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01447668019682169,
          "activation_magnitude_ratio": -0.002844018628820777,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0020093382336199284,
          "encoder_gradient_l2_distance": -0.022952958941459656,
          "encoder_gradient_dot_product": -0.00286259688436985,
          "input_gradient_cosine_similarity": -0.0028334783855825663,
          "input_gradient_l2_distance": -0.013292110525071621,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7431747476565332,
        "val_r": 0.7804530490476721,
        "n_iterations": 180,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0035942397080361843,
          "right_subspace_overlap_bottom_k": -0.00939579401165247,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.001015659305267036,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0011777296895161271,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0010044265072792768,
          "weight_space_angle": -0.0012046193005517125,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.003189152805134654,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008194162510335445,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.008832637220621109,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.015373100526630878,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.006413559895008802,
          "input_gradient_dot_product": -0.0033504543825984
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7604816933891827,
        "val_r": 0.8110674944810811,
        "n_iterations": 218,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006120740901678801,
          "right_subspace_overlap_bottom_k": -0.01195450872182846,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0010650078766047955,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0020519935060292482,
          "layerwise_effective_rank_mergeability_score": 0.0016661378322169185,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0020138034597039223,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0017866939306259155,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.00539473257958889,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0045649269595742226,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.007271338254213333,
          "activation_magnitude_ratio": -0.001256838208064437,
          "activation_dot_product": 0.006512367632240057,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.016992513090372086,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.013374474830925465,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.752049902992376,
        "val_r": 0.7202556824916212,
        "n_iterations": 304,
        "n_nonzero_coefficients": 10,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0054786959663033485,
          "right_subspace_overlap_bottom_k": -0.010535621084272861,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.004943337291479111,
          "subspace_overlap": -0.0020071298349648714,
          "right_subspace_overlap": 0.005949452985078096,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.007012778427451849,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0020752977579832077,
          "encoder_gradient_cosine_similarity": 0.0013209140161052346,
          "encoder_gradient_l2_distance": -0.01645980402827263,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.00861264392733574,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7349801363184286,
        "val_r": 0.7372228405363558,
        "n_iterations": 184,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009308171458542347,
          "right_subspace_overlap_bottom_k": -0.014870303682982922,
          "interaction_matrix_overlap_top_k": 0.0054614427499473095,
          "interaction_matrix_overlap_bottom_k": -0.0017879446968436241,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0012369519099593163,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.002450081519782543,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0017862844979390502,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.007453626021742821,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008754932321608067,
          "activation_l2_distance": -0.001295741181820631,
          "activation_cosine_similarity": 0.015863271430134773,
          "activation_magnitude_ratio": 0.0011747080134227872,
          "activation_dot_product": 0.0047609745524823666,
          "encoder_gradient_cosine_similarity": -0.0014121863059699535,
          "encoder_gradient_l2_distance": -0.028998691588640213,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002215879037976265,
          "input_gradient_l2_distance": -0.02459561452269554,
          "input_gradient_dot_product": -0.0023965928703546524
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7292148630851963,
        "val_r": 0.7314106386995965,
        "n_iterations": 297,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0045795077458024025,
          "right_subspace_overlap_bottom_k": -0.005825150292366743,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.002606799826025963,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.001008512219414115,
          "singular_value_ratio": -0.001213743700645864,
          "layerwise_effective_rank": -0.0016066060634329915,
          "layerwise_effective_rank_mergeability_score": 0.0013138847425580025,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0012097735889256,
          "task_vector_dot_product": -0.0019158790819346905,
          "weight_space_angle": -0.0022879389580339193,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0015955627895891666,
          "subspace_overlap": 0.0017552158096805215,
          "right_subspace_overlap": 0.001700956141576171,
          "activation_l2_distance": -0.0027789354790002108,
          "activation_cosine_similarity": 0.005284746177494526,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.00309855118393898,
          "encoder_gradient_cosine_similarity": 0.002138867974281311,
          "encoder_gradient_l2_distance": -0.009617635048925877,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.006023216526955366,
          "input_gradient_dot_product": -0.0024902168661355972
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7590039882679394,
        "val_r": 0.6341496567882572,
        "n_iterations": 321,
        "n_nonzero_coefficients": 8,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0060069365426898,
          "right_subspace_overlap_bottom_k": -0.013125593774020672,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0010762521997094154,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0021653559524565935,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.002732814522460103,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.009675728157162666,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014667442068457603,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005394076928496361,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6753080392378696,
        "val_r": 0.3939443361983645,
        "n_iterations": 173,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007171315606683493,
          "right_subspace_overlap_bottom_k": -0.008806966245174408,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0010602069087326527,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0010389171075075865,
          "stable_rank": 0.0,
          "spectral_gap": -0.001227633561939001,
          "singular_value_ratio": 0.001570333493873477,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0019516728352755308,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0019786013290286064,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.001015920890495181,
          "singular_value_overlap": 0.003128973999992013,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0059214564971625805,
          "activation_l2_distance": -0.002596492413431406,
          "activation_cosine_similarity": 0.006218931172043085,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.003019528230652213,
          "encoder_gradient_l2_distance": -0.014379989355802536,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.0011963710421696305,
          "input_gradient_l2_distance": -0.00852806307375431,
          "input_gradient_dot_product": -0.0023159547708928585
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.660273236056212,
        "val_r": 0.6455597208080806,
        "n_iterations": 216,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006770221516489983,
          "right_subspace_overlap_bottom_k": -0.012858601287007332,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.002035801764577627,
          "singular_value_ratio": 0.0021048691123723984,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0029965818393975496,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0017030219314619899,
          "singular_value_overlap": 0.0017089927569031715,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005365757271647453,
          "activation_l2_distance": 0.0017383540980517864,
          "activation_cosine_similarity": 0.006749924272298813,
          "activation_magnitude_ratio": -0.0027326056733727455,
          "activation_dot_product": 0.0037920381873846054,
          "encoder_gradient_cosine_similarity": 0.004246370401233435,
          "encoder_gradient_l2_distance": -0.012962661683559418,
          "encoder_gradient_dot_product": 0.002622943837195635,
          "input_gradient_cosine_similarity": 0.0026017569471150637,
          "input_gradient_l2_distance": -0.00827745534479618,
          "input_gradient_dot_product": -0.00621039979159832
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7552335115331923,
        "val_r": 0.557853500871393,
        "n_iterations": 287,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004682696424424648,
          "right_subspace_overlap_bottom_k": -0.01159114483743906,
          "interaction_matrix_overlap_top_k": 0.0011889422312378883,
          "interaction_matrix_overlap_bottom_k": 0.0010879866313189268,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.001543678343296051,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.003138749860227108,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004656417295336723,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.0013633206253871322,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0029800934717059135,
          "encoder_gradient_cosine_similarity": 0.0025913347490131855,
          "encoder_gradient_l2_distance": -0.00933835282921791,
          "encoder_gradient_dot_product": 0.002144918777048588,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0055945697240531445,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.756051162257753,
        "val_r": 0.26695617854928194,
        "n_iterations": 350,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004557818174362183,
          "right_subspace_overlap_bottom_k": -0.009406044147908688,
          "interaction_matrix_overlap_top_k": 0.003145844442769885,
          "interaction_matrix_overlap_bottom_k": -0.0011672705877572298,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.00141719460953027,
          "layerwise_effective_rank": 0.0014049762394279242,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0011936649680137634,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0012890321668237448,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005993725266307592,
          "subspace_overlap": 0.0010023625800386071,
          "right_subspace_overlap": 0.006631241180002689,
          "activation_l2_distance": -0.003064910415560007,
          "activation_cosine_similarity": 0.008076783269643784,
          "activation_magnitude_ratio": -0.0026194611564278603,
          "activation_dot_product": 0.0052791316993534565,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.012232553213834763,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01111050695180893,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7576353308911983,
        "val_r": 0.7356917474630699,
        "n_iterations": 357,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004123079590499401,
          "right_subspace_overlap_bottom_k": -0.008891246281564236,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.002129010856151581,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.002028773771598935,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0019540912471711636,
          "subspace_overlap": 0.0017753047868609428,
          "right_subspace_overlap": 0.006810033228248358,
          "activation_l2_distance": -0.0024834293872117996,
          "activation_cosine_similarity": 0.006169133819639683,
          "activation_magnitude_ratio": -0.0013178146909922361,
          "activation_dot_product": 0.0010433838469907641,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013001257553696632,
          "encoder_gradient_dot_product": 0.0011763419024646282,
          "input_gradient_cosine_similarity": 0.0034420976880937815,
          "input_gradient_l2_distance": -0.00807165540754795,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7489792048421116,
        "val_r": 0.7493075336029957,
        "n_iterations": 314,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0033433684147894382,
          "right_subspace_overlap_bottom_k": -0.011165331117808819,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0012483660830184817,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0015172016574069858,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.001431598560884595,
          "task_vector_cosine_similarity": 0.0013096145121380687,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0033218106254935265,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006485395133495331,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.009267369285225868,
          "activation_magnitude_ratio": -0.001959618180990219,
          "activation_dot_product": 0.0014021615497767925,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.017170468345284462,
          "encoder_gradient_dot_product": -0.0019372347742319107,
          "input_gradient_cosine_similarity": 0.001201448030769825,
          "input_gradient_l2_distance": -0.01112083625048399,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5377582770860767,
        "val_r": 0.4545180145235257,
        "n_iterations": 262,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011149607598781586,
          "right_subspace_overlap_bottom_k": -0.00990502443164587,
          "interaction_matrix_overlap_top_k": 0.0074616242200136185,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.003157667350023985,
          "effective_rank_mergeability_score": -0.0029026686679571867,
          "stable_rank": 0.0020812556613236666,
          "spectral_gap": -0.003767079208046198,
          "singular_value_ratio": 0.003214651718735695,
          "layerwise_effective_rank": 0.001903551397845149,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.005001392215490341,
          "task_vector_l2_distance": 0.0027950459625571966,
          "task_vector_dot_product": 0.009356082417070866,
          "weight_space_angle": -0.007157469168305397,
          "task_vector_magnitude_ratio": 0.0042809690348804,
          "singular_value_overlap": 0.007266528904438019,
          "subspace_overlap": 0.0029837985057383776,
          "right_subspace_overlap": 0.012081893160939217,
          "activation_l2_distance": -0.001137584913522005,
          "activation_cosine_similarity": 0.008489669300615788,
          "activation_magnitude_ratio": -0.0047652823850512505,
          "activation_dot_product": 0.01236993819475174,
          "encoder_gradient_cosine_similarity": 0.004798866808414459,
          "encoder_gradient_l2_distance": -0.018957726657390594,
          "encoder_gradient_dot_product": 0.001275714486837387,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.014026942662894726,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7597432499781291,
        "val_r": 0.7394650596511906,
        "n_iterations": 181,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00690007209777832,
          "right_subspace_overlap_bottom_k": -0.011490773409605026,
          "interaction_matrix_overlap_top_k": 0.0010332392994314432,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0014850833686068654,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0014479949604719877,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.001054266351275146,
          "task_vector_l2_distance": 0.0010047310497611761,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0017555209342390299,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005127580836415291,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004009398631751537,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.00920871365815401,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0017853295430541039,
          "encoder_gradient_l2_distance": -0.011040212586522102,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005136732943356037,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7640989126705746,
        "val_r": 0.8681077669167268,
        "n_iterations": 350,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0052687544375658035,
          "right_subspace_overlap_bottom_k": -0.013051792979240417,
          "interaction_matrix_overlap_top_k": 0.004647812806069851,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.003247868036851287,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0013358163414523005,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0022499042097479105,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0029793584253638983,
          "activation_l2_distance": -0.0022592961322516203,
          "activation_cosine_similarity": 0.00599423423409462,
          "activation_magnitude_ratio": -0.002724143210798502,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014950891956686974,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.003796098753809929,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7146031115713901,
        "val_r": 0.753077431902018,
        "n_iterations": 437,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.013017037883400917,
          "interaction_matrix_overlap_top_k": 0.00455487472936511,
          "interaction_matrix_overlap_bottom_k": 0.0012555464636534452,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0023569315671920776,
          "layerwise_effective_rank_mergeability_score": 0.0015539610758423805,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.004309171810746193,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005831524264067411,
          "activation_l2_distance": 0.0021884050220251083,
          "activation_cosine_similarity": 0.009779260493814945,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0027379710227251053,
          "encoder_gradient_cosine_similarity": 0.0023660052102059126,
          "encoder_gradient_l2_distance": -0.00800544023513794,
          "encoder_gradient_dot_product": 0.0012091356329619884,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.004753232467919588,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7220802925535983,
        "val_r": 0.6434840876742607,
        "n_iterations": 271,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006509613711386919,
          "right_subspace_overlap_bottom_k": -0.01594272069633007,
          "interaction_matrix_overlap_top_k": 0.005808302666991949,
          "interaction_matrix_overlap_bottom_k": -0.003455009311437607,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0018468741327524185,
          "singular_value_ratio": 0.0012419933918863535,
          "layerwise_effective_rank": -0.0023817671462893486,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0028062118217349052,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0029173349030315876,
          "weight_space_angle": -0.003702213056385517,
          "task_vector_magnitude_ratio": 0.001442682114429772,
          "singular_value_overlap": 0.007330550812184811,
          "subspace_overlap": -0.0010464100632816553,
          "right_subspace_overlap": 0.004426212050020695,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0060499911196529865,
          "activation_magnitude_ratio": -0.0025129884015768766,
          "activation_dot_product": 0.011490955948829651,
          "encoder_gradient_cosine_similarity": 0.0021580432076007128,
          "encoder_gradient_l2_distance": -0.016636764630675316,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01774664968252182,
          "input_gradient_dot_product": -0.00476971548050642
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7351809694584512,
        "val_r": 0.5833262940307162,
        "n_iterations": 294,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0042028664611279964,
          "right_subspace_overlap_bottom_k": -0.007776312530040741,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.001080938964150846,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0010913594160228968,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0027095999103039503,
          "weight_space_angle": 0.0012956801801919937,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.002908392809331417,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006503301206976175,
          "activation_l2_distance": -0.0016216569347307086,
          "activation_cosine_similarity": 0.007539503276348114,
          "activation_magnitude_ratio": -0.0012523403856903315,
          "activation_dot_product": 0.002856090199202299,
          "encoder_gradient_cosine_similarity": 0.004859393462538719,
          "encoder_gradient_l2_distance": -0.011652067303657532,
          "encoder_gradient_dot_product": 0.0010148773435503244,
          "input_gradient_cosine_similarity": 0.0010807502549141645,
          "input_gradient_l2_distance": -0.0064039211720228195,
          "input_gradient_dot_product": -0.00240437313914299
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8209938879037342,
        "val_r": 0.7169211353723542,
        "n_iterations": 409,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.009825140237808228,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.008854287676513195,
          "effective_rank": 0.0012290726881474257,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0018009901978075504,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0015363773563876748,
          "layerwise_effective_rank": -0.0031167762354016304,
          "layerwise_effective_rank_mergeability_score": 0.0013282508589327335,
          "task_vector_cosine_similarity": 0.0021431329660117626,
          "task_vector_l2_distance": -0.003637536196038127,
          "task_vector_dot_product": -0.00160032301209867,
          "weight_space_angle": -0.0030120969749987125,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005508167203515768,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.004871118348091841,
          "activation_cosine_similarity": 0.003745216177776456,
          "activation_magnitude_ratio": -0.0011879679514095187,
          "activation_dot_product": 0.01618899032473564,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.021614206954836845,
          "encoder_gradient_dot_product": 0.0014759463956579566,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.018029779195785522,
          "input_gradient_dot_product": -0.0032683927565813065
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_r": 0.421620837883215,
      "train_p": 4.64161144617585e-139,
      "val_r": 0.1070809943945154,
      "val_p": 0.04288718413441424
    },
    "per_fold_stats": {
      "train_r_mean": 0.5024487030867464,
      "train_r_std": 0.05680290509516255,
      "val_r_mean": 0.4055317888759008,
      "val_r_std": 0.14569052101049115,
      "n_nonzero_mean": 16.15,
      "n_nonzero_std": 4.065402809070707
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.000805655843578279,
      "right_subspace_overlap_bottom_k": 0.002635219134390354,
      "interaction_matrix_overlap_top_k": 3.265680425101891e-05,
      "interaction_matrix_overlap_bottom_k": 0.014827171340584755,
      "effective_rank": -0.00045544159365817904,
      "effective_rank_mergeability_score": 0.0003584517980925739,
      "stable_rank": -0.0006458301795646548,
      "spectral_gap": 0.0005114486557431519,
      "singular_value_ratio": -0.0005408239085227251,
      "layerwise_effective_rank": -0.00045433081686496735,
      "layerwise_effective_rank_mergeability_score": 0.0001990750606637448,
      "task_vector_cosine_similarity": 0.00024969756486825645,
      "task_vector_l2_distance": -0.009389296174049377,
      "task_vector_dot_product": -0.00043643469689413905,
      "weight_space_angle": 0.0001781316677806899,
      "task_vector_magnitude_ratio": -0.0010780319571495056,
      "singular_value_overlap": -0.009563101455569267,
      "subspace_overlap": 0.0007844320498406887,
      "right_subspace_overlap": -9.37360746320337e-05,
      "activation_l2_distance": -0.00047822119086049497,
      "activation_cosine_similarity": -0.0001839774486143142,
      "activation_magnitude_ratio": -0.0023684550542384386,
      "activation_dot_product": -0.0010212415363639593,
      "encoder_gradient_cosine_similarity": -0.00016947943367995322,
      "encoder_gradient_l2_distance": -0.005303363315761089,
      "encoder_gradient_dot_product": 0.00012993000564165413,
      "input_gradient_cosine_similarity": 0.0007108992431312799,
      "input_gradient_l2_distance": -0.011019079945981503,
      "input_gradient_dot_product": -0.0021924260072410107
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.0020825702231377363,
      "right_subspace_overlap_bottom_k": 0.003239803947508335,
      "interaction_matrix_overlap_top_k": 0.0010138218058273196,
      "interaction_matrix_overlap_bottom_k": 0.004454140551388264,
      "effective_rank": 0.0006450212677009404,
      "effective_rank_mergeability_score": 0.000757409434299916,
      "stable_rank": 0.0007352279499173164,
      "spectral_gap": 0.0008289241814054549,
      "singular_value_ratio": 0.0009193870355375111,
      "layerwise_effective_rank": 0.0007528779678978026,
      "layerwise_effective_rank_mergeability_score": 0.0008836191846057773,
      "task_vector_cosine_similarity": 0.0013643766287714243,
      "task_vector_l2_distance": 0.003601330565288663,
      "task_vector_dot_product": 0.0020834757015109062,
      "weight_space_angle": 0.0015238921623677015,
      "task_vector_magnitude_ratio": 0.000996178132481873,
      "singular_value_overlap": 0.0022803270258009434,
      "subspace_overlap": 0.0011169963981956244,
      "right_subspace_overlap": 0.0011875246418640018,
      "activation_l2_distance": 0.0019319171551615,
      "activation_cosine_similarity": 0.0007783207111060619,
      "activation_magnitude_ratio": 0.0008975396049208939,
      "activation_dot_product": 0.001674165716394782,
      "encoder_gradient_cosine_similarity": 0.000848659488838166,
      "encoder_gradient_l2_distance": 0.002117765136063099,
      "encoder_gradient_dot_product": 0.0012944330228492618,
      "input_gradient_cosine_similarity": 0.000991123029962182,
      "input_gradient_l2_distance": 0.0027732413727790117,
      "input_gradient_dot_product": 0.0015784751158207655
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.35,
      "right_subspace_overlap_bottom_k": 0.85,
      "interaction_matrix_overlap_top_k": 0.4,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 0.35,
      "effective_rank_mergeability_score": 0.35,
      "stable_rank": 0.45,
      "spectral_gap": 0.45,
      "singular_value_ratio": 0.3,
      "layerwise_effective_rank": 0.3,
      "layerwise_effective_rank_mergeability_score": 0.25,
      "task_vector_cosine_similarity": 0.4,
      "task_vector_l2_distance": 1.0,
      "task_vector_dot_product": 0.5,
      "weight_space_angle": 0.55,
      "task_vector_magnitude_ratio": 0.65,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.4,
      "right_subspace_overlap": 0.4,
      "activation_l2_distance": 0.6,
      "activation_cosine_similarity": 0.3,
      "activation_magnitude_ratio": 0.95,
      "activation_dot_product": 0.5,
      "encoder_gradient_cosine_similarity": 0.25,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.3,
      "input_gradient_cosine_similarity": 0.55,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.8
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.44571185559094634,
        "val_r": 0.4222463259977923,
        "n_iterations": 280,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0023203983437269926,
          "right_subspace_overlap_bottom_k": 0.0021194303408265114,
          "interaction_matrix_overlap_top_k": -0.001140923472121358,
          "interaction_matrix_overlap_bottom_k": 0.013346751220524311,
          "effective_rank": -0.0018136712023988366,
          "effective_rank_mergeability_score": 0.0011418345384299755,
          "stable_rank": -0.0016534366877749562,
          "spectral_gap": 0.0022520325146615505,
          "singular_value_ratio": -0.0023279183078557253,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0014915046049281955,
          "task_vector_l2_distance": -0.007901482284069061,
          "task_vector_dot_product": -0.003193603130057454,
          "weight_space_angle": 0.004511088132858276,
          "task_vector_magnitude_ratio": -0.0036335764452815056,
          "singular_value_overlap": -0.011697445064783096,
          "subspace_overlap": 0.0014839833602309227,
          "right_subspace_overlap": 0.0011793591547757387,
          "activation_l2_distance": -0.0035930625163018703,
          "activation_cosine_similarity": 0.0012809396721422672,
          "activation_magnitude_ratio": -0.002092531882226467,
          "activation_dot_product": -0.0033512571826577187,
          "encoder_gradient_cosine_similarity": -0.0014425376430153847,
          "encoder_gradient_l2_distance": -0.006484708283096552,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.007723072078078985,
          "input_gradient_dot_product": -0.005421279463917017
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.39286968024858393,
        "val_r": 0.4527938212566739,
        "n_iterations": 370,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002347813919186592,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.011839976534247398,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0012218230403959751,
          "stable_rank": 0.0,
          "spectral_gap": -0.0011791171273216605,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0012400668347254395,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.004510622937232256,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0010091352742165327,
          "singular_value_overlap": -0.009576906450092793,
          "subspace_overlap": 0.0019212467595934868,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002894094679504633,
          "activation_dot_product": -0.0026500271633267403,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008138502016663551,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.001103008515201509,
          "input_gradient_l2_distance": -0.009985480457544327,
          "input_gradient_dot_product": -0.0013316994300112128
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5091263655071478,
        "val_r": 0.48135550710057395,
        "n_iterations": 219,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0011311606504023075,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.015773914754390717,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.003730436787009239,
          "task_vector_l2_distance": -0.008537748828530312,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0019212665501981974,
          "task_vector_magnitude_ratio": -0.0012363189598545432,
          "singular_value_overlap": -0.009208344854414463,
          "subspace_overlap": 0.0011077579110860825,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0017499782843515277,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0017974991351366043,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.005102494265884161,
          "encoder_gradient_dot_product": 0.0014464739942923188,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010709858499467373,
          "input_gradient_dot_product": -0.0020882762037217617
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.461974952597424,
        "val_r": 0.49440456993283666,
        "n_iterations": 450,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.002531318925321102,
          "interaction_matrix_overlap_top_k": -0.0010171683970838785,
          "interaction_matrix_overlap_bottom_k": 0.018459107726812363,
          "effective_rank": -0.0010221963748335838,
          "effective_rank_mergeability_score": 0.0021201292984187603,
          "stable_rank": -0.0017331361304968596,
          "spectral_gap": 0.0010148759465664625,
          "singular_value_ratio": -0.0017621696460992098,
          "layerwise_effective_rank": -0.0015539826126769185,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.00967493001371622,
          "task_vector_dot_product": -0.0011629078071564436,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0012375029036775231,
          "singular_value_overlap": -0.01061371061950922,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002974801231175661,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.001663600793108344,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010411418043076992,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5676493249769774,
        "val_r": 0.5996495069981022,
        "n_iterations": 274,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.006091718561947346,
          "interaction_matrix_overlap_top_k": -0.0014750820118933916,
          "interaction_matrix_overlap_bottom_k": 0.01552807167172432,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01384891476482153,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0010690196650102735,
          "singular_value_overlap": -0.010451487265527248,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0018930187216028571,
          "activation_l2_distance": 0.00212780199944973,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002306812908500433,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0014547175960615277,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0122010363265872,
          "input_gradient_dot_product": -0.002056861063465476
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.44870857452606383,
        "val_r": 0.775132297944561,
        "n_iterations": 170,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0014500803081318736,
          "right_subspace_overlap_bottom_k": 0.004181359428912401,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.022548800334334373,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.001125953858718276,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.001018450129777193,
          "task_vector_cosine_similarity": 0.0035276487469673157,
          "task_vector_l2_distance": -0.011588611640036106,
          "task_vector_dot_product": 0.001334197586402297,
          "weight_space_angle": -0.0010486497776582837,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.010213136672973633,
          "subspace_overlap": 0.0014709761599078774,
          "right_subspace_overlap": 0.0010734976967796683,
          "activation_l2_distance": 0.0011034727795049548,
          "activation_cosine_similarity": -0.0015862511936575174,
          "activation_magnitude_ratio": -0.0023220342118293047,
          "activation_dot_product": 0.0010268723126500845,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.007174415048211813,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0011241178726777434,
          "input_gradient_l2_distance": -0.011929403059184551,
          "input_gradient_dot_product": -0.001540245721116662
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5821125889266203,
        "val_r": 0.14645334625705625,
        "n_iterations": 296,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0012238050112500787,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.015305436216294765,
          "effective_rank": -0.0010979793732985854,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012277838541194797,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0012690227013081312,
          "task_vector_l2_distance": -0.007482216227799654,
          "task_vector_dot_product": -0.0041897352784872055,
          "weight_space_angle": 0.001013915054500103,
          "task_vector_magnitude_ratio": -0.0015986048383638263,
          "singular_value_overlap": -0.008794387802481651,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0010664567817002535,
          "activation_l2_distance": -0.0037347530014812946,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.004996657371520996,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.007537780795246363,
          "encoder_gradient_dot_product": 0.001392293837852776,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010918382555246353,
          "input_gradient_dot_product": -0.0033074317034333944
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.45684139809392077,
        "val_r": 0.29162013931463054,
        "n_iterations": 346,
        "n_nonzero_coefficients": 11,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0018539070151746273,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.017741352319717407,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010144067928195,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.009122844785451889,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.001834700582548976,
          "activation_magnitude_ratio": -0.0024103899486362934,
          "activation_dot_product": -0.0037911534309387207,
          "encoder_gradient_cosine_similarity": 0.0024318513460457325,
          "encoder_gradient_l2_distance": -0.0044255065731704235,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.006046957802027464,
          "input_gradient_dot_product": -0.0013490698765963316
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5229965223968887,
        "val_r": 0.4301127952767928,
        "n_iterations": 192,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0050124856643378735,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.01410472672432661,
          "effective_rank": -0.0011550089111551642,
          "effective_rank_mergeability_score": 0.0010081508662551641,
          "stable_rank": -0.0014482707483693957,
          "spectral_gap": 0.0013177110813558102,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0011779589112848043,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0012908177450299263,
          "task_vector_l2_distance": -0.013642065227031708,
          "task_vector_dot_product": -0.0012243182864040136,
          "weight_space_angle": -0.001292425673455,
          "task_vector_magnitude_ratio": -0.0024761250242590904,
          "singular_value_overlap": -0.010678036138415337,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0012710430892184377,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002535407431423664,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.006084258668124676,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0015526553615927696,
          "input_gradient_l2_distance": -0.012652521952986717,
          "input_gradient_dot_product": -0.001978909131139517
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5416763123362207,
        "val_r": 0.12554357039016265,
        "n_iterations": 302,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0011104519944638014,
          "interaction_matrix_overlap_bottom_k": 0.01901133731007576,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009270046837627888,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010757308918982744,
          "task_vector_magnitude_ratio": -0.0011221537133678794,
          "singular_value_overlap": -0.0117877759039402,
          "subspace_overlap": 0.0011610242072492838,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002654546871781349,
          "activation_dot_product": -0.002929706359282136,
          "encoder_gradient_cosine_similarity": -0.0020852030720561743,
          "encoder_gradient_l2_distance": -0.003764198161661625,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.0016281340504065156,
          "input_gradient_l2_distance": -0.011006636545062065,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.512786172081922,
        "val_r": 0.40026867601164595,
        "n_iterations": 285,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004650072194635868,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.01773810014128685,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0013689125189557672,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.013224311172962189,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0011978994589298964,
          "singular_value_overlap": -0.012077565304934978,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.002903333166614175,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0030341418460011482,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.007036716677248478,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0018709942232817411,
          "input_gradient_l2_distance": -0.01156660821288824,
          "input_gradient_dot_product": -0.0018999448511749506
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.45062470296605384,
        "val_r": 0.31427006149389736,
        "n_iterations": 205,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0019071708666160703,
          "right_subspace_overlap_bottom_k": -0.0013132755411788821,
          "interaction_matrix_overlap_top_k": -0.00224139541387558,
          "interaction_matrix_overlap_bottom_k": 0.012960173189640045,
          "effective_rank": -0.0010479460470378399,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0013522794470191002,
          "spectral_gap": 0.0014064429560676217,
          "singular_value_ratio": -0.0012832351494580507,
          "layerwise_effective_rank": -0.0010870866244658828,
          "layerwise_effective_rank_mergeability_score": 0.0014384605456143618,
          "task_vector_cosine_similarity": -0.0012599441688507795,
          "task_vector_l2_distance": -0.006917568854987621,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001555847586132586,
          "singular_value_overlap": -0.00688306475058198,
          "subspace_overlap": 0.0022116354666650295,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0017668663058429956,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.0010943937813863158,
          "encoder_gradient_l2_distance": -0.004904343280941248,
          "encoder_gradient_dot_product": -0.0012080720625817776,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.007916110567748547,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.4531981215851895,
        "val_r": 0.4817735515808811,
        "n_iterations": 296,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0014351021964102983,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.018854252994060516,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009138327091932297,
          "task_vector_dot_product": 0.003216539043933153,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.010195150040090084,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.001034726737998426,
          "activation_l2_distance": 0.0019723628647625446,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0015764669515192509,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0057089561596512794,
          "encoder_gradient_dot_product": 0.004646002314984798,
          "input_gradient_cosine_similarity": 0.0027144313789904118,
          "input_gradient_l2_distance": -0.0109324986115098,
          "input_gradient_dot_product": -0.002830484649166465
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5092316254651469,
        "val_r": 0.5570392266193287,
        "n_iterations": 441,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0038765829522162676,
          "interaction_matrix_overlap_top_k": 0.001891683554276824,
          "interaction_matrix_overlap_bottom_k": 0.012549313716590405,
          "effective_rank": -0.0012847371399402618,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010844095377251506,
          "task_vector_l2_distance": -0.009684487245976925,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0023163175210356712,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.009575161151587963,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0015075546689331532,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0019793016836047173,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.001199305639602244,
          "encoder_gradient_l2_distance": -0.0048032477498054504,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0013692504726350307,
          "input_gradient_l2_distance": -0.010200755670666695,
          "input_gradient_dot_product": -0.0021259940695017576
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.453310627391652,
        "val_r": 0.47313669749576975,
        "n_iterations": 223,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0018236563773825765,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.014656581915915012,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010521027259528637,
          "task_vector_dot_product": 0.0010526261758059263,
          "weight_space_angle": -0.0017765236552804708,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.011949615553021431,
          "subspace_overlap": 0.0022469155956059694,
          "right_subspace_overlap": 0.0025337375700473785,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0025384072214365005,
          "activation_dot_product": -0.0010790566448122263,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0065032243728637695,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0014968190807849169,
          "input_gradient_l2_distance": -0.013079710304737091,
          "input_gradient_dot_product": -0.0036103278398513794
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5099625093628805,
        "val_r": 0.3708040488278689,
        "n_iterations": 282,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.002914929296821356,
          "interaction_matrix_overlap_top_k": 0.0016745371976867318,
          "interaction_matrix_overlap_bottom_k": 0.011722266674041748,
          "effective_rank": -0.0016872929409146309,
          "effective_rank_mergeability_score": 0.0012064606416970491,
          "stable_rank": -0.0012113905977457762,
          "spectral_gap": 0.001147003029473126,
          "singular_value_ratio": -0.001252182642929256,
          "layerwise_effective_rank": -0.001244403189048171,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010555845685303211,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0014293510466814041,
          "singular_value_overlap": -0.00532348221167922,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0014432856114581227,
          "activation_cosine_similarity": -0.0016111378790810704,
          "activation_magnitude_ratio": -0.00407773582264781,
          "activation_dot_product": -0.0022621818352490664,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.005802331492304802,
          "encoder_gradient_dot_product": -0.001771858660504222,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01084964070469141,
          "input_gradient_dot_product": -0.003138167317956686
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5089611192108546,
        "val_r": 0.32915354571429495,
        "n_iterations": 237,
        "n_nonzero_coefficients": 9,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.005366808269172907,
          "interaction_matrix_overlap_top_k": 0.0018510326044633985,
          "interaction_matrix_overlap_bottom_k": 0.011521491222083569,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01029190979897976,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.009727745316922665,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002283476060256362,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0020906743593513966,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0012549696257337928,
          "input_gradient_l2_distance": -0.011020966805517673,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5267837371146333,
        "val_r": 0.2635261604396759,
        "n_iterations": 221,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0063421051017940044,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.018129749223589897,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0013284790329635143,
          "stable_rank": -0.0018927042838186026,
          "spectral_gap": 0.001919551519677043,
          "singular_value_ratio": -0.003152377437800169,
          "layerwise_effective_rank": -0.0013638725504279137,
          "layerwise_effective_rank_mergeability_score": 0.002056812634691596,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0070373909547924995,
          "task_vector_dot_product": -0.005632298532873392,
          "weight_space_angle": 0.001785901258699596,
          "task_vector_magnitude_ratio": -0.002646197099238634,
          "singular_value_overlap": -0.009749110788106918,
          "subspace_overlap": 0.004085102118551731,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.003513542003929615,
          "activation_cosine_similarity": 0.001191473682411015,
          "activation_magnitude_ratio": -0.004425188060849905,
          "activation_dot_product": -0.0014854302862659097,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0027938843704760075,
          "encoder_gradient_dot_product": -0.0019062390783801675,
          "input_gradient_cosine_similarity": 0.001613496569916606,
          "input_gradient_l2_distance": -0.01902633160352707,
          "input_gradient_dot_product": -0.005622257478535175
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6405888430379537,
        "val_r": 0.35591086836630675,
        "n_iterations": 359,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008604146540164948,
          "right_subspace_overlap_bottom_k": -0.0011452274629846215,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0015858043916523457,
          "stable_rank": -0.0010286883916705847,
          "spectral_gap": 0.0012245199177414179,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0026593119837343693,
          "layerwise_effective_rank_mergeability_score": 0.002744744997471571,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0015563133638352156,
          "task_vector_dot_product": -0.0021564646158367395,
          "weight_space_angle": 0.0015031910734251142,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0024986830540001392,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0035677198320627213,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.00196931604295969,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.009542731568217278,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.007053387816995382,
          "input_gradient_dot_product": -0.0035294685512781143
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5538590283178486,
        "val_r": 0.3454410604991651,
        "n_iterations": 231,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0023703977931290865,
          "right_subspace_overlap_bottom_k": 0.011524985544383526,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.014752030372619629,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0010385948698967695,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.001962746027857065,
          "task_vector_l2_distance": -0.015370659530162811,
          "task_vector_dot_product": 0.0032272711396217346,
          "weight_space_angle": 0.00202799029648304,
          "task_vector_magnitude_ratio": -0.0013489078264683485,
          "singular_value_overlap": -0.01113838329911232,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0034655241761356592,
          "activation_l2_distance": 0.0013434863649308681,
          "activation_cosine_similarity": -0.0011198726715520024,
          "activation_magnitude_ratio": -0.0017300860490649939,
          "activation_dot_product": 0.0010937649058178067,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.005050968378782272,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0017463758122175932,
          "input_gradient_l2_distance": -0.015150820836424828,
          "input_gradient_dot_product": -0.002018110593780875
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  }
}