{
  "excluded_metrics": [
    "activation_cosine_similarity",
    "activation_dot_product",
    "activation_l2_distance",
    "activation_magnitude_ratio"
  ],
  "n_metrics_used": 25,
  "metrics_used": [
    "right_subspace_overlap_top_k",
    "right_subspace_overlap_bottom_k",
    "interaction_matrix_overlap_top_k",
    "interaction_matrix_overlap_bottom_k",
    "effective_rank",
    "effective_rank_mergeability_score",
    "stable_rank",
    "spectral_gap",
    "singular_value_ratio",
    "layerwise_effective_rank",
    "layerwise_effective_rank_mergeability_score",
    "task_vector_cosine_similarity",
    "task_vector_l2_distance",
    "task_vector_dot_product",
    "weight_space_angle",
    "task_vector_magnitude_ratio",
    "singular_value_overlap",
    "subspace_overlap",
    "right_subspace_overlap",
    "encoder_gradient_cosine_similarity",
    "encoder_gradient_l2_distance",
    "encoder_gradient_dot_product",
    "input_gradient_cosine_similarity",
    "input_gradient_l2_distance",
    "input_gradient_dot_product"
  ],
  "methods": {
    "weight_avg": {
      "aggregate_metrics": {
        "train_r": 0.3081560084998685,
        "train_p": 7.815410353686358e-72,
        "val_r": 0.25023409597565494,
        "val_p": 1.6301159313618725e-06
      },
      "per_fold_stats": {
        "train_r_mean": 0.5987373357814293,
        "train_r_std": 0.14894481906902488,
        "val_r_mean": 0.5136336458395625,
        "val_r_std": 0.174851013861217
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 30.061878204345703,
        "right_subspace_overlap_bottom_k": -20.329557418823242,
        "interaction_matrix_overlap_top_k": 28.193359375,
        "interaction_matrix_overlap_bottom_k": -13.377527236938477,
        "effective_rank": -0.3749411702156067,
        "effective_rank_mergeability_score": -12.241896629333496,
        "stable_rank": -20.168991088867188,
        "spectral_gap": 2.6433753967285156,
        "singular_value_ratio": 10.26717758178711,
        "layerwise_effective_rank": -4.108586311340332,
        "layerwise_effective_rank_mergeability_score": 6.143611907958984,
        "task_vector_cosine_similarity": 19.856746673583984,
        "task_vector_l2_distance": -13.014312744140625,
        "task_vector_dot_product": 13.921127319335938,
        "weight_space_angle": -10.037684440612793,
        "task_vector_magnitude_ratio": 0.29567378759384155,
        "singular_value_overlap": 1.439159631729126,
        "subspace_overlap": -0.02333373948931694,
        "right_subspace_overlap": 3.858647108078003,
        "encoder_gradient_cosine_similarity": 27.874353408813477,
        "encoder_gradient_l2_distance": -24.457103729248047,
        "encoder_gradient_dot_product": 29.208438873291016,
        "input_gradient_cosine_similarity": 6.365433692932129,
        "input_gradient_l2_distance": -44.449974060058594,
        "input_gradient_dot_product": -16.545608520507812
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 52.609100341796875,
        "right_subspace_overlap_bottom_k": 30.47812271118164,
        "interaction_matrix_overlap_top_k": 40.6084098815918,
        "interaction_matrix_overlap_bottom_k": 27.854665756225586,
        "effective_rank": 32.2656364440918,
        "effective_rank_mergeability_score": 53.114585876464844,
        "stable_rank": 43.567291259765625,
        "spectral_gap": 33.306304931640625,
        "singular_value_ratio": 25.40228271484375,
        "layerwise_effective_rank": 37.01395034790039,
        "layerwise_effective_rank_mergeability_score": 53.09374237060547,
        "task_vector_cosine_similarity": 63.90947341918945,
        "task_vector_l2_distance": 29.839933395385742,
        "task_vector_dot_product": 21.28866958618164,
        "weight_space_angle": 30.869651794433594,
        "task_vector_magnitude_ratio": 25.6010684967041,
        "singular_value_overlap": 21.03470230102539,
        "subspace_overlap": 34.6933479309082,
        "right_subspace_overlap": 46.115211486816406,
        "encoder_gradient_cosine_similarity": 36.19207763671875,
        "encoder_gradient_l2_distance": 36.33167266845703,
        "encoder_gradient_dot_product": 40.47578048706055,
        "input_gradient_cosine_similarity": 20.162046432495117,
        "input_gradient_l2_distance": 49.66156768798828,
        "input_gradient_dot_product": 37.42958068847656
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6800711387035088,
          "val_r": 0.7673876336194255,
          "n_iterations": 801,
          "coefficients": {
            "right_subspace_overlap_top_k": 16.509336471557617,
            "right_subspace_overlap_bottom_k": -15.20195198059082,
            "interaction_matrix_overlap_top_k": 11.09233570098877,
            "interaction_matrix_overlap_bottom_k": 3.27517032623291,
            "effective_rank": 9.639944076538086,
            "effective_rank_mergeability_score": 5.114923000335693,
            "stable_rank": -0.7865902781486511,
            "spectral_gap": 2.5499067306518555,
            "singular_value_ratio": -0.0562378466129303,
            "layerwise_effective_rank": 10.091578483581543,
            "layerwise_effective_rank_mergeability_score": 11.99970531463623,
            "task_vector_cosine_similarity": -12.196418762207031,
            "task_vector_l2_distance": -9.61866569519043,
            "task_vector_dot_product": -4.159532070159912,
            "weight_space_angle": 4.019112586975098,
            "task_vector_magnitude_ratio": -2.101897954940796,
            "singular_value_overlap": -6.418807029724121,
            "subspace_overlap": 0.4599720239639282,
            "right_subspace_overlap": 11.69342041015625,
            "encoder_gradient_cosine_similarity": 8.803751945495605,
            "encoder_gradient_l2_distance": -28.447372436523438,
            "encoder_gradient_dot_product": 5.049064636230469,
            "input_gradient_cosine_similarity": 2.8171329498291016,
            "input_gradient_l2_distance": -10.783092498779297,
            "input_gradient_dot_product": -12.346527099609375
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6837504612689993,
          "val_r": 0.7189276147633015,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.6399855613708496,
            "right_subspace_overlap_bottom_k": -3.695446014404297,
            "interaction_matrix_overlap_top_k": 0.6654148697853088,
            "interaction_matrix_overlap_bottom_k": -1.5910449028015137,
            "effective_rank": 3.5655531883239746,
            "effective_rank_mergeability_score": 8.364029884338379,
            "stable_rank": -2.6399173736572266,
            "spectral_gap": -0.9255524277687073,
            "singular_value_ratio": 2.183548927307129,
            "layerwise_effective_rank": 4.838817596435547,
            "layerwise_effective_rank_mergeability_score": 0.06050168350338936,
            "task_vector_cosine_similarity": 2.4624264240264893,
            "task_vector_l2_distance": -5.223520755767822,
            "task_vector_dot_product": 0.07695663720369339,
            "weight_space_angle": 3.0180301666259766,
            "task_vector_magnitude_ratio": -2.2747232913970947,
            "singular_value_overlap": -0.3282022774219513,
            "subspace_overlap": -2.4654040336608887,
            "right_subspace_overlap": 8.780803680419922,
            "encoder_gradient_cosine_similarity": 3.978753089904785,
            "encoder_gradient_l2_distance": -12.913397789001465,
            "encoder_gradient_dot_product": 4.006263256072998,
            "input_gradient_cosine_similarity": 0.32609352469444275,
            "input_gradient_l2_distance": -8.66537094116211,
            "input_gradient_dot_product": -4.245733261108398
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6771207093304432,
          "val_r": 0.562760785804842,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 11.370861053466797,
            "right_subspace_overlap_bottom_k": -19.793846130371094,
            "interaction_matrix_overlap_top_k": 16.91474723815918,
            "interaction_matrix_overlap_bottom_k": -2.2463645935058594,
            "effective_rank": -2.9859530925750732,
            "effective_rank_mergeability_score": 8.84941291809082,
            "stable_rank": -9.922136306762695,
            "spectral_gap": -3.7297604084014893,
            "singular_value_ratio": 9.529345512390137,
            "layerwise_effective_rank": 2.6267974376678467,
            "layerwise_effective_rank_mergeability_score": -5.482705593109131,
            "task_vector_cosine_similarity": 15.630732536315918,
            "task_vector_l2_distance": -7.503546714782715,
            "task_vector_dot_product": -2.289834976196289,
            "weight_space_angle": 12.369190216064453,
            "task_vector_magnitude_ratio": -4.1878461837768555,
            "singular_value_overlap": -1.9424912929534912,
            "subspace_overlap": 7.218624591827393,
            "right_subspace_overlap": 7.678624153137207,
            "encoder_gradient_cosine_similarity": 10.127492904663086,
            "encoder_gradient_l2_distance": -15.921706199645996,
            "encoder_gradient_dot_product": 11.06100845336914,
            "input_gradient_cosine_similarity": 5.068501949310303,
            "input_gradient_l2_distance": -20.847702026367188,
            "input_gradient_dot_product": -20.592918395996094
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6902502513832667,
          "val_r": 0.49327028669520123,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.373915433883667,
            "right_subspace_overlap_bottom_k": -3.5619583129882812,
            "interaction_matrix_overlap_top_k": 3.542733907699585,
            "interaction_matrix_overlap_bottom_k": 0.8806107640266418,
            "effective_rank": 5.429708003997803,
            "effective_rank_mergeability_score": 2.325190305709839,
            "stable_rank": -4.662481784820557,
            "spectral_gap": 0.677977979183197,
            "singular_value_ratio": -2.9499404430389404,
            "layerwise_effective_rank": 0.8714336156845093,
            "layerwise_effective_rank_mergeability_score": 0.42357364296913147,
            "task_vector_cosine_similarity": 2.975113868713379,
            "task_vector_l2_distance": -1.683394193649292,
            "task_vector_dot_product": -3.214970111846924,
            "weight_space_angle": 2.0112197399139404,
            "task_vector_magnitude_ratio": 4.253445148468018,
            "singular_value_overlap": -0.8554108142852783,
            "subspace_overlap": -2.262190341949463,
            "right_subspace_overlap": 2.396235942840576,
            "encoder_gradient_cosine_similarity": 2.3141422271728516,
            "encoder_gradient_l2_distance": -5.82631254196167,
            "encoder_gradient_dot_product": 2.156752586364746,
            "input_gradient_cosine_similarity": 0.07361587136983871,
            "input_gradient_l2_distance": -5.06129789352417,
            "input_gradient_dot_product": -2.628453016281128
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6139158966397267,
          "val_r": 0.5684829030606675,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 26.99551773071289,
            "right_subspace_overlap_bottom_k": -19.896385192871094,
            "interaction_matrix_overlap_top_k": -5.858401775360107,
            "interaction_matrix_overlap_bottom_k": -33.29988098144531,
            "effective_rank": -61.70061111450195,
            "effective_rank_mergeability_score": -9.103799819946289,
            "stable_rank": -45.637386322021484,
            "spectral_gap": 24.276912689208984,
            "singular_value_ratio": 20.788732528686523,
            "layerwise_effective_rank": 59.28065490722656,
            "layerwise_effective_rank_mergeability_score": -21.271751403808594,
            "task_vector_cosine_similarity": 5.317526340484619,
            "task_vector_l2_distance": -29.817243576049805,
            "task_vector_dot_product": 54.135128021240234,
            "weight_space_angle": 22.58089256286621,
            "task_vector_magnitude_ratio": 19.47783851623535,
            "singular_value_overlap": 0.4646006226539612,
            "subspace_overlap": -22.472562789916992,
            "right_subspace_overlap": 59.21455001831055,
            "encoder_gradient_cosine_similarity": 28.748872756958008,
            "encoder_gradient_l2_distance": -61.168052673339844,
            "encoder_gradient_dot_product": 11.890721321105957,
            "input_gradient_cosine_similarity": 15.324645042419434,
            "input_gradient_l2_distance": -4.445045471191406,
            "input_gradient_dot_product": -32.82707595825195
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.5566351657736085,
          "val_r": 0.4549692508470823,
          "n_iterations": 502,
          "coefficients": {
            "right_subspace_overlap_top_k": 51.527347564697266,
            "right_subspace_overlap_bottom_k": -25.373693466186523,
            "interaction_matrix_overlap_top_k": -2.2782270908355713,
            "interaction_matrix_overlap_bottom_k": -18.338947296142578,
            "effective_rank": 91.98855590820312,
            "effective_rank_mergeability_score": 115.03936004638672,
            "stable_rank": -31.801433563232422,
            "spectral_gap": 39.155296325683594,
            "singular_value_ratio": -3.3004889488220215,
            "layerwise_effective_rank": 7.482936859130859,
            "layerwise_effective_rank_mergeability_score": -107.3845443725586,
            "task_vector_cosine_similarity": -66.71881866455078,
            "task_vector_l2_distance": -33.30224609375,
            "task_vector_dot_product": 50.51726531982422,
            "weight_space_angle": -88.4361343383789,
            "task_vector_magnitude_ratio": -30.457529067993164,
            "singular_value_overlap": 1.4891736507415771,
            "subspace_overlap": -21.663787841796875,
            "right_subspace_overlap": 79.3016357421875,
            "encoder_gradient_cosine_similarity": -18.91836166381836,
            "encoder_gradient_l2_distance": 5.655179500579834,
            "encoder_gradient_dot_product": 74.22525024414062,
            "input_gradient_cosine_similarity": 44.52933883666992,
            "input_gradient_l2_distance": -151.37969970703125,
            "input_gradient_dot_product": 39.439674377441406
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.5709257636377174,
          "val_r": 0.43647404198823764,
          "n_iterations": 804,
          "coefficients": {
            "right_subspace_overlap_top_k": 69.45716094970703,
            "right_subspace_overlap_bottom_k": -15.043959617614746,
            "interaction_matrix_overlap_top_k": 67.38423156738281,
            "interaction_matrix_overlap_bottom_k": -51.43782043457031,
            "effective_rank": -20.7965087890625,
            "effective_rank_mergeability_score": -81.89859771728516,
            "stable_rank": -50.456172943115234,
            "spectral_gap": 87.5328598022461,
            "singular_value_ratio": 7.410624980926514,
            "layerwise_effective_rank": 39.395965576171875,
            "layerwise_effective_rank_mergeability_score": -11.87989616394043,
            "task_vector_cosine_similarity": 38.193546295166016,
            "task_vector_l2_distance": -47.11946105957031,
            "task_vector_dot_product": 28.104564666748047,
            "weight_space_angle": -38.018131256103516,
            "task_vector_magnitude_ratio": 9.58967399597168,
            "singular_value_overlap": -10.514525413513184,
            "subspace_overlap": -38.79973220825195,
            "right_subspace_overlap": -37.614742279052734,
            "encoder_gradient_cosine_similarity": 33.59958267211914,
            "encoder_gradient_l2_distance": -34.18234634399414,
            "encoder_gradient_dot_product": 121.65654754638672,
            "input_gradient_cosine_similarity": 4.4635009765625,
            "input_gradient_l2_distance": -103.95075225830078,
            "input_gradient_dot_product": 35.92245864868164
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.659397667084712,
          "val_r": 0.26611036914620506,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 6.453690528869629,
            "right_subspace_overlap_bottom_k": -2.5460944175720215,
            "interaction_matrix_overlap_top_k": -0.0660906583070755,
            "interaction_matrix_overlap_bottom_k": -2.0602755546569824,
            "effective_rank": 0.752940833568573,
            "effective_rank_mergeability_score": 3.271496295928955,
            "stable_rank": 2.9769363403320312,
            "spectral_gap": -0.432425320148468,
            "singular_value_ratio": 2.276301145553589,
            "layerwise_effective_rank": -0.15978609025478363,
            "layerwise_effective_rank_mergeability_score": 1.3567626476287842,
            "task_vector_cosine_similarity": 3.5991389751434326,
            "task_vector_l2_distance": -5.188724040985107,
            "task_vector_dot_product": -4.094612121582031,
            "weight_space_angle": 1.8904316425323486,
            "task_vector_magnitude_ratio": -3.653193712234497,
            "singular_value_overlap": -0.9910544157028198,
            "subspace_overlap": -3.3678550720214844,
            "right_subspace_overlap": 8.760705947875977,
            "encoder_gradient_cosine_similarity": 3.9308009147644043,
            "encoder_gradient_l2_distance": -10.23470687866211,
            "encoder_gradient_dot_product": 3.1227807998657227,
            "input_gradient_cosine_similarity": 1.518373966217041,
            "input_gradient_l2_distance": -5.589851379394531,
            "input_gradient_dot_product": -0.5268537402153015
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.026684118795944917,
          "val_r": 0.3412605083858768,
          "n_iterations": 51,
          "coefficients": {
            "right_subspace_overlap_top_k": -0.21472038328647614,
            "right_subspace_overlap_bottom_k": -0.368704229593277,
            "interaction_matrix_overlap_top_k": 0.6981685161590576,
            "interaction_matrix_overlap_bottom_k": -0.22596313059329987,
            "effective_rank": 0.46845507621765137,
            "effective_rank_mergeability_score": -0.10270346701145172,
            "stable_rank": 0.0017264913767576218,
            "spectral_gap": -0.5409911870956421,
            "singular_value_ratio": 0.16478222608566284,
            "layerwise_effective_rank": 0.09410392493009567,
            "layerwise_effective_rank_mergeability_score": 0.07272721081972122,
            "task_vector_cosine_similarity": -0.18091194331645966,
            "task_vector_l2_distance": -0.23897671699523926,
            "task_vector_dot_product": 0.2697652280330658,
            "weight_space_angle": -0.05914029851555824,
            "task_vector_magnitude_ratio": 0.7143641114234924,
            "singular_value_overlap": -0.5937680602073669,
            "subspace_overlap": 0.1128772646188736,
            "right_subspace_overlap": 0.5173827409744263,
            "encoder_gradient_cosine_similarity": 0.20932653546333313,
            "encoder_gradient_l2_distance": 0.08826428651809692,
            "encoder_gradient_dot_product": -0.06828498840332031,
            "input_gradient_cosine_similarity": 0.18597009778022766,
            "input_gradient_l2_distance": -0.11798095703125,
            "input_gradient_dot_product": 0.13682448863983154
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5978105385040435,
          "val_r": 0.4417539351818198,
          "n_iterations": 806,
          "coefficients": {
            "right_subspace_overlap_top_k": 93.02692413330078,
            "right_subspace_overlap_bottom_k": -77.25761413574219,
            "interaction_matrix_overlap_top_k": 24.553150177001953,
            "interaction_matrix_overlap_bottom_k": -55.95151138305664,
            "effective_rank": -48.20625686645508,
            "effective_rank_mergeability_score": 7.499451637268066,
            "stable_rank": -23.690980911254883,
            "spectral_gap": 10.717833518981934,
            "singular_value_ratio": 13.968156814575195,
            "layerwise_effective_rank": -45.79341506958008,
            "layerwise_effective_rank_mergeability_score": -56.51004409790039,
            "task_vector_cosine_similarity": 68.09501647949219,
            "task_vector_l2_distance": 46.525325775146484,
            "task_vector_dot_product": -21.348344802856445,
            "weight_space_angle": 13.287802696228027,
            "task_vector_magnitude_ratio": 45.032962799072266,
            "singular_value_overlap": 24.913707733154297,
            "subspace_overlap": 30.985841751098633,
            "right_subspace_overlap": 13.31196403503418,
            "encoder_gradient_cosine_similarity": 4.058264255523682,
            "encoder_gradient_l2_distance": 12.97447681427002,
            "encoder_gradient_dot_product": 49.34876251220703,
            "input_gradient_cosine_similarity": 26.96826934814453,
            "input_gradient_l2_distance": -76.56171417236328,
            "input_gradient_dot_product": -78.94986724853516
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5902291140106712,
          "val_r": 0.21847658746943538,
          "n_iterations": 425,
          "coefficients": {
            "right_subspace_overlap_top_k": 42.39413833618164,
            "right_subspace_overlap_bottom_k": -17.67967414855957,
            "interaction_matrix_overlap_top_k": 31.120384216308594,
            "interaction_matrix_overlap_bottom_k": 0.23338955640792847,
            "effective_rank": 29.830162048339844,
            "effective_rank_mergeability_score": 52.30778503417969,
            "stable_rank": -115.5929183959961,
            "spectral_gap": -35.83604049682617,
            "singular_value_ratio": 66.97175598144531,
            "layerwise_effective_rank": 23.441162109375,
            "layerwise_effective_rank_mergeability_score": -51.22582244873047,
            "task_vector_cosine_similarity": 60.935428619384766,
            "task_vector_l2_distance": 10.248490333557129,
            "task_vector_dot_product": 3.5813472270965576,
            "weight_space_angle": -12.146636009216309,
            "task_vector_magnitude_ratio": -52.0915412902832,
            "singular_value_overlap": 47.36117172241211,
            "subspace_overlap": -46.00664138793945,
            "right_subspace_overlap": 8.1957368850708,
            "encoder_gradient_cosine_similarity": 39.62770462036133,
            "encoder_gradient_l2_distance": -79.95745849609375,
            "encoder_gradient_dot_product": 35.00328063964844,
            "input_gradient_cosine_similarity": -4.928718566894531,
            "input_gradient_l2_distance": -60.78287887573242,
            "input_gradient_dot_product": 25.99305534362793
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.704532694397987,
          "val_r": 0.7027827769622037,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 4.24968147277832,
            "right_subspace_overlap_bottom_k": -2.6405181884765625,
            "interaction_matrix_overlap_top_k": 0.1740407645702362,
            "interaction_matrix_overlap_bottom_k": -0.16948729753494263,
            "effective_rank": 0.3221634030342102,
            "effective_rank_mergeability_score": 0.924318790435791,
            "stable_rank": 0.3408426344394684,
            "spectral_gap": 1.268438458442688,
            "singular_value_ratio": 0.7337084412574768,
            "layerwise_effective_rank": 1.2363492250442505,
            "layerwise_effective_rank_mergeability_score": 0.3539445102214813,
            "task_vector_cosine_similarity": -0.8145534992218018,
            "task_vector_l2_distance": -1.3721877336502075,
            "task_vector_dot_product": 0.2093021124601364,
            "weight_space_angle": 2.137883424758911,
            "task_vector_magnitude_ratio": -0.34138453006744385,
            "singular_value_overlap": -0.28931331634521484,
            "subspace_overlap": -0.7480429410934448,
            "right_subspace_overlap": 2.1907029151916504,
            "encoder_gradient_cosine_similarity": 1.3220607042312622,
            "encoder_gradient_l2_distance": -4.252832412719727,
            "encoder_gradient_dot_product": 1.2749375104904175,
            "input_gradient_cosine_similarity": 0.15900030732154846,
            "input_gradient_l2_distance": -3.2705647945404053,
            "input_gradient_dot_product": -1.9989144802093506
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5388832538366963,
          "val_r": 0.7028412508240647,
          "n_iterations": 799,
          "coefficients": {
            "right_subspace_overlap_top_k": 114.86746978759766,
            "right_subspace_overlap_bottom_k": -92.87462615966797,
            "interaction_matrix_overlap_top_k": 80.49569702148438,
            "interaction_matrix_overlap_bottom_k": -70.75859832763672,
            "effective_rank": -39.3358039855957,
            "effective_rank_mergeability_score": -153.00323486328125,
            "stable_rank": 97.77800750732422,
            "spectral_gap": 50.088279724121094,
            "singular_value_ratio": 1.8461596965789795,
            "layerwise_effective_rank": -103.61890411376953,
            "layerwise_effective_rank_mergeability_score": 73.63704681396484,
            "task_vector_cosine_similarity": -99.98285675048828,
            "task_vector_l2_distance": 59.354190826416016,
            "task_vector_dot_product": 38.45291519165039,
            "weight_space_angle": -21.98729705810547,
            "task_vector_magnitude_ratio": -1.654091238975525,
            "singular_value_overlap": -5.520482540130615,
            "subspace_overlap": 65.44847106933594,
            "right_subspace_overlap": 37.91646194458008,
            "encoder_gradient_cosine_similarity": 128.93812561035156,
            "encoder_gradient_l2_distance": -75.85507202148438,
            "encoder_gradient_dot_product": 5.51995325088501,
            "input_gradient_cosine_similarity": -48.43157958984375,
            "input_gradient_l2_distance": -12.788911819458008,
            "input_gradient_dot_product": -27.533349990844727
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6128980761413436,
          "val_r": 0.6877121504645918,
          "n_iterations": 754,
          "coefficients": {
            "right_subspace_overlap_top_k": -20.3190860748291,
            "right_subspace_overlap_bottom_k": -7.992713451385498,
            "interaction_matrix_overlap_top_k": 103.00154113769531,
            "interaction_matrix_overlap_bottom_k": -33.0210075378418,
            "effective_rank": 31.011348724365234,
            "effective_rank_mergeability_score": -8.183887481689453,
            "stable_rank": -41.441986083984375,
            "spectral_gap": 5.478028297424316,
            "singular_value_ratio": 82.65080261230469,
            "layerwise_effective_rank": -37.451271057128906,
            "layerwise_effective_rank_mergeability_score": -7.344688892364502,
            "task_vector_cosine_similarity": 41.153053283691406,
            "task_vector_l2_distance": -24.621559143066406,
            "task_vector_dot_product": 21.979019165039062,
            "weight_space_angle": -8.679244041442871,
            "task_vector_magnitude_ratio": -59.85881042480469,
            "singular_value_overlap": 1.140635371208191,
            "subspace_overlap": 1.0689197778701782,
            "right_subspace_overlap": -11.37098217010498,
            "encoder_gradient_cosine_similarity": 36.01760482788086,
            "encoder_gradient_l2_distance": -50.04277420043945,
            "encoder_gradient_dot_product": 33.24822998046875,
            "input_gradient_cosine_similarity": 38.810001373291016,
            "input_gradient_l2_distance": -41.53047561645508,
            "input_gradient_dot_product": -42.70278549194336
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4809083656875949,
          "val_r": 0.5221004526218799,
          "n_iterations": 858,
          "coefficients": {
            "right_subspace_overlap_top_k": 194.17291259765625,
            "right_subspace_overlap_bottom_k": -85.35838317871094,
            "interaction_matrix_overlap_top_k": -13.590764999389648,
            "interaction_matrix_overlap_bottom_k": 60.53139877319336,
            "effective_rank": -15.32730484008789,
            "effective_rank_mergeability_score": -66.46944427490234,
            "stable_rank": -88.16410827636719,
            "spectral_gap": -74.32254028320312,
            "singular_value_ratio": 16.395668029785156,
            "layerwise_effective_rank": 13.576980590820312,
            "layerwise_effective_rank_mergeability_score": 149.2571563720703,
            "task_vector_cosine_similarity": 243.54554748535156,
            "task_vector_l2_distance": -52.72982406616211,
            "task_vector_dot_product": 18.177898406982422,
            "weight_space_angle": -93.9410171508789,
            "task_vector_magnitude_ratio": 44.56228256225586,
            "singular_value_overlap": 45.95026397705078,
            "subspace_overlap": -83.76570129394531,
            "right_subspace_overlap": -157.42039489746094,
            "encoder_gradient_cosine_similarity": 59.57744216918945,
            "encoder_gradient_l2_distance": 14.34050178527832,
            "encoder_gradient_dot_product": 123.80430603027344,
            "input_gradient_cosine_similarity": -0.10205025970935822,
            "input_gradient_l2_distance": -128.66871643066406,
            "input_gradient_dot_product": -123.03402709960938
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.7523990435706305,
          "val_r": 0.7648244425182564,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 11.24205493927002,
            "right_subspace_overlap_bottom_k": -8.87767505645752,
            "interaction_matrix_overlap_top_k": 14.644187927246094,
            "interaction_matrix_overlap_bottom_k": 0.9644711017608643,
            "effective_rank": -3.5536251068115234,
            "effective_rank_mergeability_score": 9.664801597595215,
            "stable_rank": 18.497974395751953,
            "spectral_gap": 6.681545257568359,
            "singular_value_ratio": 11.458066940307617,
            "layerwise_effective_rank": -6.762487411499023,
            "layerwise_effective_rank_mergeability_score": -1.9683787822723389,
            "task_vector_cosine_similarity": -9.587102890014648,
            "task_vector_l2_distance": -10.13046932220459,
            "task_vector_dot_product": 12.66232967376709,
            "weight_space_angle": 0.3732554614543915,
            "task_vector_magnitude_ratio": -10.247685432434082,
            "singular_value_overlap": 2.2822329998016357,
            "subspace_overlap": -19.43990135192871,
            "right_subspace_overlap": 3.1440911293029785,
            "encoder_gradient_cosine_similarity": 2.092855453491211,
            "encoder_gradient_l2_distance": -11.071854591369629,
            "encoder_gradient_dot_product": 5.231098175048828,
            "input_gradient_cosine_similarity": 1.3134642839431763,
            "input_gradient_l2_distance": -11.608409881591797,
            "input_gradient_dot_product": -6.005901336669922
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5322329389677694,
          "val_r": 0.47704444768233634,
          "n_iterations": 489,
          "coefficients": {
            "right_subspace_overlap_top_k": -40.916839599609375,
            "right_subspace_overlap_bottom_k": -43.80784606933594,
            "interaction_matrix_overlap_top_k": 132.64141845703125,
            "interaction_matrix_overlap_bottom_k": -30.936235427856445,
            "effective_rank": 15.859237670898438,
            "effective_rank_mergeability_score": -47.339195251464844,
            "stable_rank": -57.85771942138672,
            "spectral_gap": -50.49928665161133,
            "singular_value_ratio": -21.69800567626953,
            "layerwise_effective_rank": -74.0440673828125,
            "layerwise_effective_rank_mergeability_score": 4.171014785766602,
            "task_vector_cosine_similarity": 26.61461067199707,
            "task_vector_l2_distance": -39.42531967163086,
            "task_vector_dot_product": 18.969587326049805,
            "weight_space_angle": -30.335405349731445,
            "task_vector_magnitude_ratio": 25.252365112304688,
            "singular_value_overlap": 15.85074520111084,
            "subspace_overlap": 64.42965698242188,
            "right_subspace_overlap": 61.1020622253418,
            "encoder_gradient_cosine_similarity": 93.99760437011719,
            "encoder_gradient_l2_distance": -26.77532958984375,
            "encoder_gradient_dot_product": 94.71672821044922,
            "input_gradient_cosine_similarity": 22.287900924682617,
            "input_gradient_l2_distance": -47.12602615356445,
            "input_gradient_dot_product": -64.13469696044922
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7494386847265531,
          "val_r": 0.4877860126036708,
          "n_iterations": 961,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.1700059473514557,
            "right_subspace_overlap_bottom_k": -0.8499748110771179,
            "interaction_matrix_overlap_top_k": -0.26428574323654175,
            "interaction_matrix_overlap_bottom_k": 0.8789678812026978,
            "effective_rank": 0.2148408740758896,
            "effective_rank_mergeability_score": -0.28579601645469666,
            "stable_rank": -0.6074293255805969,
            "spectral_gap": 0.1639944463968277,
            "singular_value_ratio": 0.5880624651908875,
            "layerwise_effective_rank": 0.5493453741073608,
            "layerwise_effective_rank_mergeability_score": 0.5326855778694153,
            "task_vector_cosine_similarity": 0.2570246756076813,
            "task_vector_l2_distance": -0.0690900981426239,
            "task_vector_dot_product": 0.09940598905086517,
            "weight_space_angle": 0.21297915279865265,
            "task_vector_magnitude_ratio": -0.336761474609375,
            "singular_value_overlap": -0.021205950528383255,
            "subspace_overlap": -0.11029504984617233,
            "right_subspace_overlap": 0.14213325083255768,
            "encoder_gradient_cosine_similarity": 0.017892614006996155,
            "encoder_gradient_l2_distance": -0.12681050598621368,
            "encoder_gradient_dot_product": 0.045677512884140015,
            "input_gradient_cosine_similarity": 0.0061901467852294445,
            "input_gradient_l2_distance": -0.15176402032375336,
            "input_gradient_dot_product": -0.05604821816086769
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6383136787414607,
          "val_r": 0.1403309935427412,
          "n_iterations": 690,
          "coefficients": {
            "right_subspace_overlap_top_k": 29.902870178222656,
            "right_subspace_overlap_bottom_k": 19.41661262512207,
            "interaction_matrix_overlap_top_k": 83.57173919677734,
            "interaction_matrix_overlap_bottom_k": -33.63555145263672,
            "effective_rank": -31.877775192260742,
            "effective_rank_mergeability_score": -77.27506256103516,
            "stable_rank": -59.65348434448242,
            "spectral_gap": 9.711835861206055,
            "singular_value_ratio": 29.917593002319336,
            "layerwise_effective_rank": 40.555171966552734,
            "layerwise_effective_rank_mergeability_score": 92.78167724609375,
            "task_vector_cosine_similarity": 42.78835678100586,
            "task_vector_l2_distance": -59.73001480102539,
            "task_vector_dot_product": 9.277902603149414,
            "weight_space_angle": 15.56783676147461,
            "task_vector_magnitude_ratio": 24.410852432250977,
            "singular_value_overlap": -43.37433624267578,
            "subspace_overlap": 28.526386260986328,
            "right_subspace_overlap": 8.433370590209961,
            "encoder_gradient_cosine_similarity": 70.0314712524414,
            "encoder_gradient_l2_distance": -125.55601501464844,
            "encoder_gradient_dot_product": 7.3838276863098145,
            "input_gradient_cosine_similarity": -18.20299530029297,
            "input_gradient_l2_distance": -48.299495697021484,
            "input_gradient_dot_product": -13.674935340881348
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6183491544259063,
          "val_r": 0.5173764726094082,
          "n_iterations": 616,
          "coefficients": {
            "right_subspace_overlap_top_k": -16.66564178466797,
            "right_subspace_overlap_bottom_k": 16.813312530517578,
            "interaction_matrix_overlap_top_k": 15.425193786621094,
            "interaction_matrix_overlap_bottom_k": -0.6418673396110535,
            "effective_rank": 27.20210838317871,
            "effective_rank_mergeability_score": -14.536968231201172,
            "stable_rank": 9.939421653747559,
            "spectral_gap": -19.14881706237793,
            "singular_value_ratio": -33.53507614135742,
            "layerwise_effective_rank": -18.383085250854492,
            "layerwise_effective_rank_mergeability_score": 51.29327392578125,
            "task_vector_cosine_similarity": 35.048030853271484,
            "task_vector_l2_distance": -48.63999938964844,
            "task_vector_dot_product": 57.016441345214844,
            "weight_space_angle": 15.380653381347656,
            "task_vector_magnitude_ratio": -0.17484396696090698,
            "singular_value_overlap": -39.81974411010742,
            "subspace_overlap": 42.38469314575195,
            "right_subspace_overlap": -29.200830459594727,
            "encoder_gradient_cosine_similarity": 49.011695861816406,
            "encoder_gradient_l2_distance": 20.13153076171875,
            "encoder_gradient_dot_product": -4.508090972900391,
            "input_gradient_cosine_similarity": 35.12202072143555,
            "input_gradient_l2_distance": -147.3697052001953,
            "input_gradient_dot_product": -1.1461009979248047
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "arithmetic": {
      "aggregate_metrics": {
        "train_r": 0.23359234658597364,
        "train_p": 3.498877517451537e-41,
        "val_r": 0.11898863598701342,
        "val_p": 0.024353795486833807
      },
      "per_fold_stats": {
        "train_r_mean": 0.5270797362701849,
        "train_r_std": 0.07544790262355155,
        "val_r_mean": 0.4191882029622838,
        "val_r_std": 0.21070118641558142
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 28.822216033935547,
        "right_subspace_overlap_bottom_k": 4.52155065536499,
        "interaction_matrix_overlap_top_k": 19.766691207885742,
        "interaction_matrix_overlap_bottom_k": 11.455246925354004,
        "effective_rank": 0.11509702354669571,
        "effective_rank_mergeability_score": 5.937655448913574,
        "stable_rank": 0.6198938488960266,
        "spectral_gap": 11.27633285522461,
        "singular_value_ratio": 3.2245476245880127,
        "layerwise_effective_rank": 0.3268283009529114,
        "layerwise_effective_rank_mergeability_score": 8.269485473632812,
        "task_vector_cosine_similarity": 4.413418769836426,
        "task_vector_l2_distance": -27.284435272216797,
        "task_vector_dot_product": 9.811861991882324,
        "weight_space_angle": -8.904512405395508,
        "task_vector_magnitude_ratio": -9.00728988647461,
        "singular_value_overlap": -35.41975402832031,
        "subspace_overlap": 11.84252643585205,
        "right_subspace_overlap": 23.61832046508789,
        "encoder_gradient_cosine_similarity": 23.68423843383789,
        "encoder_gradient_l2_distance": -43.20964431762695,
        "encoder_gradient_dot_product": 24.743144989013672,
        "input_gradient_cosine_similarity": 11.849625587463379,
        "input_gradient_l2_distance": -43.05323028564453,
        "input_gradient_dot_product": -36.421791076660156
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 40.41632080078125,
        "right_subspace_overlap_bottom_k": 27.876697540283203,
        "interaction_matrix_overlap_top_k": 17.82134246826172,
        "interaction_matrix_overlap_bottom_k": 25.123579025268555,
        "effective_rank": 24.659578323364258,
        "effective_rank_mergeability_score": 29.381874084472656,
        "stable_rank": 29.792354583740234,
        "spectral_gap": 23.354808807373047,
        "singular_value_ratio": 20.56673240661621,
        "layerwise_effective_rank": 27.96288299560547,
        "layerwise_effective_rank_mergeability_score": 41.98396682739258,
        "task_vector_cosine_similarity": 44.980567932128906,
        "task_vector_l2_distance": 23.422279357910156,
        "task_vector_dot_product": 47.153079986572266,
        "weight_space_angle": 18.934520721435547,
        "task_vector_magnitude_ratio": 32.61367416381836,
        "singular_value_overlap": 23.4042911529541,
        "subspace_overlap": 33.957275390625,
        "right_subspace_overlap": 27.917984008789062,
        "encoder_gradient_cosine_similarity": 18.076263427734375,
        "encoder_gradient_l2_distance": 29.93277931213379,
        "encoder_gradient_dot_product": 16.545162200927734,
        "input_gradient_cosine_similarity": 17.707103729248047,
        "input_gradient_l2_distance": 43.75696563720703,
        "input_gradient_dot_product": 32.650054931640625
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5794349725726791,
          "val_r": 0.6906302304305941,
          "n_iterations": 877,
          "coefficients": {
            "right_subspace_overlap_top_k": 25.231170654296875,
            "right_subspace_overlap_bottom_k": 7.753875732421875,
            "interaction_matrix_overlap_top_k": 5.822181701660156,
            "interaction_matrix_overlap_bottom_k": 23.349027633666992,
            "effective_rank": -13.996007919311523,
            "effective_rank_mergeability_score": 25.17545509338379,
            "stable_rank": 3.2561628818511963,
            "spectral_gap": 12.557059288024902,
            "singular_value_ratio": -36.53904724121094,
            "layerwise_effective_rank": 38.66532516479492,
            "layerwise_effective_rank_mergeability_score": -23.802946090698242,
            "task_vector_cosine_similarity": 19.043535232543945,
            "task_vector_l2_distance": -48.9365119934082,
            "task_vector_dot_product": -4.846920013427734,
            "weight_space_angle": 30.862825393676758,
            "task_vector_magnitude_ratio": 16.201923370361328,
            "singular_value_overlap": -55.30916213989258,
            "subspace_overlap": 17.67266273498535,
            "right_subspace_overlap": 24.0223445892334,
            "encoder_gradient_cosine_similarity": 8.785720825195312,
            "encoder_gradient_l2_distance": -24.12119483947754,
            "encoder_gradient_dot_product": 36.07170867919922,
            "input_gradient_cosine_similarity": 0.5084198117256165,
            "input_gradient_l2_distance": -44.372032165527344,
            "input_gradient_dot_product": -42.05726623535156
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5434490982854907,
          "val_r": 0.553033231946783,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.12552528083324432,
            "right_subspace_overlap_bottom_k": -5.104091167449951,
            "interaction_matrix_overlap_top_k": 17.492555618286133,
            "interaction_matrix_overlap_bottom_k": 15.97929859161377,
            "effective_rank": 5.954941272735596,
            "effective_rank_mergeability_score": 2.0510504245758057,
            "stable_rank": -2.3330748081207275,
            "spectral_gap": 7.639285564422607,
            "singular_value_ratio": 2.866452932357788,
            "layerwise_effective_rank": 8.14999008178711,
            "layerwise_effective_rank_mergeability_score": 4.828269958496094,
            "task_vector_cosine_similarity": -0.5405360460281372,
            "task_vector_l2_distance": -27.38144302368164,
            "task_vector_dot_product": 8.05325984954834,
            "weight_space_angle": 9.176724433898926,
            "task_vector_magnitude_ratio": -11.924543380737305,
            "singular_value_overlap": -25.94948387145996,
            "subspace_overlap": 11.978182792663574,
            "right_subspace_overlap": 20.566850662231445,
            "encoder_gradient_cosine_similarity": 8.984541893005371,
            "encoder_gradient_l2_distance": -29.931184768676758,
            "encoder_gradient_dot_product": 18.89719581604004,
            "input_gradient_cosine_similarity": 7.966216087341309,
            "input_gradient_l2_distance": -20.126293182373047,
            "input_gradient_dot_product": -26.421207427978516
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5006553972701652,
          "val_r": 0.40764907887283097,
          "n_iterations": 560,
          "coefficients": {
            "right_subspace_overlap_top_k": 10.31873893737793,
            "right_subspace_overlap_bottom_k": 4.812002658843994,
            "interaction_matrix_overlap_top_k": 11.620749473571777,
            "interaction_matrix_overlap_bottom_k": 20.791460037231445,
            "effective_rank": 2.6991777420043945,
            "effective_rank_mergeability_score": 5.504918575286865,
            "stable_rank": -27.4345703125,
            "spectral_gap": -30.288726806640625,
            "singular_value_ratio": 17.934066772460938,
            "layerwise_effective_rank": 21.716079711914062,
            "layerwise_effective_rank_mergeability_score": 39.20319366455078,
            "task_vector_cosine_similarity": 35.139137268066406,
            "task_vector_l2_distance": -19.099811553955078,
            "task_vector_dot_product": -9.778711318969727,
            "weight_space_angle": -20.5643367767334,
            "task_vector_magnitude_ratio": -46.80939865112305,
            "singular_value_overlap": -74.14717864990234,
            "subspace_overlap": 39.69877243041992,
            "right_subspace_overlap": 82.50672912597656,
            "encoder_gradient_cosine_similarity": 44.127777099609375,
            "encoder_gradient_l2_distance": -29.39409637451172,
            "encoder_gradient_dot_product": 33.43394088745117,
            "input_gradient_cosine_similarity": 26.029855728149414,
            "input_gradient_l2_distance": -81.52207946777344,
            "input_gradient_dot_product": -55.50041198730469
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.562363179129151,
          "val_r": 0.34372998636070073,
          "n_iterations": 672,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.627059936523438,
            "right_subspace_overlap_bottom_k": -35.52219009399414,
            "interaction_matrix_overlap_top_k": 8.53035831451416,
            "interaction_matrix_overlap_bottom_k": 59.382083892822266,
            "effective_rank": 25.416934967041016,
            "effective_rank_mergeability_score": 8.79483699798584,
            "stable_rank": -9.9962797164917,
            "spectral_gap": 26.30656623840332,
            "singular_value_ratio": 1.5121126174926758,
            "layerwise_effective_rank": 4.18583869934082,
            "layerwise_effective_rank_mergeability_score": 6.969919204711914,
            "task_vector_cosine_similarity": 30.633665084838867,
            "task_vector_l2_distance": -30.13035011291504,
            "task_vector_dot_product": -24.26004409790039,
            "weight_space_angle": -5.093570232391357,
            "task_vector_magnitude_ratio": 5.376677989959717,
            "singular_value_overlap": -28.130151748657227,
            "subspace_overlap": -5.475264072418213,
            "right_subspace_overlap": 27.538070678710938,
            "encoder_gradient_cosine_similarity": 13.587257385253906,
            "encoder_gradient_l2_distance": -60.46233367919922,
            "encoder_gradient_dot_product": 36.46807861328125,
            "input_gradient_cosine_similarity": 12.626341819763184,
            "input_gradient_l2_distance": -38.414466857910156,
            "input_gradient_dot_product": -38.47322463989258
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.42504437945440454,
          "val_r": 0.5981839324664783,
          "n_iterations": 851,
          "coefficients": {
            "right_subspace_overlap_top_k": 173.0087127685547,
            "right_subspace_overlap_bottom_k": 84.06490325927734,
            "interaction_matrix_overlap_top_k": 67.6689453125,
            "interaction_matrix_overlap_bottom_k": -33.59153747558594,
            "effective_rank": 77.12539672851562,
            "effective_rank_mergeability_score": -110.21184539794922,
            "stable_rank": 105.73715209960938,
            "spectral_gap": 74.83124542236328,
            "singular_value_ratio": 50.760009765625,
            "layerwise_effective_rank": -78.17135620117188,
            "layerwise_effective_rank_mergeability_score": 175.09779357910156,
            "task_vector_cosine_similarity": -145.56919860839844,
            "task_vector_l2_distance": -63.62986373901367,
            "task_vector_dot_product": 173.61900329589844,
            "weight_space_angle": -17.865007400512695,
            "task_vector_magnitude_ratio": -122.41901397705078,
            "singular_value_overlap": 1.701330304145813,
            "subspace_overlap": -113.51852416992188,
            "right_subspace_overlap": -13.586051940917969,
            "encoder_gradient_cosine_similarity": 29.393903732299805,
            "encoder_gradient_l2_distance": -137.97726440429688,
            "encoder_gradient_dot_product": 20.120121002197266,
            "input_gradient_cosine_similarity": -36.2176399230957,
            "input_gradient_l2_distance": -211.1871795654297,
            "input_gradient_dot_product": 51.81420135498047
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.53595228476217,
          "val_r": 0.6328196512848334,
          "n_iterations": 614,
          "coefficients": {
            "right_subspace_overlap_top_k": 16.688907623291016,
            "right_subspace_overlap_bottom_k": 36.649253845214844,
            "interaction_matrix_overlap_top_k": 20.868141174316406,
            "interaction_matrix_overlap_bottom_k": 2.3466362953186035,
            "effective_rank": -13.015671730041504,
            "effective_rank_mergeability_score": 24.252622604370117,
            "stable_rank": -13.956000328063965,
            "spectral_gap": 16.20841407775879,
            "singular_value_ratio": 40.006141662597656,
            "layerwise_effective_rank": 7.118646621704102,
            "layerwise_effective_rank_mergeability_score": -12.595270156860352,
            "task_vector_cosine_similarity": 22.96942901611328,
            "task_vector_l2_distance": -67.86071014404297,
            "task_vector_dot_product": 55.10540771484375,
            "weight_space_angle": -10.394895553588867,
            "task_vector_magnitude_ratio": -39.20844268798828,
            "singular_value_overlap": -57.1446418762207,
            "subspace_overlap": 0.017192581668496132,
            "right_subspace_overlap": 22.977062225341797,
            "encoder_gradient_cosine_similarity": 20.466764450073242,
            "encoder_gradient_l2_distance": -74.65922546386719,
            "encoder_gradient_dot_product": 47.83258819580078,
            "input_gradient_cosine_similarity": 43.29435729980469,
            "input_gradient_l2_distance": -27.78706169128418,
            "input_gradient_dot_product": -59.182132720947266
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.6060186479081547,
          "val_r": 0.28439156010624245,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 2.2872185707092285,
            "right_subspace_overlap_bottom_k": -6.589474201202393,
            "interaction_matrix_overlap_top_k": -1.6062812805175781,
            "interaction_matrix_overlap_bottom_k": 12.853020668029785,
            "effective_rank": -1.4016666412353516,
            "effective_rank_mergeability_score": 1.3390460014343262,
            "stable_rank": -2.75228214263916,
            "spectral_gap": 0.09275646507740021,
            "singular_value_ratio": -2.254556179046631,
            "layerwise_effective_rank": 7.697523593902588,
            "layerwise_effective_rank_mergeability_score": 2.72774076461792,
            "task_vector_cosine_similarity": 5.081521034240723,
            "task_vector_l2_distance": -5.527209281921387,
            "task_vector_dot_product": -0.2134624719619751,
            "weight_space_angle": 4.713334083557129,
            "task_vector_magnitude_ratio": 1.5785547494888306,
            "singular_value_overlap": -3.3248696327209473,
            "subspace_overlap": -0.8305551409721375,
            "right_subspace_overlap": -0.1567082703113556,
            "encoder_gradient_cosine_similarity": 0.8803425431251526,
            "encoder_gradient_l2_distance": -6.268242359161377,
            "encoder_gradient_dot_product": 1.3030306100845337,
            "input_gradient_cosine_similarity": -0.5203531384468079,
            "input_gradient_l2_distance": -5.559966564178467,
            "input_gradient_dot_product": -2.5496084690093994
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4809683761823443,
          "val_r": 0.1665176781006173,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 26.21795654296875,
            "right_subspace_overlap_bottom_k": 1.3665375709533691,
            "interaction_matrix_overlap_top_k": 0.6761277318000793,
            "interaction_matrix_overlap_bottom_k": 32.8702507019043,
            "effective_rank": 9.045370101928711,
            "effective_rank_mergeability_score": -3.999992847442627,
            "stable_rank": 6.606378078460693,
            "spectral_gap": 33.54920959472656,
            "singular_value_ratio": -10.664334297180176,
            "layerwise_effective_rank": 1.960310935974121,
            "layerwise_effective_rank_mergeability_score": 1.1856580972671509,
            "task_vector_cosine_similarity": 5.343392372131348,
            "task_vector_l2_distance": -30.835487365722656,
            "task_vector_dot_product": -22.655765533447266,
            "weight_space_angle": -15.638031959533691,
            "task_vector_magnitude_ratio": -4.919414520263672,
            "singular_value_overlap": -43.13711166381836,
            "subspace_overlap": 22.934179306030273,
            "right_subspace_overlap": 38.19602584838867,
            "encoder_gradient_cosine_similarity": 17.61578941345215,
            "encoder_gradient_l2_distance": -42.76189041137695,
            "encoder_gradient_dot_product": 21.96087646484375,
            "input_gradient_cosine_similarity": 12.388995170593262,
            "input_gradient_l2_distance": -50.41630172729492,
            "input_gradient_dot_product": -5.890328884124756
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.4230013605749151,
          "val_r": -0.237415405203857,
          "n_iterations": 681,
          "coefficients": {
            "right_subspace_overlap_top_k": 85.5077896118164,
            "right_subspace_overlap_bottom_k": 1.4866149425506592,
            "interaction_matrix_overlap_top_k": 13.741585731506348,
            "interaction_matrix_overlap_bottom_k": 65.14694213867188,
            "effective_rank": -38.2010612487793,
            "effective_rank_mergeability_score": 41.12621307373047,
            "stable_rank": -51.29773712158203,
            "spectral_gap": -38.229949951171875,
            "singular_value_ratio": 24.51155662536621,
            "layerwise_effective_rank": -72.26951599121094,
            "layerwise_effective_rank_mergeability_score": 17.70159912109375,
            "task_vector_cosine_similarity": 83.83560943603516,
            "task_vector_l2_distance": -8.497260093688965,
            "task_vector_dot_product": -28.04459571838379,
            "weight_space_angle": -46.56793975830078,
            "task_vector_magnitude_ratio": 32.643394470214844,
            "singular_value_overlap": -45.3306884765625,
            "subspace_overlap": 53.49593734741211,
            "right_subspace_overlap": 5.193942546844482,
            "encoder_gradient_cosine_similarity": 69.20577239990234,
            "encoder_gradient_l2_distance": -64.40409851074219,
            "encoder_gradient_dot_product": 7.2777509689331055,
            "input_gradient_cosine_similarity": 36.564208984375,
            "input_gradient_l2_distance": -62.59157943725586,
            "input_gradient_dot_product": -81.00684356689453
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5230467492873645,
          "val_r": 0.3561880341361159,
          "n_iterations": 644,
          "coefficients": {
            "right_subspace_overlap_top_k": 29.599769592285156,
            "right_subspace_overlap_bottom_k": -10.454663276672363,
            "interaction_matrix_overlap_top_k": 21.249134063720703,
            "interaction_matrix_overlap_bottom_k": 21.133718490600586,
            "effective_rank": 7.405068397521973,
            "effective_rank_mergeability_score": 10.277453422546387,
            "stable_rank": -4.312119007110596,
            "spectral_gap": 9.745377540588379,
            "singular_value_ratio": 2.652841329574585,
            "layerwise_effective_rank": -4.102776050567627,
            "layerwise_effective_rank_mergeability_score": 0.6950420141220093,
            "task_vector_cosine_similarity": 23.0035400390625,
            "task_vector_l2_distance": -56.64482498168945,
            "task_vector_dot_product": 24.670833587646484,
            "weight_space_angle": -10.778775215148926,
            "task_vector_magnitude_ratio": -10.302460670471191,
            "singular_value_overlap": -53.113243103027344,
            "subspace_overlap": 11.909585952758789,
            "right_subspace_overlap": 41.11540603637695,
            "encoder_gradient_cosine_similarity": 32.9273681640625,
            "encoder_gradient_l2_distance": -46.49068069458008,
            "encoder_gradient_dot_product": 54.25190353393555,
            "input_gradient_cosine_similarity": 11.219986915588379,
            "input_gradient_l2_distance": -54.72598648071289,
            "input_gradient_dot_product": -49.933841705322266
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5523263306471146,
          "val_r": 0.36245335038017407,
          "n_iterations": 842,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.8442604541778564,
            "right_subspace_overlap_bottom_k": 9.745476722717285,
            "interaction_matrix_overlap_top_k": 9.486305236816406,
            "interaction_matrix_overlap_bottom_k": -0.14455777406692505,
            "effective_rank": 2.3393611907958984,
            "effective_rank_mergeability_score": 6.304585933685303,
            "stable_rank": -0.3367931544780731,
            "spectral_gap": 4.522006988525391,
            "singular_value_ratio": -3.0293612480163574,
            "layerwise_effective_rank": 4.3857526779174805,
            "layerwise_effective_rank_mergeability_score": 0.916335940361023,
            "task_vector_cosine_similarity": -2.315532684326172,
            "task_vector_l2_distance": -12.271551132202148,
            "task_vector_dot_product": 3.150470495223999,
            "weight_space_angle": 0.9356421232223511,
            "task_vector_magnitude_ratio": 4.193097114562988,
            "singular_value_overlap": -7.550382137298584,
            "subspace_overlap": -6.91627311706543,
            "right_subspace_overlap": -1.96429443359375,
            "encoder_gradient_cosine_similarity": 1.5201343297958374,
            "encoder_gradient_l2_distance": -9.352548599243164,
            "encoder_gradient_dot_product": 2.2378687858581543,
            "input_gradient_cosine_similarity": 3.7689249515533447,
            "input_gradient_l2_distance": -9.075196266174316,
            "input_gradient_dot_product": -3.3951518535614014
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.559282004662562,
          "val_r": 0.5437663457773889,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 13.933403968811035,
            "right_subspace_overlap_bottom_k": -6.460270404815674,
            "interaction_matrix_overlap_top_k": 2.883068561553955,
            "interaction_matrix_overlap_bottom_k": 15.538896560668945,
            "effective_rank": -5.336411476135254,
            "effective_rank_mergeability_score": 20.490991592407227,
            "stable_rank": -0.4658891558647156,
            "spectral_gap": 6.183124542236328,
            "singular_value_ratio": -1.2136716842651367,
            "layerwise_effective_rank": 15.708108901977539,
            "layerwise_effective_rank_mergeability_score": -17.651119232177734,
            "task_vector_cosine_similarity": -0.7896155714988708,
            "task_vector_l2_distance": -19.178577423095703,
            "task_vector_dot_product": 8.42264175415039,
            "weight_space_angle": 17.098196029663086,
            "task_vector_magnitude_ratio": -3.9417266845703125,
            "singular_value_overlap": -19.47324562072754,
            "subspace_overlap": 10.731890678405762,
            "right_subspace_overlap": 7.708592414855957,
            "encoder_gradient_cosine_similarity": 8.322310447692871,
            "encoder_gradient_l2_distance": -22.459653854370117,
            "encoder_gradient_dot_product": 8.303557395935059,
            "input_gradient_cosine_similarity": 6.105866432189941,
            "input_gradient_l2_distance": -16.20345115661621,
            "input_gradient_dot_product": -27.258424758911133
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.4682139909664061,
          "val_r": 0.29370294663379054,
          "n_iterations": 735,
          "coefficients": {
            "right_subspace_overlap_top_k": 1.5955771207809448,
            "right_subspace_overlap_bottom_k": 9.733588218688965,
            "interaction_matrix_overlap_top_k": 31.763731002807617,
            "interaction_matrix_overlap_bottom_k": 7.494326114654541,
            "effective_rank": 2.0912094116210938,
            "effective_rank_mergeability_score": -5.602400779724121,
            "stable_rank": 19.60036849975586,
            "spectral_gap": 9.14667797088623,
            "singular_value_ratio": -24.106523513793945,
            "layerwise_effective_rank": -2.2951579093933105,
            "layerwise_effective_rank_mergeability_score": 10.927634239196777,
            "task_vector_cosine_similarity": 20.076671600341797,
            "task_vector_l2_distance": -32.01681900024414,
            "task_vector_dot_product": 49.48751449584961,
            "weight_space_angle": -41.91981887817383,
            "task_vector_magnitude_ratio": 2.7814252376556396,
            "singular_value_overlap": -52.19630432128906,
            "subspace_overlap": 19.380382537841797,
            "right_subspace_overlap": -5.665317535400391,
            "encoder_gradient_cosine_similarity": 33.0831413269043,
            "encoder_gradient_l2_distance": -32.70826721191406,
            "encoder_gradient_dot_product": 49.238162994384766,
            "input_gradient_cosine_similarity": 15.434008598327637,
            "input_gradient_l2_distance": -29.907487869262695,
            "input_gradient_dot_product": -54.418521881103516
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.43177015369252514,
          "val_r": 0.6259147767594183,
          "n_iterations": 593,
          "coefficients": {
            "right_subspace_overlap_top_k": 18.511707305908203,
            "right_subspace_overlap_bottom_k": 25.75614356994629,
            "interaction_matrix_overlap_top_k": 39.07170104980469,
            "interaction_matrix_overlap_bottom_k": -39.59376907348633,
            "effective_rank": -50.14693069458008,
            "effective_rank_mergeability_score": 21.66080093383789,
            "stable_rank": -6.098048686981201,
            "spectral_gap": 33.44068145751953,
            "singular_value_ratio": -11.31181812286377,
            "layerwise_effective_rank": 33.25820541381836,
            "layerwise_effective_rank_mergeability_score": -19.341053009033203,
            "task_vector_cosine_similarity": -71.87890625,
            "task_vector_l2_distance": -10.440939903259277,
            "task_vector_dot_product": 0.9222930073738098,
            "weight_space_angle": -1.521875023841858,
            "task_vector_magnitude_ratio": 40.69817352294922,
            "singular_value_overlap": -52.177066802978516,
            "subspace_overlap": 44.80474853515625,
            "right_subspace_overlap": 101.29399108886719,
            "encoder_gradient_cosine_similarity": 47.077518463134766,
            "encoder_gradient_l2_distance": -70.74433898925781,
            "encoder_gradient_dot_product": 11.206059455871582,
            "input_gradient_cosine_similarity": 2.6174027919769287,
            "input_gradient_l2_distance": -16.060901641845703,
            "input_gradient_dot_product": -70.00631713867188
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4267493105953266,
          "val_r": 0.5761630681990627,
          "n_iterations": 934,
          "coefficients": {
            "right_subspace_overlap_top_k": 75.25934600830078,
            "right_subspace_overlap_bottom_k": -46.73640060424805,
            "interaction_matrix_overlap_top_k": 34.34864044189453,
            "interaction_matrix_overlap_bottom_k": 15.61064338684082,
            "effective_rank": -25.873811721801758,
            "effective_rank_mergeability_score": 22.9234676361084,
            "stable_rank": -15.610968589782715,
            "spectral_gap": 16.771728515625,
            "singular_value_ratio": -3.8964145183563232,
            "layerwise_effective_rank": 3.37788462638855,
            "layerwise_effective_rank_mergeability_score": -36.409202575683594,
            "task_vector_cosine_similarity": 25.98237419128418,
            "task_vector_l2_distance": -46.71500778198242,
            "task_vector_dot_product": 26.040889739990234,
            "weight_space_angle": -7.79760217666626,
            "task_vector_magnitude_ratio": 7.204225540161133,
            "singular_value_overlap": -70.55900573730469,
            "subspace_overlap": 34.70768737792969,
            "right_subspace_overlap": 42.275535583496094,
            "encoder_gradient_cosine_similarity": 51.94562911987305,
            "encoder_gradient_l2_distance": -52.21907424926758,
            "encoder_gradient_dot_product": 38.22370147705078,
            "input_gradient_cosine_similarity": 10.884904861450195,
            "input_gradient_l2_distance": -18.930143356323242,
            "input_gradient_dot_product": -79.8107681274414
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.5234482628950385,
          "val_r": 0.324962330281244,
          "n_iterations": 578,
          "coefficients": {
            "right_subspace_overlap_top_k": 23.093372344970703,
            "right_subspace_overlap_bottom_k": 8.336146354675293,
            "interaction_matrix_overlap_top_k": 39.1578483581543,
            "interaction_matrix_overlap_bottom_k": -11.3031005859375,
            "effective_rank": 8.395235061645508,
            "effective_rank_mergeability_score": 22.694334030151367,
            "stable_rank": -24.98686408996582,
            "spectral_gap": 16.827533721923828,
            "singular_value_ratio": 18.705846786499023,
            "layerwise_effective_rank": 16.69921112060547,
            "layerwise_effective_rank_mergeability_score": -14.714447975158691,
            "task_vector_cosine_similarity": 36.72145462036133,
            "task_vector_l2_distance": -48.15574264526367,
            "task_vector_dot_product": 10.358277320861816,
            "weight_space_angle": -18.935791015625,
            "task_vector_magnitude_ratio": -16.920522689819336,
            "singular_value_overlap": -35.771209716796875,
            "subspace_overlap": 16.20085906982422,
            "right_subspace_overlap": 38.11738967895508,
            "encoder_gradient_cosine_similarity": 21.38450813293457,
            "encoder_gradient_l2_distance": -47.4753303527832,
            "encoder_gradient_dot_product": 39.91044235229492,
            "input_gradient_cosine_similarity": 25.9606876373291,
            "input_gradient_l2_distance": -43.985286712646484,
            "input_gradient_dot_product": -79.31743621826172
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6339239253484723,
          "val_r": 0.6271747105043887,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.7030816674232483,
            "right_subspace_overlap_bottom_k": -1.3194390535354614,
            "interaction_matrix_overlap_top_k": -1.3045084476470947,
            "interaction_matrix_overlap_bottom_k": 1.6603361368179321,
            "effective_rank": 0.8246133327484131,
            "effective_rank_mergeability_score": 0.8438488841056824,
            "stable_rank": -0.43540260195732117,
            "spectral_gap": 0.7436414361000061,
            "singular_value_ratio": 1.3213874101638794,
            "layerwise_effective_rank": 0.05950816348195076,
            "layerwise_effective_rank_mergeability_score": -0.30908089876174927,
            "task_vector_cosine_similarity": -0.10105843096971512,
            "task_vector_l2_distance": -0.3238810896873474,
            "task_vector_dot_product": 0.26616933941841125,
            "weight_space_angle": -0.4470946490764618,
            "task_vector_magnitude_ratio": -0.5447966456413269,
            "singular_value_overlap": -0.2389024794101715,
            "subspace_overlap": 0.02082696370780468,
            "right_subspace_overlap": 0.1490701138973236,
            "encoder_gradient_cosine_similarity": 0.02915845811367035,
            "encoder_gradient_l2_distance": -0.24531660974025726,
            "encoder_gradient_dot_product": 0.08452872186899185,
            "input_gradient_cosine_similarity": 0.03306785598397255,
            "input_gradient_l2_distance": -0.34659719467163086,
            "input_gradient_dot_product": -0.1244048923254013
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.46415642713935423,
          "val_r": 0.27998057552809863,
          "n_iterations": 452,
          "coefficients": {
            "right_subspace_overlap_top_k": 50.51213073730469,
            "right_subspace_overlap_bottom_k": 47.291866302490234,
            "interaction_matrix_overlap_top_k": 8.86070442199707,
            "interaction_matrix_overlap_bottom_k": 0.410295307636261,
            "effective_rank": -9.540502548217773,
            "effective_rank_mergeability_score": -6.258843421936035,
            "stable_rank": 38.57206726074219,
            "spectral_gap": 9.550190925598145,
            "singular_value_ratio": -23.652217864990234,
            "layerwise_effective_rank": -9.4213285446167,
            "layerwise_effective_rank_mergeability_score": 16.242231369018555,
            "task_vector_cosine_similarity": 27.029829025268555,
            "task_vector_l2_distance": 19.34555435180664,
            "task_vector_dot_product": -83.88105773925781,
            "weight_space_angle": -39.743919372558594,
            "task_vector_magnitude_ratio": -20.537233352661133,
            "singular_value_overlap": -44.7902946472168,
            "subspace_overlap": 54.19511032104492,
            "right_subspace_overlap": 22.23213768005371,
            "encoder_gradient_cosine_similarity": 28.091524124145508,
            "encoder_gradient_l2_distance": -55.82686233520508,
            "encoder_gradient_dot_product": 29.862712860107422,
            "input_gradient_cosine_similarity": 45.27146530151367,
            "input_gradient_l2_distance": -59.692771911621094,
            "input_gradient_dot_product": -43.12609100341797
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7174574083805669,
          "val_r": 0.5653813813897329,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 5.390468597412109,
            "right_subspace_overlap_bottom_k": -21.386859893798828,
            "interaction_matrix_overlap_top_k": 47.008155822753906,
            "interaction_matrix_overlap_bottom_k": -12.72534465789795,
            "effective_rank": 10.950394630432129,
            "effective_rank_mergeability_score": 24.135658264160156,
            "stable_rank": -4.904451370239258,
            "spectral_gap": -14.820734977722168,
            "singular_value_ratio": -0.3407781720161438,
            "layerwise_effective_rank": -7.766732692718506,
            "layerwise_effective_rank_mergeability_score": -10.444629669189453,
            "task_vector_cosine_similarity": 0.2673704922199249,
            "task_vector_l2_distance": 6.8067522048950195,
            "task_vector_dot_product": -3.215407371520996,
            "weight_space_angle": 8.997876167297363,
            "task_vector_magnitude_ratio": -5.43796443939209,
            "singular_value_overlap": 1.3659943342208862,
            "subspace_overlap": 5.707612037658691,
            "right_subspace_overlap": 8.730350494384766,
            "encoder_gradient_cosine_similarity": 15.668286323547363,
            "encoder_gradient_l2_distance": -21.144027709960938,
            "encoder_gradient_dot_product": 10.666647911071777,
            "input_gradient_cosine_similarity": -2.1893627643585205,
            "input_gradient_l2_distance": -25.151046752929688,
            "input_gradient_dot_product": -15.169817924499512
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5843324656494935,
          "val_r": 0.38853659529103873,
          "n_iterations": 848,
          "coefficients": {
            "right_subspace_overlap_top_k": 4.988145351409912,
            "right_subspace_overlap_bottom_k": -12.991991996765137,
            "interaction_matrix_overlap_top_k": 17.994678497314453,
            "interaction_matrix_overlap_bottom_k": 31.89631462097168,
            "effective_rank": 7.5663018226623535,
            "effective_rank_mergeability_score": 7.250909805297852,
            "stable_rank": 3.5462357997894287,
            "spectral_gap": 30.750585556030273,
            "singular_value_ratio": 21.229257583618164,
            "layerwise_effective_rank": 17.581045150756836,
            "layerwise_effective_rank_mergeability_score": 24.16205406188965,
            "task_vector_cosine_similarity": -25.664306640625,
            "task_vector_l2_distance": -44.19503402709961,
            "task_vector_dot_product": 13.0364351272583,
            "weight_space_angle": -12.606192588806152,
            "task_vector_magnitude_ratio": -7.857732772827148,
            "singular_value_overlap": -43.11944580078125,
            "subspace_overlap": 20.135494232177734,
            "right_subspace_overlap": 11.115256309509277,
            "encoder_gradient_cosine_similarity": 20.587339401245117,
            "encoder_gradient_l2_distance": -35.54729461669922,
            "encoder_gradient_dot_product": 27.51205062866211,
            "input_gradient_cosine_similarity": 15.245153427124023,
            "input_gradient_l2_distance": -45.00881576538086,
            "input_gradient_dot_product": -46.608253479003906
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "tsv": {
      "aggregate_metrics": {
        "train_r": 0.09183687909939028,
        "train_p": 1.7707644466284906e-07,
        "val_r": 0.08687895988437096,
        "val_p": 0.10075950327351509
      },
      "per_fold_stats": {
        "train_r_mean": 0.6559518826312077,
        "train_r_std": 0.09486562821975214,
        "val_r_mean": 0.5549913283389103,
        "val_r_std": 0.20292178956865428
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 51.5689811706543,
        "right_subspace_overlap_bottom_k": -25.292430877685547,
        "interaction_matrix_overlap_top_k": 28.448654174804688,
        "interaction_matrix_overlap_bottom_k": 1.526309609413147,
        "effective_rank": 3.617974042892456,
        "effective_rank_mergeability_score": 14.779199600219727,
        "stable_rank": 11.42481803894043,
        "spectral_gap": 8.259401321411133,
        "singular_value_ratio": 4.448522090911865,
        "layerwise_effective_rank": -1.7128515243530273,
        "layerwise_effective_rank_mergeability_score": 0.9680374264717102,
        "task_vector_cosine_similarity": 15.453977584838867,
        "task_vector_l2_distance": -13.318827629089355,
        "task_vector_dot_product": -12.888193130493164,
        "weight_space_angle": -10.974605560302734,
        "task_vector_magnitude_ratio": -1.4384143352508545,
        "singular_value_overlap": 15.125033378601074,
        "subspace_overlap": -1.983797311782837,
        "right_subspace_overlap": -22.004032135009766,
        "encoder_gradient_cosine_similarity": 19.64982032775879,
        "encoder_gradient_l2_distance": -48.181304931640625,
        "encoder_gradient_dot_product": 23.760602951049805,
        "input_gradient_cosine_similarity": -9.984248161315918,
        "input_gradient_l2_distance": -21.130084991455078,
        "input_gradient_dot_product": -29.124820709228516
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 149.35882568359375,
        "right_subspace_overlap_bottom_k": 48.58954620361328,
        "interaction_matrix_overlap_top_k": 51.27946853637695,
        "interaction_matrix_overlap_bottom_k": 56.646053314208984,
        "effective_rank": 41.28589630126953,
        "effective_rank_mergeability_score": 65.41566467285156,
        "stable_rank": 106.93952941894531,
        "spectral_gap": 35.45848083496094,
        "singular_value_ratio": 13.960068702697754,
        "layerwise_effective_rank": 14.932609558105469,
        "layerwise_effective_rank_mergeability_score": 20.2020320892334,
        "task_vector_cosine_similarity": 27.948463439941406,
        "task_vector_l2_distance": 28.282773971557617,
        "task_vector_dot_product": 83.67048645019531,
        "weight_space_angle": 31.82280158996582,
        "task_vector_magnitude_ratio": 63.98155975341797,
        "singular_value_overlap": 41.52299880981445,
        "subspace_overlap": 22.75664710998535,
        "right_subspace_overlap": 132.89434814453125,
        "encoder_gradient_cosine_similarity": 30.638072967529297,
        "encoder_gradient_l2_distance": 87.0252456665039,
        "encoder_gradient_dot_product": 70.86094665527344,
        "input_gradient_cosine_similarity": 70.91796112060547,
        "input_gradient_l2_distance": 37.16252899169922,
        "input_gradient_dot_product": 65.93130493164062
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6713895295890558,
          "val_r": 0.6411714169399075,
          "n_iterations": 898,
          "coefficients": {
            "right_subspace_overlap_top_k": 25.987531661987305,
            "right_subspace_overlap_bottom_k": -10.768632888793945,
            "interaction_matrix_overlap_top_k": -4.137286186218262,
            "interaction_matrix_overlap_bottom_k": -15.254526138305664,
            "effective_rank": 8.828700065612793,
            "effective_rank_mergeability_score": -0.7753280401229858,
            "stable_rank": 2.7487311363220215,
            "spectral_gap": 5.471801280975342,
            "singular_value_ratio": 9.319009780883789,
            "layerwise_effective_rank": -15.011987686157227,
            "layerwise_effective_rank_mergeability_score": 0.4198601543903351,
            "task_vector_cosine_similarity": -8.01361083984375,
            "task_vector_l2_distance": -10.792259216308594,
            "task_vector_dot_product": 5.449970245361328,
            "weight_space_angle": 11.540079116821289,
            "task_vector_magnitude_ratio": -4.324131965637207,
            "singular_value_overlap": 4.004635810852051,
            "subspace_overlap": -6.34647798538208,
            "right_subspace_overlap": 27.868314743041992,
            "encoder_gradient_cosine_similarity": 8.436690330505371,
            "encoder_gradient_l2_distance": -22.036836624145508,
            "encoder_gradient_dot_product": 4.841688632965088,
            "input_gradient_cosine_similarity": 1.7643086910247803,
            "input_gradient_l2_distance": -21.894670486450195,
            "input_gradient_dot_product": 3.672814130783081
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.40840195954447384,
          "val_r": 0.3112053358877407,
          "n_iterations": 51,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.2157631367444992,
            "right_subspace_overlap_bottom_k": -0.26164913177490234,
            "interaction_matrix_overlap_top_k": 0.5257810354232788,
            "interaction_matrix_overlap_bottom_k": -0.3869801461696625,
            "effective_rank": -0.08332329988479614,
            "effective_rank_mergeability_score": 0.05449063330888748,
            "stable_rank": 0.2452387511730194,
            "spectral_gap": -0.12522803246974945,
            "singular_value_ratio": 0.4041294753551483,
            "layerwise_effective_rank": 0.18241079151630402,
            "layerwise_effective_rank_mergeability_score": -0.09107858687639236,
            "task_vector_cosine_similarity": 0.23678362369537354,
            "task_vector_l2_distance": -0.495013564825058,
            "task_vector_dot_product": -0.031042352318763733,
            "weight_space_angle": -0.2893947660923004,
            "task_vector_magnitude_ratio": -0.10632747411727905,
            "singular_value_overlap": 0.5669344067573547,
            "subspace_overlap": 0.8257344365119934,
            "right_subspace_overlap": -0.25742340087890625,
            "encoder_gradient_cosine_similarity": 0.691683828830719,
            "encoder_gradient_l2_distance": -0.6961145401000977,
            "encoder_gradient_dot_product": 0.6441774368286133,
            "input_gradient_cosine_similarity": -0.615055501461029,
            "input_gradient_l2_distance": -0.007442818954586983,
            "input_gradient_dot_product": -0.1672428995370865
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.4917220117875425,
          "val_r": 0.06885550615486268,
          "n_iterations": 640,
          "coefficients": {
            "right_subspace_overlap_top_k": 91.47201538085938,
            "right_subspace_overlap_bottom_k": -9.005743026733398,
            "interaction_matrix_overlap_top_k": 85.50789642333984,
            "interaction_matrix_overlap_bottom_k": 31.047595977783203,
            "effective_rank": -76.40718841552734,
            "effective_rank_mergeability_score": 18.86224937438965,
            "stable_rank": -135.6186981201172,
            "spectral_gap": 12.425161361694336,
            "singular_value_ratio": 49.886962890625,
            "layerwise_effective_rank": 8.770288467407227,
            "layerwise_effective_rank_mergeability_score": 11.708568572998047,
            "task_vector_cosine_similarity": 103.55833435058594,
            "task_vector_l2_distance": -120.5285415649414,
            "task_vector_dot_product": 69.55159759521484,
            "weight_space_angle": -92.958251953125,
            "task_vector_magnitude_ratio": 136.23426818847656,
            "singular_value_overlap": -17.427114486694336,
            "subspace_overlap": -7.937014102935791,
            "right_subspace_overlap": 24.93612289428711,
            "encoder_gradient_cosine_similarity": 29.28325843811035,
            "encoder_gradient_l2_distance": -224.88682556152344,
            "encoder_gradient_dot_product": 19.926570892333984,
            "input_gradient_cosine_similarity": 75.43815612792969,
            "input_gradient_l2_distance": 38.19495391845703,
            "input_gradient_dot_product": -121.0369873046875
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6839838609547755,
          "val_r": 0.49691612364717724,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 15.316924095153809,
            "right_subspace_overlap_bottom_k": -18.363773345947266,
            "interaction_matrix_overlap_top_k": 6.584619998931885,
            "interaction_matrix_overlap_bottom_k": -10.445343971252441,
            "effective_rank": -4.156853675842285,
            "effective_rank_mergeability_score": 2.8757269382476807,
            "stable_rank": 1.3290164470672607,
            "spectral_gap": 0.1076880544424057,
            "singular_value_ratio": 10.164698600769043,
            "layerwise_effective_rank": 0.5778095722198486,
            "layerwise_effective_rank_mergeability_score": 5.378847122192383,
            "task_vector_cosine_similarity": 0.3277626633644104,
            "task_vector_l2_distance": -5.2163801193237305,
            "task_vector_dot_product": 1.7293503284454346,
            "weight_space_angle": -1.0814930200576782,
            "task_vector_magnitude_ratio": -3.432966947555542,
            "singular_value_overlap": 6.633322715759277,
            "subspace_overlap": 1.333268642425537,
            "right_subspace_overlap": 15.284071922302246,
            "encoder_gradient_cosine_similarity": 12.889690399169922,
            "encoder_gradient_l2_distance": -17.015094757080078,
            "encoder_gradient_dot_product": 9.267631530761719,
            "input_gradient_cosine_similarity": -0.38462403416633606,
            "input_gradient_l2_distance": -16.35335922241211,
            "input_gradient_dot_product": -12.352011680603027
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6730258501588,
          "val_r": 0.6204394954977722,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 4.203489780426025,
            "right_subspace_overlap_bottom_k": -6.679756164550781,
            "interaction_matrix_overlap_top_k": 14.289693832397461,
            "interaction_matrix_overlap_bottom_k": -8.781682968139648,
            "effective_rank": 0.5743672847747803,
            "effective_rank_mergeability_score": 3.477797746658325,
            "stable_rank": -4.16275691986084,
            "spectral_gap": 0.24898996949195862,
            "singular_value_ratio": -2.6147100925445557,
            "layerwise_effective_rank": 2.686128616333008,
            "layerwise_effective_rank_mergeability_score": -1.4691781997680664,
            "task_vector_cosine_similarity": 3.403850555419922,
            "task_vector_l2_distance": -8.205828666687012,
            "task_vector_dot_product": 5.267849922180176,
            "weight_space_angle": 2.983766794204712,
            "task_vector_magnitude_ratio": 4.494879245758057,
            "singular_value_overlap": 3.013500213623047,
            "subspace_overlap": -0.2238200604915619,
            "right_subspace_overlap": 5.409512996673584,
            "encoder_gradient_cosine_similarity": 7.952455520629883,
            "encoder_gradient_l2_distance": -13.055950164794922,
            "encoder_gradient_dot_product": 4.547661304473877,
            "input_gradient_cosine_similarity": 4.565752983093262,
            "input_gradient_l2_distance": -12.084242820739746,
            "input_gradient_dot_product": -8.842947959899902
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.6205765310905934,
          "val_r": 0.6098770892003107,
          "n_iterations": 961,
          "coefficients": {
            "right_subspace_overlap_top_k": 29.817859649658203,
            "right_subspace_overlap_bottom_k": -76.00479888916016,
            "interaction_matrix_overlap_top_k": 73.14344787597656,
            "interaction_matrix_overlap_bottom_k": -57.798118591308594,
            "effective_rank": 11.836891174316406,
            "effective_rank_mergeability_score": 5.175981044769287,
            "stable_rank": -27.425554275512695,
            "spectral_gap": -66.69442749023438,
            "singular_value_ratio": -4.98028564453125,
            "layerwise_effective_rank": -9.00650691986084,
            "layerwise_effective_rank_mergeability_score": 15.944249153137207,
            "task_vector_cosine_similarity": 10.292780876159668,
            "task_vector_l2_distance": -20.076751708984375,
            "task_vector_dot_product": 22.796783447265625,
            "weight_space_angle": 1.9438261985778809,
            "task_vector_magnitude_ratio": -28.084514617919922,
            "singular_value_overlap": 16.032323837280273,
            "subspace_overlap": 23.110462188720703,
            "right_subspace_overlap": 61.59674072265625,
            "encoder_gradient_cosine_similarity": 47.044647216796875,
            "encoder_gradient_l2_distance": -41.06892395019531,
            "encoder_gradient_dot_product": 31.504566192626953,
            "input_gradient_cosine_similarity": 25.59151840209961,
            "input_gradient_l2_distance": -0.790868878364563,
            "input_gradient_dot_product": -42.90296936035156
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.7083184250494758,
          "val_r": 0.6630981285218713,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.248870849609375,
            "right_subspace_overlap_bottom_k": -2.2991514205932617,
            "interaction_matrix_overlap_top_k": -1.1342581510543823,
            "interaction_matrix_overlap_bottom_k": -2.3656821250915527,
            "effective_rank": 1.485943078994751,
            "effective_rank_mergeability_score": 2.7504167556762695,
            "stable_rank": -1.2075531482696533,
            "spectral_gap": 0.46212413907051086,
            "singular_value_ratio": 1.5115944147109985,
            "layerwise_effective_rank": 1.1392478942871094,
            "layerwise_effective_rank_mergeability_score": -0.6845572590827942,
            "task_vector_cosine_similarity": 2.600172281265259,
            "task_vector_l2_distance": -2.4164278507232666,
            "task_vector_dot_product": 1.3913229703903198,
            "weight_space_angle": 2.471693754196167,
            "task_vector_magnitude_ratio": -1.115517020225525,
            "singular_value_overlap": 1.543838381767273,
            "subspace_overlap": -2.3552722930908203,
            "right_subspace_overlap": 3.5238757133483887,
            "encoder_gradient_cosine_similarity": 1.7897549867630005,
            "encoder_gradient_l2_distance": -5.608683109283447,
            "encoder_gradient_dot_product": 1.6288381814956665,
            "input_gradient_cosine_similarity": -0.4398190379142761,
            "input_gradient_l2_distance": -3.0475738048553467,
            "input_gradient_dot_product": -1.8741015195846558
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7028853215326419,
          "val_r": 0.2474128870111539,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 16.554393768310547,
            "right_subspace_overlap_bottom_k": -11.639678001403809,
            "interaction_matrix_overlap_top_k": 2.8885929584503174,
            "interaction_matrix_overlap_bottom_k": -4.381120681762695,
            "effective_rank": -7.289849281311035,
            "effective_rank_mergeability_score": -8.874456405639648,
            "stable_rank": 1.7440423965454102,
            "spectral_gap": 8.170393943786621,
            "singular_value_ratio": 7.691953182220459,
            "layerwise_effective_rank": -1.143625020980835,
            "layerwise_effective_rank_mergeability_score": 5.378459453582764,
            "task_vector_cosine_similarity": -6.128944396972656,
            "task_vector_l2_distance": -6.185261249542236,
            "task_vector_dot_product": -1.6460403203964233,
            "weight_space_angle": 2.9042391777038574,
            "task_vector_magnitude_ratio": 1.29140043258667,
            "singular_value_overlap": 3.5018324851989746,
            "subspace_overlap": -4.732745170593262,
            "right_subspace_overlap": 12.120718955993652,
            "encoder_gradient_cosine_similarity": 6.808775424957275,
            "encoder_gradient_l2_distance": -13.633010864257812,
            "encoder_gradient_dot_product": 4.100926399230957,
            "input_gradient_cosine_similarity": 1.842816710472107,
            "input_gradient_l2_distance": -7.873898506164551,
            "input_gradient_dot_product": -0.4712892472743988
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.7286952915999447,
          "val_r": 0.11378227167799115,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 11.640851020812988,
            "right_subspace_overlap_bottom_k": -6.225329399108887,
            "interaction_matrix_overlap_top_k": 6.273797035217285,
            "interaction_matrix_overlap_bottom_k": -8.089875221252441,
            "effective_rank": 0.1704530566930771,
            "effective_rank_mergeability_score": 2.3843555450439453,
            "stable_rank": -4.972339630126953,
            "spectral_gap": -0.11800853163003922,
            "singular_value_ratio": 0.2893342673778534,
            "layerwise_effective_rank": 2.4228055477142334,
            "layerwise_effective_rank_mergeability_score": 2.143836498260498,
            "task_vector_cosine_similarity": 1.617051362991333,
            "task_vector_l2_distance": -3.2527880668640137,
            "task_vector_dot_product": -0.7871229648590088,
            "weight_space_angle": 3.8652262687683105,
            "task_vector_magnitude_ratio": 3.3777084350585938,
            "singular_value_overlap": 3.614614486694336,
            "subspace_overlap": -3.1981124877929688,
            "right_subspace_overlap": 5.854832649230957,
            "encoder_gradient_cosine_similarity": 5.635009288787842,
            "encoder_gradient_l2_distance": -9.903761863708496,
            "encoder_gradient_dot_product": 3.932363271713257,
            "input_gradient_cosine_similarity": 1.4484516382217407,
            "input_gradient_l2_distance": -11.312485694885254,
            "input_gradient_dot_product": -5.812064170837402
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7652517786066674,
          "val_r": 0.6212663758307135,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.1443259716033936,
            "right_subspace_overlap_bottom_k": -3.2831616401672363,
            "interaction_matrix_overlap_top_k": 2.172849416732788,
            "interaction_matrix_overlap_bottom_k": -2.9141287803649902,
            "effective_rank": 0.335595041513443,
            "effective_rank_mergeability_score": 1.4914823770523071,
            "stable_rank": 2.165891170501709,
            "spectral_gap": -0.6274007558822632,
            "singular_value_ratio": 0.7840216159820557,
            "layerwise_effective_rank": -1.248640537261963,
            "layerwise_effective_rank_mergeability_score": 1.9842818975448608,
            "task_vector_cosine_similarity": -1.514050841331482,
            "task_vector_l2_distance": -0.7337700128555298,
            "task_vector_dot_product": 0.1803540140390396,
            "weight_space_angle": 2.6315064430236816,
            "task_vector_magnitude_ratio": -0.8674633502960205,
            "singular_value_overlap": 1.5708211660385132,
            "subspace_overlap": -1.1962069272994995,
            "right_subspace_overlap": 4.973667144775391,
            "encoder_gradient_cosine_similarity": 1.8119951486587524,
            "encoder_gradient_l2_distance": -5.331720352172852,
            "encoder_gradient_dot_product": 0.5542052388191223,
            "input_gradient_cosine_similarity": 0.6404616236686707,
            "input_gradient_l2_distance": -3.9259800910949707,
            "input_gradient_dot_product": -1.7997509241104126
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6914540291212882,
          "val_r": 0.5220326020258137,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 22.066890716552734,
            "right_subspace_overlap_bottom_k": -17.84808921813965,
            "interaction_matrix_overlap_top_k": -0.2536482810974121,
            "interaction_matrix_overlap_bottom_k": -4.44429349899292,
            "effective_rank": 4.293068885803223,
            "effective_rank_mergeability_score": 0.5732207298278809,
            "stable_rank": -18.580720901489258,
            "spectral_gap": 2.2324798107147217,
            "singular_value_ratio": 13.525026321411133,
            "layerwise_effective_rank": 12.930670738220215,
            "layerwise_effective_rank_mergeability_score": 2.307906150817871,
            "task_vector_cosine_similarity": -2.9083497524261475,
            "task_vector_l2_distance": -3.297652244567871,
            "task_vector_dot_product": 0.2885938286781311,
            "weight_space_angle": -0.13104557991027832,
            "task_vector_magnitude_ratio": -6.259285926818848,
            "singular_value_overlap": 11.066344261169434,
            "subspace_overlap": -5.997982025146484,
            "right_subspace_overlap": 10.181987762451172,
            "encoder_gradient_cosine_similarity": 5.0114922523498535,
            "encoder_gradient_l2_distance": -10.736136436462402,
            "encoder_gradient_dot_product": 5.45650053024292,
            "input_gradient_cosine_similarity": -0.8989829421043396,
            "input_gradient_l2_distance": -14.42650032043457,
            "input_gradient_dot_product": -3.152975559234619
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6716802805724804,
          "val_r": 0.7322567644791279,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.125964164733887,
            "right_subspace_overlap_bottom_k": -14.381304740905762,
            "interaction_matrix_overlap_top_k": 29.169424057006836,
            "interaction_matrix_overlap_bottom_k": -14.648035049438477,
            "effective_rank": -10.59085750579834,
            "effective_rank_mergeability_score": 9.729841232299805,
            "stable_rank": 8.808917045593262,
            "spectral_gap": -8.399788856506348,
            "singular_value_ratio": -1.2188982963562012,
            "layerwise_effective_rank": 2.2115108966827393,
            "layerwise_effective_rank_mergeability_score": -6.257704257965088,
            "task_vector_cosine_similarity": 3.54317307472229,
            "task_vector_l2_distance": -3.7591516971588135,
            "task_vector_dot_product": -2.7322051525115967,
            "weight_space_angle": 5.94979190826416,
            "task_vector_magnitude_ratio": -4.2862868309021,
            "singular_value_overlap": 9.336313247680664,
            "subspace_overlap": 4.716660976409912,
            "right_subspace_overlap": 1.8311452865600586,
            "encoder_gradient_cosine_similarity": 9.482322692871094,
            "encoder_gradient_l2_distance": -8.748127937316895,
            "encoder_gradient_dot_product": 15.159830093383789,
            "input_gradient_cosine_similarity": 2.5328152179718018,
            "input_gradient_l2_distance": -23.470218658447266,
            "input_gradient_dot_product": -12.106602668762207
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.672193007730066,
          "val_r": 0.5198263269548453,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 4.659052848815918,
            "right_subspace_overlap_bottom_k": -5.9499993324279785,
            "interaction_matrix_overlap_top_k": 7.741866588592529,
            "interaction_matrix_overlap_bottom_k": -14.829258918762207,
            "effective_rank": 7.519309043884277,
            "effective_rank_mergeability_score": 3.2763209342956543,
            "stable_rank": -4.304373741149902,
            "spectral_gap": -6.095963478088379,
            "singular_value_ratio": 5.977419376373291,
            "layerwise_effective_rank": 9.211402893066406,
            "layerwise_effective_rank_mergeability_score": 7.870409965515137,
            "task_vector_cosine_similarity": 18.181852340698242,
            "task_vector_l2_distance": -4.83858060836792,
            "task_vector_dot_product": 14.558985710144043,
            "weight_space_angle": -6.675022602081299,
            "task_vector_magnitude_ratio": -12.362349510192871,
            "singular_value_overlap": 6.29454231262207,
            "subspace_overlap": -10.349059104919434,
            "right_subspace_overlap": 3.428696393966675,
            "encoder_gradient_cosine_similarity": 7.724040508270264,
            "encoder_gradient_l2_distance": -15.026634216308594,
            "encoder_gradient_dot_product": 7.856668472290039,
            "input_gradient_cosine_similarity": 1.5208473205566406,
            "input_gradient_l2_distance": -11.299993515014648,
            "input_gradient_dot_product": -13.091501235961914
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7469184745781702,
          "val_r": 0.7520826177404584,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 1.6005076169967651,
            "right_subspace_overlap_bottom_k": -2.2851033210754395,
            "interaction_matrix_overlap_top_k": -0.6523812413215637,
            "interaction_matrix_overlap_bottom_k": 1.3345853090286255,
            "effective_rank": 0.7807243466377258,
            "effective_rank_mergeability_score": 0.31188610196113586,
            "stable_rank": -0.07267917692661285,
            "spectral_gap": 0.5945030450820923,
            "singular_value_ratio": 0.8300018906593323,
            "layerwise_effective_rank": -0.06341345608234406,
            "layerwise_effective_rank_mergeability_score": 0.4374631345272064,
            "task_vector_cosine_similarity": 0.6661624312400818,
            "task_vector_l2_distance": -0.39486104249954224,
            "task_vector_dot_product": 0.31096604466438293,
            "weight_space_angle": 0.38616907596588135,
            "task_vector_magnitude_ratio": -0.3524128496646881,
            "singular_value_overlap": -0.0011264709755778313,
            "subspace_overlap": -2.6268365383148193,
            "right_subspace_overlap": 2.3135147094726562,
            "encoder_gradient_cosine_similarity": 0.3381931781768799,
            "encoder_gradient_l2_distance": -1.4045214653015137,
            "encoder_gradient_dot_product": 0.2952536642551422,
            "input_gradient_cosine_similarity": 0.145969957113266,
            "input_gradient_l2_distance": -0.8924943804740906,
            "input_gradient_dot_product": -0.5997004508972168
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.629258301481251,
          "val_r": 0.7364163630560443,
          "n_iterations": 618,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.959654808044434,
            "right_subspace_overlap_bottom_k": -24.414012908935547,
            "interaction_matrix_overlap_top_k": 62.35435485839844,
            "interaction_matrix_overlap_bottom_k": -19.994949340820312,
            "effective_rank": -6.128098964691162,
            "effective_rank_mergeability_score": 15.43166446685791,
            "stable_rank": -17.026485443115234,
            "spectral_gap": 4.79395055770874,
            "singular_value_ratio": -9.442439079284668,
            "layerwise_effective_rank": -5.772395610809326,
            "layerwise_effective_rank_mergeability_score": -11.50314712524414,
            "task_vector_cosine_similarity": 62.59025573730469,
            "task_vector_l2_distance": -1.1867481470108032,
            "task_vector_dot_product": -6.668182849884033,
            "weight_space_angle": -1.935566782951355,
            "task_vector_magnitude_ratio": 30.324426651000977,
            "singular_value_overlap": 23.692346572875977,
            "subspace_overlap": -3.6346404552459717,
            "right_subspace_overlap": 23.697519302368164,
            "encoder_gradient_cosine_similarity": 41.29556655883789,
            "encoder_gradient_l2_distance": -62.6771354675293,
            "encoder_gradient_dot_product": 11.581403732299805,
            "input_gradient_cosine_similarity": 5.238542079925537,
            "input_gradient_l2_distance": -74.91732025146484,
            "input_gradient_dot_product": -44.66096878051758
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.7790270159799468,
          "val_r": 0.6999502506492411,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 5.441356182098389,
            "right_subspace_overlap_bottom_k": -3.8070268630981445,
            "interaction_matrix_overlap_top_k": 3.559030055999756,
            "interaction_matrix_overlap_bottom_k": -2.8010973930358887,
            "effective_rank": 0.7914722561836243,
            "effective_rank_mergeability_score": 1.4214928150177002,
            "stable_rank": -2.775038480758667,
            "spectral_gap": 6.940905570983887,
            "singular_value_ratio": 3.6927669048309326,
            "layerwise_effective_rank": 1.247322916984558,
            "layerwise_effective_rank_mergeability_score": -2.063248634338379,
            "task_vector_cosine_similarity": -2.397775411605835,
            "task_vector_l2_distance": -3.3664662837982178,
            "task_vector_dot_product": 2.379812240600586,
            "weight_space_angle": -0.48706644773483276,
            "task_vector_magnitude_ratio": 3.1371116638183594,
            "singular_value_overlap": 3.082728624343872,
            "subspace_overlap": -9.982644081115723,
            "right_subspace_overlap": 6.180954933166504,
            "encoder_gradient_cosine_similarity": 1.1135538816452026,
            "encoder_gradient_l2_distance": -6.981871128082275,
            "encoder_gradient_dot_product": 1.3775967359542847,
            "input_gradient_cosine_similarity": 0.5431467890739441,
            "input_gradient_l2_distance": -3.3368935585021973,
            "input_gradient_dot_product": -1.911065697669983
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5790384972891656,
          "val_r": 0.6768403096553164,
          "n_iterations": 816,
          "coefficients": {
            "right_subspace_overlap_top_k": 14.90977954864502,
            "right_subspace_overlap_bottom_k": -49.54831314086914,
            "interaction_matrix_overlap_top_k": 27.799217224121094,
            "interaction_matrix_overlap_bottom_k": -35.8800163269043,
            "effective_rank": -27.263368606567383,
            "effective_rank_mergeability_score": -33.489288330078125,
            "stable_rank": -41.55125045776367,
            "spectral_gap": 13.870603561401367,
            "singular_value_ratio": 28.011783599853516,
            "layerwise_effective_rank": 27.037277221679688,
            "layerwise_effective_rank_mergeability_score": 13.145715713500977,
            "task_vector_cosine_similarity": 50.83049774169922,
            "task_vector_l2_distance": 15.118517875671387,
            "task_vector_dot_product": 11.27409839630127,
            "weight_space_angle": -33.37371826171875,
            "task_vector_magnitude_ratio": 3.802959442138672,
            "singular_value_overlap": 30.570146560668945,
            "subspace_overlap": 68.5987319946289,
            "right_subspace_overlap": -32.21512985229492,
            "encoder_gradient_cosine_similarity": 30.147212982177734,
            "encoder_gradient_l2_distance": -49.23640441894531,
            "encoder_gradient_dot_product": 5.657569885253906,
            "input_gradient_cosine_similarity": 7.1517839431762695,
            "input_gradient_l2_distance": -61.344913482666016,
            "input_gradient_dot_product": 16.9746036529541
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7159204135891603,
          "val_r": 0.689844929971069,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 2.0224545001983643,
            "right_subspace_overlap_bottom_k": -3.3090426921844482,
            "interaction_matrix_overlap_top_k": 1.193803071975708,
            "interaction_matrix_overlap_bottom_k": 0.6667261719703674,
            "effective_rank": 1.9366470575332642,
            "effective_rank_mergeability_score": 0.7802411913871765,
            "stable_rank": -0.8420431017875671,
            "spectral_gap": 1.4304769039154053,
            "singular_value_ratio": 1.3639343976974487,
            "layerwise_effective_rank": -0.20991410315036774,
            "layerwise_effective_rank_mergeability_score": 0.29965469241142273,
            "task_vector_cosine_similarity": 1.4792081117630005,
            "task_vector_l2_distance": -1.2992231845855713,
            "task_vector_dot_product": 0.7268633246421814,
            "weight_space_angle": 1.1913421154022217,
            "task_vector_magnitude_ratio": -0.3073752820491791,
            "singular_value_overlap": 0.8218332529067993,
            "subspace_overlap": -3.0835883617401123,
            "right_subspace_overlap": 1.6335442066192627,
            "encoder_gradient_cosine_similarity": 1.0071847438812256,
            "encoder_gradient_l2_distance": -3.394143581390381,
            "encoder_gradient_dot_product": 0.9818428158760071,
            "input_gradient_cosine_similarity": 0.0301649272441864,
            "input_gradient_l2_distance": -2.8643686771392822,
            "input_gradient_dot_product": -1.2566584348678589
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4829327105055029,
          "val_r": 0.620234887882532,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 695.4249267578125,
            "right_subspace_overlap_bottom_k": -222.54833984375,
            "interaction_matrix_overlap_top_k": 222.08056640625,
            "interaction_matrix_overlap_bottom_k": 236.5356903076172,
            "effective_rank": 165.07479858398438,
            "effective_rank_mergeability_score": 295.53533935546875,
            "stable_rank": 457.72235107421875,
            "spectral_gap": 135.7885284423828,
            "singular_value_ratio": -7.342919826507568,
            "layerwise_effective_rank": -52.84562683105469,
            "layerwise_effective_rank_mergeability_score": -71.8589859008789,
            "task_vector_cosine_similarity": 28.959762573242188,
            "task_vector_l2_distance": -56.991294860839844,
            "task_vector_dot_product": -370.6653137207031,
            "weight_space_angle": -112.2515869140625,
            "task_vector_magnitude_ratio": -233.2469024658203,
            "singular_value_overlap": 191.39675903320312,
            "subspace_overlap": -68.48626708984375,
            "right_subspace_overlap": -595.7764892578125,
            "encoder_gradient_cosine_similarity": 137.3548126220703,
            "encoder_gradient_l2_distance": -358.9044189453125,
            "encoder_gradient_dot_product": 330.82305908203125,
            "input_gradient_cosine_similarity": -309.602294921875,
            "input_gradient_l2_distance": -147.7714385986328,
            "input_gradient_dot_product": -287.4062805175781
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6963643618631511,
          "val_r": 0.7563168839942555,
          "n_iterations": 883,
          "coefficients": {
            "right_subspace_overlap_top_k": 64.5670394897461,
            "right_subspace_overlap_bottom_k": -17.225711822509766,
            "interaction_matrix_overlap_top_k": 29.865644454956055,
            "interaction_matrix_overlap_bottom_k": -36.043296813964844,
            "effective_rank": 0.6510544419288635,
            "effective_rank_mergeability_score": -25.409440994262695,
            "stable_rank": 12.271642684936523,
            "spectral_gap": 54.711238861083984,
            "singular_value_ratio": -18.882946014404297,
            "layerwise_effective_rank": -17.371795654296875,
            "layerwise_effective_rank_mergeability_score": 46.26939010620117,
            "task_vector_cosine_similarity": 41.75468063354492,
            "task_vector_l2_distance": -28.458065032958984,
            "task_vector_dot_product": -11.140473365783691,
            "weight_space_angle": -6.176599502563477,
            "task_vector_magnitude_ratio": 83.31450653076172,
            "singular_value_overlap": 3.18609881401062,
            "subspace_overlap": -8.110136985778809,
            "right_subspace_overlap": -22.66680335998535,
            "encoder_gradient_cosine_similarity": 37.178035736083984,
            "encoder_gradient_l2_distance": -93.27980041503906,
            "encoder_gradient_dot_product": 15.073698043823242,
            "input_gradient_cosine_similarity": -16.198951721191406,
            "input_gradient_l2_distance": -43.182010650634766,
            "input_gradient_dot_product": -43.69871520996094
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "isotropic": {
      "aggregate_metrics": {
        "train_r": 0.16727052636986867,
        "train_p": 1.1953097159150748e-21,
        "val_r": 0.19602247759523134,
        "val_p": 0.0001897999447864549
      },
      "per_fold_stats": {
        "train_r_mean": 0.4806556586097314,
        "train_r_std": 0.09117042485445828,
        "val_r_mean": 0.37584147475286855,
        "val_r_std": 0.20419107919939009
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 48.140846252441406,
        "right_subspace_overlap_bottom_k": 36.38416290283203,
        "interaction_matrix_overlap_top_k": 5.945261478424072,
        "interaction_matrix_overlap_bottom_k": 39.328609466552734,
        "effective_rank": -4.18609619140625,
        "effective_rank_mergeability_score": 7.503643989562988,
        "stable_rank": -3.0267465114593506,
        "spectral_gap": 0.3822577893733978,
        "singular_value_ratio": -21.330726623535156,
        "layerwise_effective_rank": -5.568869590759277,
        "layerwise_effective_rank_mergeability_score": -11.3728609085083,
        "task_vector_cosine_similarity": -3.768975019454956,
        "task_vector_l2_distance": -35.93769454956055,
        "task_vector_dot_product": -8.367576599121094,
        "weight_space_angle": 29.854145050048828,
        "task_vector_magnitude_ratio": -7.449483394622803,
        "singular_value_overlap": -42.277854919433594,
        "subspace_overlap": 17.339656829833984,
        "right_subspace_overlap": 17.883533477783203,
        "encoder_gradient_cosine_similarity": 14.315057754516602,
        "encoder_gradient_l2_distance": -25.734664916992188,
        "encoder_gradient_dot_product": 22.976688385009766,
        "input_gradient_cosine_similarity": 18.087373733520508,
        "input_gradient_l2_distance": -46.508689880371094,
        "input_gradient_dot_product": -41.61314010620117
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 51.13064956665039,
        "right_subspace_overlap_bottom_k": 65.27442932128906,
        "interaction_matrix_overlap_top_k": 41.54039001464844,
        "interaction_matrix_overlap_bottom_k": 49.813236236572266,
        "effective_rank": 56.09489822387695,
        "effective_rank_mergeability_score": 47.82360076904297,
        "stable_rank": 31.38559913635254,
        "spectral_gap": 34.13792419433594,
        "singular_value_ratio": 37.796295166015625,
        "layerwise_effective_rank": 33.98410415649414,
        "layerwise_effective_rank_mergeability_score": 45.553863525390625,
        "task_vector_cosine_similarity": 40.3008918762207,
        "task_vector_l2_distance": 43.703895568847656,
        "task_vector_dot_product": 44.586219787597656,
        "weight_space_angle": 71.57379150390625,
        "task_vector_magnitude_ratio": 30.82371711730957,
        "singular_value_overlap": 32.79603958129883,
        "subspace_overlap": 32.509300231933594,
        "right_subspace_overlap": 28.939348220825195,
        "encoder_gradient_cosine_similarity": 26.119535446166992,
        "encoder_gradient_l2_distance": 43.2000732421875,
        "encoder_gradient_dot_product": 45.62858963012695,
        "input_gradient_cosine_similarity": 18.023555755615234,
        "input_gradient_l2_distance": 46.92709732055664,
        "input_gradient_dot_product": 63.99600601196289
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.49035500096240414,
          "val_r": 0.5897749418371877,
          "n_iterations": 683,
          "coefficients": {
            "right_subspace_overlap_top_k": 68.73896026611328,
            "right_subspace_overlap_bottom_k": 91.37103271484375,
            "interaction_matrix_overlap_top_k": 31.14832878112793,
            "interaction_matrix_overlap_bottom_k": 69.36382293701172,
            "effective_rank": -8.577086448669434,
            "effective_rank_mergeability_score": 44.32826232910156,
            "stable_rank": -14.363791465759277,
            "spectral_gap": 36.11246109008789,
            "singular_value_ratio": -18.207965850830078,
            "layerwise_effective_rank": -4.282628059387207,
            "layerwise_effective_rank_mergeability_score": -42.51250076293945,
            "task_vector_cosine_similarity": 73.19514465332031,
            "task_vector_l2_distance": -119.96896362304688,
            "task_vector_dot_product": 23.724576950073242,
            "weight_space_angle": 49.45371627807617,
            "task_vector_magnitude_ratio": -5.297768592834473,
            "singular_value_overlap": -95.88085174560547,
            "subspace_overlap": 38.84658432006836,
            "right_subspace_overlap": -9.54377269744873,
            "encoder_gradient_cosine_similarity": -3.9951119422912598,
            "encoder_gradient_l2_distance": -102.61593627929688,
            "encoder_gradient_dot_product": 51.451873779296875,
            "input_gradient_cosine_similarity": 50.68821716308594,
            "input_gradient_l2_distance": -97.03130340576172,
            "input_gradient_dot_product": -105.14765167236328
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5432245058818463,
          "val_r": 0.5197328463708625,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 1.1730304956436157,
            "right_subspace_overlap_bottom_k": 5.983649253845215,
            "interaction_matrix_overlap_top_k": 1.4287620782852173,
            "interaction_matrix_overlap_bottom_k": 0.8823767304420471,
            "effective_rank": -0.040070656687021255,
            "effective_rank_mergeability_score": 3.375462532043457,
            "stable_rank": 0.46151888370513916,
            "spectral_gap": 0.31819936633110046,
            "singular_value_ratio": 1.1532124280929565,
            "layerwise_effective_rank": 3.736110210418701,
            "layerwise_effective_rank_mergeability_score": 1.5772892236709595,
            "task_vector_cosine_similarity": 1.262204647064209,
            "task_vector_l2_distance": -4.911165237426758,
            "task_vector_dot_product": 1.1923397779464722,
            "weight_space_angle": 0.8390842080116272,
            "task_vector_magnitude_ratio": -2.2200582027435303,
            "singular_value_overlap": -3.9218456745147705,
            "subspace_overlap": -1.608397364616394,
            "right_subspace_overlap": -1.7169439792633057,
            "encoder_gradient_cosine_similarity": -0.04548614099621773,
            "encoder_gradient_l2_distance": -4.299805641174316,
            "encoder_gradient_dot_product": 0.5524417757987976,
            "input_gradient_cosine_similarity": 1.2432482242584229,
            "input_gradient_l2_distance": -4.03558874130249,
            "input_gradient_dot_product": -1.3803950548171997
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5193761053119121,
          "val_r": 0.413398495600589,
          "n_iterations": 424,
          "coefficients": {
            "right_subspace_overlap_top_k": 7.439212799072266,
            "right_subspace_overlap_bottom_k": 28.560771942138672,
            "interaction_matrix_overlap_top_k": 32.49717712402344,
            "interaction_matrix_overlap_bottom_k": 37.39506912231445,
            "effective_rank": 15.862244606018066,
            "effective_rank_mergeability_score": -3.6840758323669434,
            "stable_rank": 1.5780128240585327,
            "spectral_gap": 6.154335021972656,
            "singular_value_ratio": -16.540281295776367,
            "layerwise_effective_rank": 5.565829277038574,
            "layerwise_effective_rank_mergeability_score": 16.927337646484375,
            "task_vector_cosine_similarity": -2.214674949645996,
            "task_vector_l2_distance": -40.83401870727539,
            "task_vector_dot_product": 2.5227065086364746,
            "weight_space_angle": 7.882326602935791,
            "task_vector_magnitude_ratio": -12.583118438720703,
            "singular_value_overlap": -51.556156158447266,
            "subspace_overlap": 19.336524963378906,
            "right_subspace_overlap": -8.17296314239502,
            "encoder_gradient_cosine_similarity": 2.0466208457946777,
            "encoder_gradient_l2_distance": -25.047700881958008,
            "encoder_gradient_dot_product": 18.198028564453125,
            "input_gradient_cosine_similarity": 26.899076461791992,
            "input_gradient_l2_distance": -37.704261779785156,
            "input_gradient_dot_product": -29.531381607055664
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.579966174092056,
          "val_r": 0.48679996125164293,
          "n_iterations": 847,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.1486072987318039,
            "right_subspace_overlap_bottom_k": -0.9435663223266602,
            "interaction_matrix_overlap_top_k": -1.4640766382217407,
            "interaction_matrix_overlap_bottom_k": 1.4903098344802856,
            "effective_rank": 0.4781189262866974,
            "effective_rank_mergeability_score": 0.8408353924751282,
            "stable_rank": 0.3295753300189972,
            "spectral_gap": 0.3973301947116852,
            "singular_value_ratio": 0.4303008019924164,
            "layerwise_effective_rank": 0.2195240706205368,
            "layerwise_effective_rank_mergeability_score": 0.18679897487163544,
            "task_vector_cosine_similarity": -0.4655703008174896,
            "task_vector_l2_distance": -0.3021492063999176,
            "task_vector_dot_product": 0.3631507456302643,
            "weight_space_angle": -0.5819677114486694,
            "task_vector_magnitude_ratio": -0.19536836445331573,
            "singular_value_overlap": -0.3029221296310425,
            "subspace_overlap": 0.17772604525089264,
            "right_subspace_overlap": 0.591036856174469,
            "encoder_gradient_cosine_similarity": -0.018472040072083473,
            "encoder_gradient_l2_distance": -0.11984168738126755,
            "encoder_gradient_dot_product": 0.010038339532911777,
            "input_gradient_cosine_similarity": 0.09410955756902695,
            "input_gradient_l2_distance": -0.2772441506385803,
            "input_gradient_dot_product": -0.08771701157093048
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.30807196273297327,
          "val_r": 0.2773285391322126,
          "n_iterations": 468,
          "coefficients": {
            "right_subspace_overlap_top_k": 130.7686004638672,
            "right_subspace_overlap_bottom_k": 62.0387077331543,
            "interaction_matrix_overlap_top_k": -57.95948028564453,
            "interaction_matrix_overlap_bottom_k": 138.101318359375,
            "effective_rank": -95.37885284423828,
            "effective_rank_mergeability_score": 14.902533531188965,
            "stable_rank": -68.5762939453125,
            "spectral_gap": 43.962913513183594,
            "singular_value_ratio": 25.943735122680664,
            "layerwise_effective_rank": -16.68250846862793,
            "layerwise_effective_rank_mergeability_score": -93.28252410888672,
            "task_vector_cosine_similarity": 8.395706176757812,
            "task_vector_l2_distance": 83.86421203613281,
            "task_vector_dot_product": -46.50307846069336,
            "weight_space_angle": -75.29857635498047,
            "task_vector_magnitude_ratio": 27.581106185913086,
            "singular_value_overlap": -76.0792465209961,
            "subspace_overlap": 51.7332649230957,
            "right_subspace_overlap": 22.63361167907715,
            "encoder_gradient_cosine_similarity": 3.030287027359009,
            "encoder_gradient_l2_distance": -20.232995986938477,
            "encoder_gradient_dot_product": -21.400075912475586,
            "input_gradient_cosine_similarity": 54.47825622558594,
            "input_gradient_l2_distance": -56.36189270019531,
            "input_gradient_dot_product": -38.68196105957031
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.501065650851966,
          "val_r": 0.7885234591937846,
          "n_iterations": 827,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.45708075165748596,
            "right_subspace_overlap_bottom_k": -24.651683807373047,
            "interaction_matrix_overlap_top_k": -19.98405647277832,
            "interaction_matrix_overlap_bottom_k": 122.3342514038086,
            "effective_rank": 5.601956844329834,
            "effective_rank_mergeability_score": 75.49422454833984,
            "stable_rank": 18.2579402923584,
            "spectral_gap": -50.08512878417969,
            "singular_value_ratio": -16.114686965942383,
            "layerwise_effective_rank": 44.413875579833984,
            "layerwise_effective_rank_mergeability_score": -17.022911071777344,
            "task_vector_cosine_similarity": 40.059261322021484,
            "task_vector_l2_distance": -67.31298065185547,
            "task_vector_dot_product": -9.179458618164062,
            "weight_space_angle": 65.38018035888672,
            "task_vector_magnitude_ratio": -77.51123046875,
            "singular_value_overlap": -49.50196075439453,
            "subspace_overlap": -6.73118257522583,
            "right_subspace_overlap": 65.20758056640625,
            "encoder_gradient_cosine_similarity": -23.36789894104004,
            "encoder_gradient_l2_distance": -31.625972747802734,
            "encoder_gradient_dot_product": 20.550329208374023,
            "input_gradient_cosine_similarity": 19.949304580688477,
            "input_gradient_l2_distance": -91.67476654052734,
            "input_gradient_dot_product": 8.056106567382812
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.5103951402716695,
          "val_r": -0.12236797934569221,
          "n_iterations": 771,
          "coefficients": {
            "right_subspace_overlap_top_k": 42.279197692871094,
            "right_subspace_overlap_bottom_k": 29.664146423339844,
            "interaction_matrix_overlap_top_k": -12.54101276397705,
            "interaction_matrix_overlap_bottom_k": 23.590370178222656,
            "effective_rank": -14.451151847839355,
            "effective_rank_mergeability_score": 9.533377647399902,
            "stable_rank": 31.096492767333984,
            "spectral_gap": 1.2811329364776611,
            "singular_value_ratio": -19.156038284301758,
            "layerwise_effective_rank": 0.7340141534805298,
            "layerwise_effective_rank_mergeability_score": -0.5556400418281555,
            "task_vector_cosine_similarity": 6.814720630645752,
            "task_vector_l2_distance": -56.55878448486328,
            "task_vector_dot_product": 9.925479888916016,
            "weight_space_angle": 65.87046813964844,
            "task_vector_magnitude_ratio": -22.49587631225586,
            "singular_value_overlap": -24.0910587310791,
            "subspace_overlap": 9.785345077514648,
            "right_subspace_overlap": 16.643905639648438,
            "encoder_gradient_cosine_similarity": 14.168031692504883,
            "encoder_gradient_l2_distance": -56.94136428833008,
            "encoder_gradient_dot_product": 32.49527359008789,
            "input_gradient_cosine_similarity": -3.7216618061065674,
            "input_gradient_l2_distance": -27.988113403320312,
            "input_gradient_dot_product": -54.383155822753906
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.36052520601603,
          "val_r": 0.2017799703031678,
          "n_iterations": 564,
          "coefficients": {
            "right_subspace_overlap_top_k": 162.6822967529297,
            "right_subspace_overlap_bottom_k": 40.73015594482422,
            "interaction_matrix_overlap_top_k": 56.48323059082031,
            "interaction_matrix_overlap_bottom_k": 1.1527973413467407,
            "effective_rank": 77.42587280273438,
            "effective_rank_mergeability_score": -68.17317962646484,
            "stable_rank": 45.50536346435547,
            "spectral_gap": 35.732948303222656,
            "singular_value_ratio": -120.54551696777344,
            "layerwise_effective_rank": -92.60032653808594,
            "layerwise_effective_rank_mergeability_score": 40.35059356689453,
            "task_vector_cosine_similarity": -77.54119873046875,
            "task_vector_l2_distance": 2.7235803604125977,
            "task_vector_dot_product": -151.60519409179688,
            "weight_space_angle": -10.938498497009277,
            "task_vector_magnitude_ratio": 29.817665100097656,
            "singular_value_overlap": -100.14379119873047,
            "subspace_overlap": 63.11049270629883,
            "right_subspace_overlap": 85.23873901367188,
            "encoder_gradient_cosine_similarity": 39.64943313598633,
            "encoder_gradient_l2_distance": 12.539162635803223,
            "encoder_gradient_dot_product": -16.206520080566406,
            "input_gradient_cosine_similarity": 0.9239580035209656,
            "input_gradient_l2_distance": -49.030303955078125,
            "input_gradient_dot_product": -6.284627437591553
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.4626262996150136,
          "val_r": 0.08626025633336071,
          "n_iterations": 562,
          "coefficients": {
            "right_subspace_overlap_top_k": 22.86854362487793,
            "right_subspace_overlap_bottom_k": 29.052242279052734,
            "interaction_matrix_overlap_top_k": 2.8914451599121094,
            "interaction_matrix_overlap_bottom_k": 11.669437408447266,
            "effective_rank": -3.7022366523742676,
            "effective_rank_mergeability_score": 8.753951072692871,
            "stable_rank": -8.223271369934082,
            "spectral_gap": 18.251188278198242,
            "singular_value_ratio": -12.545366287231445,
            "layerwise_effective_rank": 16.745704650878906,
            "layerwise_effective_rank_mergeability_score": -14.779810905456543,
            "task_vector_cosine_similarity": -1.9639562368392944,
            "task_vector_l2_distance": -25.07731819152832,
            "task_vector_dot_product": -18.087566375732422,
            "weight_space_angle": -0.14558765292167664,
            "task_vector_magnitude_ratio": -8.301324844360352,
            "singular_value_overlap": -46.397220611572266,
            "subspace_overlap": 9.588438987731934,
            "right_subspace_overlap": 46.38581466674805,
            "encoder_gradient_cosine_similarity": 40.027976989746094,
            "encoder_gradient_l2_distance": -33.93938446044922,
            "encoder_gradient_dot_product": 27.2001953125,
            "input_gradient_cosine_similarity": 18.871225357055664,
            "input_gradient_l2_distance": -32.4463005065918,
            "input_gradient_dot_product": -45.69949722290039
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.43018916804935015,
          "val_r": 0.3443708159487475,
          "n_iterations": 478,
          "coefficients": {
            "right_subspace_overlap_top_k": 109.91810607910156,
            "right_subspace_overlap_bottom_k": -31.887969970703125,
            "interaction_matrix_overlap_top_k": 53.033607482910156,
            "interaction_matrix_overlap_bottom_k": 151.68173217773438,
            "effective_rank": -70.0858154296875,
            "effective_rank_mergeability_score": 85.3682861328125,
            "stable_rank": -31.735443115234375,
            "spectral_gap": 15.583147048950195,
            "singular_value_ratio": -15.10242748260498,
            "layerwise_effective_rank": 11.590651512145996,
            "layerwise_effective_rank_mergeability_score": -80.56339263916016,
            "task_vector_cosine_similarity": 33.413108825683594,
            "task_vector_l2_distance": -44.22798156738281,
            "task_vector_dot_product": -73.55093383789062,
            "weight_space_angle": 30.21847152709961,
            "task_vector_magnitude_ratio": 38.7833251953125,
            "singular_value_overlap": -76.51423645019531,
            "subspace_overlap": -44.180450439453125,
            "right_subspace_overlap": 65.75931549072266,
            "encoder_gradient_cosine_similarity": 28.24026107788086,
            "encoder_gradient_l2_distance": -96.65394592285156,
            "encoder_gradient_dot_product": 39.627166748046875,
            "input_gradient_cosine_similarity": 19.98988151550293,
            "input_gradient_l2_distance": -35.18590545654297,
            "input_gradient_dot_product": -82.52163696289062
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5278138905116996,
          "val_r": 0.41308973333058924,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": -0.9289132952690125,
            "right_subspace_overlap_bottom_k": 1.747924566268921,
            "interaction_matrix_overlap_top_k": -1.5441263914108276,
            "interaction_matrix_overlap_bottom_k": 2.561368942260742,
            "effective_rank": 0.3748024106025696,
            "effective_rank_mergeability_score": 1.8469417095184326,
            "stable_rank": 0.23585182428359985,
            "spectral_gap": 1.569064736366272,
            "singular_value_ratio": 0.8856971859931946,
            "layerwise_effective_rank": 0.40628114342689514,
            "layerwise_effective_rank_mergeability_score": -0.2704800069332123,
            "task_vector_cosine_similarity": 0.276921808719635,
            "task_vector_l2_distance": -2.6058290004730225,
            "task_vector_dot_product": 0.530279815196991,
            "weight_space_angle": 0.23550084233283997,
            "task_vector_magnitude_ratio": 0.1358768492937088,
            "singular_value_overlap": -2.1662657260894775,
            "subspace_overlap": 0.47068852186203003,
            "right_subspace_overlap": 0.8605725169181824,
            "encoder_gradient_cosine_similarity": -0.09770075231790543,
            "encoder_gradient_l2_distance": -1.4256117343902588,
            "encoder_gradient_dot_product": -0.20953790843486786,
            "input_gradient_cosine_similarity": 0.6213029623031616,
            "input_gradient_l2_distance": -1.9070841073989868,
            "input_gradient_dot_product": -0.6036344170570374
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5161946070826372,
          "val_r": 0.5225564417501579,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": -5.518855094909668,
            "right_subspace_overlap_bottom_k": 4.472259044647217,
            "interaction_matrix_overlap_top_k": -11.92236614227295,
            "interaction_matrix_overlap_bottom_k": 36.340152740478516,
            "effective_rank": -4.099583148956299,
            "effective_rank_mergeability_score": 13.049490928649902,
            "stable_rank": -3.0482888221740723,
            "spectral_gap": -2.996523857116699,
            "singular_value_ratio": -24.1809024810791,
            "layerwise_effective_rank": 34.68445587158203,
            "layerwise_effective_rank_mergeability_score": 13.379128456115723,
            "task_vector_cosine_similarity": -35.865966796875,
            "task_vector_l2_distance": -30.150726318359375,
            "task_vector_dot_product": 40.0901985168457,
            "weight_space_angle": 19.57472038269043,
            "task_vector_magnitude_ratio": 6.2103095054626465,
            "singular_value_overlap": -28.33283233642578,
            "subspace_overlap": 33.10106658935547,
            "right_subspace_overlap": -0.43663856387138367,
            "encoder_gradient_cosine_similarity": 3.752599000930786,
            "encoder_gradient_l2_distance": -18.05718421936035,
            "encoder_gradient_dot_product": 0.7705238461494446,
            "input_gradient_cosine_similarity": 7.9250359535217285,
            "input_gradient_l2_distance": -21.743118286132812,
            "input_gradient_dot_product": -25.998279571533203
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.30568408561981003,
          "val_r": 0.20563159363478284,
          "n_iterations": 487,
          "coefficients": {
            "right_subspace_overlap_top_k": 144.8486785888672,
            "right_subspace_overlap_bottom_k": 268.0596618652344,
            "interaction_matrix_overlap_top_k": 136.26754760742188,
            "interaction_matrix_overlap_bottom_k": -49.37776184082031,
            "effective_rank": -143.35818481445312,
            "effective_rank_mergeability_score": -140.46041870117188,
            "stable_rank": 54.77898406982422,
            "spectral_gap": 9.353631973266602,
            "singular_value_ratio": -124.66056060791016,
            "layerwise_effective_rank": -35.83803176879883,
            "layerwise_effective_rank_mergeability_score": -117.64078521728516,
            "task_vector_cosine_similarity": -102.24683380126953,
            "task_vector_l2_distance": -101.19844055175781,
            "task_vector_dot_product": -9.010933876037598,
            "weight_space_angle": 307.7027587890625,
            "task_vector_magnitude_ratio": -50.191219329833984,
            "singular_value_overlap": 4.521020889282227,
            "subspace_overlap": -6.883511066436768,
            "right_subspace_overlap": 17.470035552978516,
            "encoder_gradient_cosine_similarity": 106.6142807006836,
            "encoder_gradient_l2_distance": 109.1449203491211,
            "encoder_gradient_dot_product": 202.94985961914062,
            "input_gradient_cosine_similarity": 29.562210083007812,
            "input_gradient_l2_distance": -218.01287841796875,
            "input_gradient_dot_product": -291.3970947265625
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.3785328335015252,
          "val_r": 0.533250629795134,
          "n_iterations": 460,
          "coefficients": {
            "right_subspace_overlap_top_k": 62.11006164550781,
            "right_subspace_overlap_bottom_k": 134.5089569091797,
            "interaction_matrix_overlap_top_k": -31.567453384399414,
            "interaction_matrix_overlap_bottom_k": 3.839534044265747,
            "effective_rank": 135.1576385498047,
            "effective_rank_mergeability_score": 21.524856567382812,
            "stable_rank": -16.38140296936035,
            "spectral_gap": -108.87533569335938,
            "singular_value_ratio": -31.841753005981445,
            "layerwise_effective_rank": -97.14534759521484,
            "layerwise_effective_rank_mergeability_score": 76.30431365966797,
            "task_vector_cosine_similarity": -73.606201171875,
            "task_vector_l2_distance": -84.81754302978516,
            "task_vector_dot_product": 42.99125289916992,
            "weight_space_angle": -7.702002048492432,
            "task_vector_magnitude_ratio": -73.95779418945312,
            "singular_value_overlap": -47.57358932495117,
            "subspace_overlap": 21.47244644165039,
            "right_subspace_overlap": 51.58564758300781,
            "encoder_gradient_cosine_similarity": 22.3166446685791,
            "encoder_gradient_l2_distance": -35.274871826171875,
            "encoder_gradient_dot_product": 54.64216613769531,
            "input_gradient_cosine_similarity": 21.1329402923584,
            "input_gradient_l2_distance": -26.762996673583984,
            "input_gradient_dot_product": -11.083422660827637
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4433133670242425,
          "val_r": 0.4785354534298062,
          "n_iterations": 572,
          "coefficients": {
            "right_subspace_overlap_top_k": 28.396949768066406,
            "right_subspace_overlap_bottom_k": 12.875178337097168,
            "interaction_matrix_overlap_top_k": -53.114280700683594,
            "interaction_matrix_overlap_bottom_k": 76.3102798461914,
            "effective_rank": -46.33253860473633,
            "effective_rank_mergeability_score": 60.363121032714844,
            "stable_rank": -12.166237831115723,
            "spectral_gap": 33.985660552978516,
            "singular_value_ratio": 12.785435676574707,
            "layerwise_effective_rank": 12.433923721313477,
            "layerwise_effective_rank_mergeability_score": -55.007450103759766,
            "task_vector_cosine_similarity": 6.2922892570495605,
            "task_vector_l2_distance": -72.34312438964844,
            "task_vector_dot_product": 57.47235870361328,
            "weight_space_angle": 72.90451049804688,
            "task_vector_magnitude_ratio": 35.9095458984375,
            "singular_value_overlap": -19.434919357299805,
            "subspace_overlap": -14.383398056030273,
            "right_subspace_overlap": 7.94785213470459,
            "encoder_gradient_cosine_similarity": 3.1097183227539062,
            "encoder_gradient_l2_distance": -75.69548034667969,
            "encoder_gradient_dot_product": 7.1040544509887695,
            "input_gradient_cosine_similarity": 4.462813377380371,
            "input_gradient_l2_distance": -49.635929107666016,
            "input_gradient_dot_product": -33.24272918701172
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.5030645025087592,
          "val_r": 0.47015844980365146,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 30.430320739746094,
            "right_subspace_overlap_bottom_k": 9.342302322387695,
            "interaction_matrix_overlap_top_k": -10.610379219055176,
            "interaction_matrix_overlap_bottom_k": 29.569334030151367,
            "effective_rank": 17.50119400024414,
            "effective_rank_mergeability_score": 8.9680757522583,
            "stable_rank": 4.15904426574707,
            "spectral_gap": 16.7138614654541,
            "singular_value_ratio": 3.464359760284424,
            "layerwise_effective_rank": 9.963279724121094,
            "layerwise_effective_rank_mergeability_score": 20.05629539489746,
            "task_vector_cosine_similarity": -15.608606338500977,
            "task_vector_l2_distance": -39.64502716064453,
            "task_vector_dot_product": -8.45919418334961,
            "weight_space_angle": 1.4570444822311401,
            "task_vector_magnitude_ratio": -12.994205474853516,
            "singular_value_overlap": -45.4717903137207,
            "subspace_overlap": 32.190731048583984,
            "right_subspace_overlap": 25.35483741760254,
            "encoder_gradient_cosine_similarity": -4.529555320739746,
            "encoder_gradient_l2_distance": -29.989044189453125,
            "encoder_gradient_dot_product": 2.8434348106384277,
            "input_gradient_cosine_similarity": 23.427230834960938,
            "input_gradient_l2_distance": -45.91779327392578,
            "input_gradient_dot_product": -21.217273712158203
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.43497390105830996,
          "val_r": 0.43893015703367433,
          "n_iterations": 502,
          "coefficients": {
            "right_subspace_overlap_top_k": 39.26821517944336,
            "right_subspace_overlap_bottom_k": 34.53630065917969,
            "interaction_matrix_overlap_top_k": 5.755978107452393,
            "interaction_matrix_overlap_bottom_k": 50.7833366394043,
            "effective_rank": 12.63242244720459,
            "effective_rank_mergeability_score": -19.273468017578125,
            "stable_rank": -63.63522720336914,
            "spectral_gap": 5.2849650382995605,
            "singular_value_ratio": -23.802385330200195,
            "layerwise_effective_rank": 7.549988746643066,
            "layerwise_effective_rank_mergeability_score": -22.420076370239258,
            "task_vector_cosine_similarity": 22.635046005249023,
            "task_vector_l2_distance": -54.61371612548828,
            "task_vector_dot_product": 1.950408935546875,
            "weight_space_angle": 1.4450477361679077,
            "task_vector_magnitude_ratio": -5.053354740142822,
            "singular_value_overlap": -91.01947784423828,
            "subspace_overlap": 113.67705535888672,
            "right_subspace_overlap": -11.95635986328125,
            "encoder_gradient_cosine_similarity": 23.4834041595459,
            "encoder_gradient_l2_distance": -22.577468872070312,
            "encoder_gradient_dot_product": 12.386656761169434,
            "input_gradient_cosine_similarity": 56.80369567871094,
            "input_gradient_l2_distance": -17.767169952392578,
            "input_gradient_dot_product": -55.07686233520508
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5376445885751981,
          "val_r": 0.09642133643704012,
          "n_iterations": 631,
          "coefficients": {
            "right_subspace_overlap_top_k": 59.997188568115234,
            "right_subspace_overlap_bottom_k": 43.304691314697266,
            "interaction_matrix_overlap_top_k": -15.09920883178711,
            "interaction_matrix_overlap_bottom_k": 57.66963195800781,
            "effective_rank": 33.4681510925293,
            "effective_rank_mergeability_score": 45.4794921875,
            "stable_rank": 38.84962463378906,
            "spectral_gap": -47.14390182495117,
            "singular_value_ratio": -53.46923828125,
            "layerwise_effective_rank": -11.554999351501465,
            "layerwise_effective_rank_mergeability_score": 23.475278854370117,
            "task_vector_cosine_similarity": 16.741722106933594,
            "task_vector_l2_distance": -48.5473518371582,
            "task_vector_dot_product": -46.494728088378906,
            "weight_space_angle": 28.357898712158203,
            "task_vector_magnitude_ratio": -22.828407287597656,
            "singular_value_overlap": -65.5177001953125,
            "subspace_overlap": 25.114295959472656,
            "right_subspace_overlap": 2.273941993713379,
            "encoder_gradient_cosine_similarity": 14.639039039611816,
            "encoder_gradient_l2_distance": -55.85928726196289,
            "encoder_gradient_dot_product": 8.160496711730957,
            "input_gradient_cosine_similarity": 19.68368148803711,
            "input_gradient_l2_distance": -44.876277923583984,
            "input_gradient_dot_product": -4.826417922973633
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.68519494429954,
          "val_r": 0.5126941103666305,
          "n_iterations": 748,
          "coefficients": {
            "right_subspace_overlap_top_k": 64.12710571289062,
            "right_subspace_overlap_bottom_k": -17.364288330078125,
            "interaction_matrix_overlap_top_k": 18.580259323120117,
            "interaction_matrix_overlap_bottom_k": 11.788349151611328,
            "effective_rank": -5.9719319343566895,
            "effective_rank_mergeability_score": -17.238828659057617,
            "stable_rank": -39.016963958740234,
            "spectral_gap": -5.3347063064575195,
            "singular_value_ratio": 9.357769012451172,
            "layerwise_effective_rank": -5.363479137420654,
            "layerwise_effective_rank_mergeability_score": 16.96213150024414,
            "task_vector_cosine_similarity": 12.859148979187012,
            "task_vector_l2_distance": -2.8919765949249268,
            "task_vector_dot_product": 20.34030532836914,
            "weight_space_angle": 34.219642639160156,
            "task_vector_magnitude_ratio": 11.221487045288086,
            "singular_value_overlap": -19.50408172607422,
            "subspace_overlap": -2.0107338428497314,
            "right_subspace_overlap": -19.48385238647461,
            "encoder_gradient_cosine_similarity": 17.88859748840332,
            "encoder_gradient_l2_distance": -15.101758003234863,
            "encoder_gradient_dot_product": 15.80224609375,
            "input_gradient_cosine_similarity": 5.907066345214844,
            "input_gradient_l2_distance": -60.29434585571289,
            "input_gradient_dot_product": -28.479198455810547
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5749012382276872,
          "val_r": 0.2599602828500406,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": -6.387409210205078,
            "right_subspace_overlap_bottom_k": 6.282735824584961,
            "interaction_matrix_overlap_top_k": -3.3746631145477295,
            "interaction_matrix_overlap_bottom_k": 9.426509857177734,
            "effective_rank": 9.773122787475586,
            "effective_rank_mergeability_score": 5.073939800262451,
            "stable_rank": 1.3595784902572632,
            "spectral_gap": -2.620086431503296,
            "singular_value_ratio": -4.467862606048584,
            "layerwise_effective_rank": 4.0462870597839355,
            "layerwise_effective_rank_mergeability_score": 7.379185199737549,
            "task_vector_cosine_similarity": 12.188231468200684,
            "task_vector_l2_distance": -9.334653854370117,
            "task_vector_dot_product": -5.563469409942627,
            "weight_space_angle": 6.208045482635498,
            "task_vector_magnitude_ratio": -5.019260406494141,
            "singular_value_overlap": -6.668161392211914,
            "subspace_overlap": 3.986131191253662,
            "right_subspace_overlap": 1.0283297300338745,
            "encoder_gradient_cosine_similarity": -0.6115270256996155,
            "encoder_gradient_l2_distance": -10.919710159301758,
            "encoder_gradient_dot_product": 2.6051011085510254,
            "input_gradient_cosine_similarity": 2.8058226108551025,
            "input_gradient_l2_distance": -11.520487785339355,
            "input_gradient_dot_product": -4.6759934425354
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    }
  }
}