{
  "aggregate_metrics": {
    "train_r": 0.3081560084998685,
    "train_p": 7.815410353686358e-72,
    "val_r": 0.25023409597565494,
    "val_p": 1.6301159313618725e-06
  },
  "per_fold_stats": {
    "train_r_mean": 0.5987373357814293,
    "train_r_std": 0.14894481906902488,
    "val_r_mean": 0.5136336458395625,
    "val_r_std": 0.174851013861217
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 30.061878204345703,
    "right_subspace_overlap_bottom_k": -20.329557418823242,
    "interaction_matrix_overlap_top_k": 28.193359375,
    "interaction_matrix_overlap_bottom_k": -13.377527236938477,
    "effective_rank": -0.3749411702156067,
    "effective_rank_mergeability_score": -12.241896629333496,
    "stable_rank": -20.168991088867188,
    "spectral_gap": 2.6433753967285156,
    "singular_value_ratio": 10.26717758178711,
    "layerwise_effective_rank": -4.108586311340332,
    "layerwise_effective_rank_mergeability_score": 6.143611907958984,
    "task_vector_cosine_similarity": 19.856746673583984,
    "task_vector_l2_distance": -13.014312744140625,
    "task_vector_dot_product": 13.921127319335938,
    "weight_space_angle": -10.037684440612793,
    "task_vector_magnitude_ratio": 0.29567378759384155,
    "singular_value_overlap": 1.439159631729126,
    "subspace_overlap": -0.02333373948931694,
    "right_subspace_overlap": 3.858647108078003,
    "encoder_gradient_cosine_similarity": 27.874353408813477,
    "encoder_gradient_l2_distance": -24.457103729248047,
    "encoder_gradient_dot_product": 29.208438873291016,
    "input_gradient_cosine_similarity": 6.365433692932129,
    "input_gradient_l2_distance": -44.449974060058594,
    "input_gradient_dot_product": -16.545608520507812
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 52.609100341796875,
    "right_subspace_overlap_bottom_k": 30.47812271118164,
    "interaction_matrix_overlap_top_k": 40.6084098815918,
    "interaction_matrix_overlap_bottom_k": 27.854665756225586,
    "effective_rank": 32.2656364440918,
    "effective_rank_mergeability_score": 53.114585876464844,
    "stable_rank": 43.567291259765625,
    "spectral_gap": 33.306304931640625,
    "singular_value_ratio": 25.40228271484375,
    "layerwise_effective_rank": 37.01395034790039,
    "layerwise_effective_rank_mergeability_score": 53.09374237060547,
    "task_vector_cosine_similarity": 63.90947341918945,
    "task_vector_l2_distance": 29.839933395385742,
    "task_vector_dot_product": 21.28866958618164,
    "weight_space_angle": 30.869651794433594,
    "task_vector_magnitude_ratio": 25.6010684967041,
    "singular_value_overlap": 21.03470230102539,
    "subspace_overlap": 34.6933479309082,
    "right_subspace_overlap": 46.115211486816406,
    "encoder_gradient_cosine_similarity": 36.19207763671875,
    "encoder_gradient_l2_distance": 36.33167266845703,
    "encoder_gradient_dot_product": 40.47578048706055,
    "input_gradient_cosine_similarity": 20.162046432495117,
    "input_gradient_l2_distance": 49.66156768798828,
    "input_gradient_dot_product": 37.42958068847656
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6800711387035088,
      "val_r": 0.7673876336194255,
      "n_iterations": 801,
      "coefficients": {
        "right_subspace_overlap_top_k": 16.509336471557617,
        "right_subspace_overlap_bottom_k": -15.20195198059082,
        "interaction_matrix_overlap_top_k": 11.09233570098877,
        "interaction_matrix_overlap_bottom_k": 3.27517032623291,
        "effective_rank": 9.639944076538086,
        "effective_rank_mergeability_score": 5.114923000335693,
        "stable_rank": -0.7865902781486511,
        "spectral_gap": 2.5499067306518555,
        "singular_value_ratio": -0.0562378466129303,
        "layerwise_effective_rank": 10.091578483581543,
        "layerwise_effective_rank_mergeability_score": 11.99970531463623,
        "task_vector_cosine_similarity": -12.196418762207031,
        "task_vector_l2_distance": -9.61866569519043,
        "task_vector_dot_product": -4.159532070159912,
        "weight_space_angle": 4.019112586975098,
        "task_vector_magnitude_ratio": -2.101897954940796,
        "singular_value_overlap": -6.418807029724121,
        "subspace_overlap": 0.4599720239639282,
        "right_subspace_overlap": 11.69342041015625,
        "encoder_gradient_cosine_similarity": 8.803751945495605,
        "encoder_gradient_l2_distance": -28.447372436523438,
        "encoder_gradient_dot_product": 5.049064636230469,
        "input_gradient_cosine_similarity": 2.8171329498291016,
        "input_gradient_l2_distance": -10.783092498779297,
        "input_gradient_dot_product": -12.346527099609375
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6837504612689993,
      "val_r": 0.7189276147633015,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.6399855613708496,
        "right_subspace_overlap_bottom_k": -3.695446014404297,
        "interaction_matrix_overlap_top_k": 0.6654148697853088,
        "interaction_matrix_overlap_bottom_k": -1.5910449028015137,
        "effective_rank": 3.5655531883239746,
        "effective_rank_mergeability_score": 8.364029884338379,
        "stable_rank": -2.6399173736572266,
        "spectral_gap": -0.9255524277687073,
        "singular_value_ratio": 2.183548927307129,
        "layerwise_effective_rank": 4.838817596435547,
        "layerwise_effective_rank_mergeability_score": 0.06050168350338936,
        "task_vector_cosine_similarity": 2.4624264240264893,
        "task_vector_l2_distance": -5.223520755767822,
        "task_vector_dot_product": 0.07695663720369339,
        "weight_space_angle": 3.0180301666259766,
        "task_vector_magnitude_ratio": -2.2747232913970947,
        "singular_value_overlap": -0.3282022774219513,
        "subspace_overlap": -2.4654040336608887,
        "right_subspace_overlap": 8.780803680419922,
        "encoder_gradient_cosine_similarity": 3.978753089904785,
        "encoder_gradient_l2_distance": -12.913397789001465,
        "encoder_gradient_dot_product": 4.006263256072998,
        "input_gradient_cosine_similarity": 0.32609352469444275,
        "input_gradient_l2_distance": -8.66537094116211,
        "input_gradient_dot_product": -4.245733261108398
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6771207093304432,
      "val_r": 0.562760785804842,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 11.370861053466797,
        "right_subspace_overlap_bottom_k": -19.793846130371094,
        "interaction_matrix_overlap_top_k": 16.91474723815918,
        "interaction_matrix_overlap_bottom_k": -2.2463645935058594,
        "effective_rank": -2.9859530925750732,
        "effective_rank_mergeability_score": 8.84941291809082,
        "stable_rank": -9.922136306762695,
        "spectral_gap": -3.7297604084014893,
        "singular_value_ratio": 9.529345512390137,
        "layerwise_effective_rank": 2.6267974376678467,
        "layerwise_effective_rank_mergeability_score": -5.482705593109131,
        "task_vector_cosine_similarity": 15.630732536315918,
        "task_vector_l2_distance": -7.503546714782715,
        "task_vector_dot_product": -2.289834976196289,
        "weight_space_angle": 12.369190216064453,
        "task_vector_magnitude_ratio": -4.1878461837768555,
        "singular_value_overlap": -1.9424912929534912,
        "subspace_overlap": 7.218624591827393,
        "right_subspace_overlap": 7.678624153137207,
        "encoder_gradient_cosine_similarity": 10.127492904663086,
        "encoder_gradient_l2_distance": -15.921706199645996,
        "encoder_gradient_dot_product": 11.06100845336914,
        "input_gradient_cosine_similarity": 5.068501949310303,
        "input_gradient_l2_distance": -20.847702026367188,
        "input_gradient_dot_product": -20.592918395996094
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6902502513832667,
      "val_r": 0.49327028669520123,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.373915433883667,
        "right_subspace_overlap_bottom_k": -3.5619583129882812,
        "interaction_matrix_overlap_top_k": 3.542733907699585,
        "interaction_matrix_overlap_bottom_k": 0.8806107640266418,
        "effective_rank": 5.429708003997803,
        "effective_rank_mergeability_score": 2.325190305709839,
        "stable_rank": -4.662481784820557,
        "spectral_gap": 0.677977979183197,
        "singular_value_ratio": -2.9499404430389404,
        "layerwise_effective_rank": 0.8714336156845093,
        "layerwise_effective_rank_mergeability_score": 0.42357364296913147,
        "task_vector_cosine_similarity": 2.975113868713379,
        "task_vector_l2_distance": -1.683394193649292,
        "task_vector_dot_product": -3.214970111846924,
        "weight_space_angle": 2.0112197399139404,
        "task_vector_magnitude_ratio": 4.253445148468018,
        "singular_value_overlap": -0.8554108142852783,
        "subspace_overlap": -2.262190341949463,
        "right_subspace_overlap": 2.396235942840576,
        "encoder_gradient_cosine_similarity": 2.3141422271728516,
        "encoder_gradient_l2_distance": -5.82631254196167,
        "encoder_gradient_dot_product": 2.156752586364746,
        "input_gradient_cosine_similarity": 0.07361587136983871,
        "input_gradient_l2_distance": -5.06129789352417,
        "input_gradient_dot_product": -2.628453016281128
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6139158966397267,
      "val_r": 0.5684829030606675,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 26.99551773071289,
        "right_subspace_overlap_bottom_k": -19.896385192871094,
        "interaction_matrix_overlap_top_k": -5.858401775360107,
        "interaction_matrix_overlap_bottom_k": -33.29988098144531,
        "effective_rank": -61.70061111450195,
        "effective_rank_mergeability_score": -9.103799819946289,
        "stable_rank": -45.637386322021484,
        "spectral_gap": 24.276912689208984,
        "singular_value_ratio": 20.788732528686523,
        "layerwise_effective_rank": 59.28065490722656,
        "layerwise_effective_rank_mergeability_score": -21.271751403808594,
        "task_vector_cosine_similarity": 5.317526340484619,
        "task_vector_l2_distance": -29.817243576049805,
        "task_vector_dot_product": 54.135128021240234,
        "weight_space_angle": 22.58089256286621,
        "task_vector_magnitude_ratio": 19.47783851623535,
        "singular_value_overlap": 0.4646006226539612,
        "subspace_overlap": -22.472562789916992,
        "right_subspace_overlap": 59.21455001831055,
        "encoder_gradient_cosine_similarity": 28.748872756958008,
        "encoder_gradient_l2_distance": -61.168052673339844,
        "encoder_gradient_dot_product": 11.890721321105957,
        "input_gradient_cosine_similarity": 15.324645042419434,
        "input_gradient_l2_distance": -4.445045471191406,
        "input_gradient_dot_product": -32.82707595825195
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5566351657736085,
      "val_r": 0.4549692508470823,
      "n_iterations": 502,
      "coefficients": {
        "right_subspace_overlap_top_k": 51.527347564697266,
        "right_subspace_overlap_bottom_k": -25.373693466186523,
        "interaction_matrix_overlap_top_k": -2.2782270908355713,
        "interaction_matrix_overlap_bottom_k": -18.338947296142578,
        "effective_rank": 91.98855590820312,
        "effective_rank_mergeability_score": 115.03936004638672,
        "stable_rank": -31.801433563232422,
        "spectral_gap": 39.155296325683594,
        "singular_value_ratio": -3.3004889488220215,
        "layerwise_effective_rank": 7.482936859130859,
        "layerwise_effective_rank_mergeability_score": -107.3845443725586,
        "task_vector_cosine_similarity": -66.71881866455078,
        "task_vector_l2_distance": -33.30224609375,
        "task_vector_dot_product": 50.51726531982422,
        "weight_space_angle": -88.4361343383789,
        "task_vector_magnitude_ratio": -30.457529067993164,
        "singular_value_overlap": 1.4891736507415771,
        "subspace_overlap": -21.663787841796875,
        "right_subspace_overlap": 79.3016357421875,
        "encoder_gradient_cosine_similarity": -18.91836166381836,
        "encoder_gradient_l2_distance": 5.655179500579834,
        "encoder_gradient_dot_product": 74.22525024414062,
        "input_gradient_cosine_similarity": 44.52933883666992,
        "input_gradient_l2_distance": -151.37969970703125,
        "input_gradient_dot_product": 39.439674377441406
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5709257636377174,
      "val_r": 0.43647404198823764,
      "n_iterations": 804,
      "coefficients": {
        "right_subspace_overlap_top_k": 69.45716094970703,
        "right_subspace_overlap_bottom_k": -15.043959617614746,
        "interaction_matrix_overlap_top_k": 67.38423156738281,
        "interaction_matrix_overlap_bottom_k": -51.43782043457031,
        "effective_rank": -20.7965087890625,
        "effective_rank_mergeability_score": -81.89859771728516,
        "stable_rank": -50.456172943115234,
        "spectral_gap": 87.5328598022461,
        "singular_value_ratio": 7.410624980926514,
        "layerwise_effective_rank": 39.395965576171875,
        "layerwise_effective_rank_mergeability_score": -11.87989616394043,
        "task_vector_cosine_similarity": 38.193546295166016,
        "task_vector_l2_distance": -47.11946105957031,
        "task_vector_dot_product": 28.104564666748047,
        "weight_space_angle": -38.018131256103516,
        "task_vector_magnitude_ratio": 9.58967399597168,
        "singular_value_overlap": -10.514525413513184,
        "subspace_overlap": -38.79973220825195,
        "right_subspace_overlap": -37.614742279052734,
        "encoder_gradient_cosine_similarity": 33.59958267211914,
        "encoder_gradient_l2_distance": -34.18234634399414,
        "encoder_gradient_dot_product": 121.65654754638672,
        "input_gradient_cosine_similarity": 4.4635009765625,
        "input_gradient_l2_distance": -103.95075225830078,
        "input_gradient_dot_product": 35.92245864868164
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.659397667084712,
      "val_r": 0.26611036914620506,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.453690528869629,
        "right_subspace_overlap_bottom_k": -2.5460944175720215,
        "interaction_matrix_overlap_top_k": -0.0660906583070755,
        "interaction_matrix_overlap_bottom_k": -2.0602755546569824,
        "effective_rank": 0.752940833568573,
        "effective_rank_mergeability_score": 3.271496295928955,
        "stable_rank": 2.9769363403320312,
        "spectral_gap": -0.432425320148468,
        "singular_value_ratio": 2.276301145553589,
        "layerwise_effective_rank": -0.15978609025478363,
        "layerwise_effective_rank_mergeability_score": 1.3567626476287842,
        "task_vector_cosine_similarity": 3.5991389751434326,
        "task_vector_l2_distance": -5.188724040985107,
        "task_vector_dot_product": -4.094612121582031,
        "weight_space_angle": 1.8904316425323486,
        "task_vector_magnitude_ratio": -3.653193712234497,
        "singular_value_overlap": -0.9910544157028198,
        "subspace_overlap": -3.3678550720214844,
        "right_subspace_overlap": 8.760705947875977,
        "encoder_gradient_cosine_similarity": 3.9308009147644043,
        "encoder_gradient_l2_distance": -10.23470687866211,
        "encoder_gradient_dot_product": 3.1227807998657227,
        "input_gradient_cosine_similarity": 1.518373966217041,
        "input_gradient_l2_distance": -5.589851379394531,
        "input_gradient_dot_product": -0.5268537402153015
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.026684118795944917,
      "val_r": 0.3412605083858768,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.21472038328647614,
        "right_subspace_overlap_bottom_k": -0.368704229593277,
        "interaction_matrix_overlap_top_k": 0.6981685161590576,
        "interaction_matrix_overlap_bottom_k": -0.22596313059329987,
        "effective_rank": 0.46845507621765137,
        "effective_rank_mergeability_score": -0.10270346701145172,
        "stable_rank": 0.0017264913767576218,
        "spectral_gap": -0.5409911870956421,
        "singular_value_ratio": 0.16478222608566284,
        "layerwise_effective_rank": 0.09410392493009567,
        "layerwise_effective_rank_mergeability_score": 0.07272721081972122,
        "task_vector_cosine_similarity": -0.18091194331645966,
        "task_vector_l2_distance": -0.23897671699523926,
        "task_vector_dot_product": 0.2697652280330658,
        "weight_space_angle": -0.05914029851555824,
        "task_vector_magnitude_ratio": 0.7143641114234924,
        "singular_value_overlap": -0.5937680602073669,
        "subspace_overlap": 0.1128772646188736,
        "right_subspace_overlap": 0.5173827409744263,
        "encoder_gradient_cosine_similarity": 0.20932653546333313,
        "encoder_gradient_l2_distance": 0.08826428651809692,
        "encoder_gradient_dot_product": -0.06828498840332031,
        "input_gradient_cosine_similarity": 0.18597009778022766,
        "input_gradient_l2_distance": -0.11798095703125,
        "input_gradient_dot_product": 0.13682448863983154
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5978105385040435,
      "val_r": 0.4417539351818198,
      "n_iterations": 806,
      "coefficients": {
        "right_subspace_overlap_top_k": 93.02692413330078,
        "right_subspace_overlap_bottom_k": -77.25761413574219,
        "interaction_matrix_overlap_top_k": 24.553150177001953,
        "interaction_matrix_overlap_bottom_k": -55.95151138305664,
        "effective_rank": -48.20625686645508,
        "effective_rank_mergeability_score": 7.499451637268066,
        "stable_rank": -23.690980911254883,
        "spectral_gap": 10.717833518981934,
        "singular_value_ratio": 13.968156814575195,
        "layerwise_effective_rank": -45.79341506958008,
        "layerwise_effective_rank_mergeability_score": -56.51004409790039,
        "task_vector_cosine_similarity": 68.09501647949219,
        "task_vector_l2_distance": 46.525325775146484,
        "task_vector_dot_product": -21.348344802856445,
        "weight_space_angle": 13.287802696228027,
        "task_vector_magnitude_ratio": 45.032962799072266,
        "singular_value_overlap": 24.913707733154297,
        "subspace_overlap": 30.985841751098633,
        "right_subspace_overlap": 13.31196403503418,
        "encoder_gradient_cosine_similarity": 4.058264255523682,
        "encoder_gradient_l2_distance": 12.97447681427002,
        "encoder_gradient_dot_product": 49.34876251220703,
        "input_gradient_cosine_similarity": 26.96826934814453,
        "input_gradient_l2_distance": -76.56171417236328,
        "input_gradient_dot_product": -78.94986724853516
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5902291140106712,
      "val_r": 0.21847658746943538,
      "n_iterations": 425,
      "coefficients": {
        "right_subspace_overlap_top_k": 42.39413833618164,
        "right_subspace_overlap_bottom_k": -17.67967414855957,
        "interaction_matrix_overlap_top_k": 31.120384216308594,
        "interaction_matrix_overlap_bottom_k": 0.23338955640792847,
        "effective_rank": 29.830162048339844,
        "effective_rank_mergeability_score": 52.30778503417969,
        "stable_rank": -115.5929183959961,
        "spectral_gap": -35.83604049682617,
        "singular_value_ratio": 66.97175598144531,
        "layerwise_effective_rank": 23.441162109375,
        "layerwise_effective_rank_mergeability_score": -51.22582244873047,
        "task_vector_cosine_similarity": 60.935428619384766,
        "task_vector_l2_distance": 10.248490333557129,
        "task_vector_dot_product": 3.5813472270965576,
        "weight_space_angle": -12.146636009216309,
        "task_vector_magnitude_ratio": -52.0915412902832,
        "singular_value_overlap": 47.36117172241211,
        "subspace_overlap": -46.00664138793945,
        "right_subspace_overlap": 8.1957368850708,
        "encoder_gradient_cosine_similarity": 39.62770462036133,
        "encoder_gradient_l2_distance": -79.95745849609375,
        "encoder_gradient_dot_product": 35.00328063964844,
        "input_gradient_cosine_similarity": -4.928718566894531,
        "input_gradient_l2_distance": -60.78287887573242,
        "input_gradient_dot_product": 25.99305534362793
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.704532694397987,
      "val_r": 0.7027827769622037,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.24968147277832,
        "right_subspace_overlap_bottom_k": -2.6405181884765625,
        "interaction_matrix_overlap_top_k": 0.1740407645702362,
        "interaction_matrix_overlap_bottom_k": -0.16948729753494263,
        "effective_rank": 0.3221634030342102,
        "effective_rank_mergeability_score": 0.924318790435791,
        "stable_rank": 0.3408426344394684,
        "spectral_gap": 1.268438458442688,
        "singular_value_ratio": 0.7337084412574768,
        "layerwise_effective_rank": 1.2363492250442505,
        "layerwise_effective_rank_mergeability_score": 0.3539445102214813,
        "task_vector_cosine_similarity": -0.8145534992218018,
        "task_vector_l2_distance": -1.3721877336502075,
        "task_vector_dot_product": 0.2093021124601364,
        "weight_space_angle": 2.137883424758911,
        "task_vector_magnitude_ratio": -0.34138453006744385,
        "singular_value_overlap": -0.28931331634521484,
        "subspace_overlap": -0.7480429410934448,
        "right_subspace_overlap": 2.1907029151916504,
        "encoder_gradient_cosine_similarity": 1.3220607042312622,
        "encoder_gradient_l2_distance": -4.252832412719727,
        "encoder_gradient_dot_product": 1.2749375104904175,
        "input_gradient_cosine_similarity": 0.15900030732154846,
        "input_gradient_l2_distance": -3.2705647945404053,
        "input_gradient_dot_product": -1.9989144802093506
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5388832538366963,
      "val_r": 0.7028412508240647,
      "n_iterations": 799,
      "coefficients": {
        "right_subspace_overlap_top_k": 114.86746978759766,
        "right_subspace_overlap_bottom_k": -92.87462615966797,
        "interaction_matrix_overlap_top_k": 80.49569702148438,
        "interaction_matrix_overlap_bottom_k": -70.75859832763672,
        "effective_rank": -39.3358039855957,
        "effective_rank_mergeability_score": -153.00323486328125,
        "stable_rank": 97.77800750732422,
        "spectral_gap": 50.088279724121094,
        "singular_value_ratio": 1.8461596965789795,
        "layerwise_effective_rank": -103.61890411376953,
        "layerwise_effective_rank_mergeability_score": 73.63704681396484,
        "task_vector_cosine_similarity": -99.98285675048828,
        "task_vector_l2_distance": 59.354190826416016,
        "task_vector_dot_product": 38.45291519165039,
        "weight_space_angle": -21.98729705810547,
        "task_vector_magnitude_ratio": -1.654091238975525,
        "singular_value_overlap": -5.520482540130615,
        "subspace_overlap": 65.44847106933594,
        "right_subspace_overlap": 37.91646194458008,
        "encoder_gradient_cosine_similarity": 128.93812561035156,
        "encoder_gradient_l2_distance": -75.85507202148438,
        "encoder_gradient_dot_product": 5.51995325088501,
        "input_gradient_cosine_similarity": -48.43157958984375,
        "input_gradient_l2_distance": -12.788911819458008,
        "input_gradient_dot_product": -27.533349990844727
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6128980761413436,
      "val_r": 0.6877121504645918,
      "n_iterations": 754,
      "coefficients": {
        "right_subspace_overlap_top_k": -20.3190860748291,
        "right_subspace_overlap_bottom_k": -7.992713451385498,
        "interaction_matrix_overlap_top_k": 103.00154113769531,
        "interaction_matrix_overlap_bottom_k": -33.0210075378418,
        "effective_rank": 31.011348724365234,
        "effective_rank_mergeability_score": -8.183887481689453,
        "stable_rank": -41.441986083984375,
        "spectral_gap": 5.478028297424316,
        "singular_value_ratio": 82.65080261230469,
        "layerwise_effective_rank": -37.451271057128906,
        "layerwise_effective_rank_mergeability_score": -7.344688892364502,
        "task_vector_cosine_similarity": 41.153053283691406,
        "task_vector_l2_distance": -24.621559143066406,
        "task_vector_dot_product": 21.979019165039062,
        "weight_space_angle": -8.679244041442871,
        "task_vector_magnitude_ratio": -59.85881042480469,
        "singular_value_overlap": 1.140635371208191,
        "subspace_overlap": 1.0689197778701782,
        "right_subspace_overlap": -11.37098217010498,
        "encoder_gradient_cosine_similarity": 36.01760482788086,
        "encoder_gradient_l2_distance": -50.04277420043945,
        "encoder_gradient_dot_product": 33.24822998046875,
        "input_gradient_cosine_similarity": 38.810001373291016,
        "input_gradient_l2_distance": -41.53047561645508,
        "input_gradient_dot_product": -42.70278549194336
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4809083656875949,
      "val_r": 0.5221004526218799,
      "n_iterations": 858,
      "coefficients": {
        "right_subspace_overlap_top_k": 194.17291259765625,
        "right_subspace_overlap_bottom_k": -85.35838317871094,
        "interaction_matrix_overlap_top_k": -13.590764999389648,
        "interaction_matrix_overlap_bottom_k": 60.53139877319336,
        "effective_rank": -15.32730484008789,
        "effective_rank_mergeability_score": -66.46944427490234,
        "stable_rank": -88.16410827636719,
        "spectral_gap": -74.32254028320312,
        "singular_value_ratio": 16.395668029785156,
        "layerwise_effective_rank": 13.576980590820312,
        "layerwise_effective_rank_mergeability_score": 149.2571563720703,
        "task_vector_cosine_similarity": 243.54554748535156,
        "task_vector_l2_distance": -52.72982406616211,
        "task_vector_dot_product": 18.177898406982422,
        "weight_space_angle": -93.9410171508789,
        "task_vector_magnitude_ratio": 44.56228256225586,
        "singular_value_overlap": 45.95026397705078,
        "subspace_overlap": -83.76570129394531,
        "right_subspace_overlap": -157.42039489746094,
        "encoder_gradient_cosine_similarity": 59.57744216918945,
        "encoder_gradient_l2_distance": 14.34050178527832,
        "encoder_gradient_dot_product": 123.80430603027344,
        "input_gradient_cosine_similarity": -0.10205025970935822,
        "input_gradient_l2_distance": -128.66871643066406,
        "input_gradient_dot_product": -123.03402709960938
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7523990435706305,
      "val_r": 0.7648244425182564,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 11.24205493927002,
        "right_subspace_overlap_bottom_k": -8.87767505645752,
        "interaction_matrix_overlap_top_k": 14.644187927246094,
        "interaction_matrix_overlap_bottom_k": 0.9644711017608643,
        "effective_rank": -3.5536251068115234,
        "effective_rank_mergeability_score": 9.664801597595215,
        "stable_rank": 18.497974395751953,
        "spectral_gap": 6.681545257568359,
        "singular_value_ratio": 11.458066940307617,
        "layerwise_effective_rank": -6.762487411499023,
        "layerwise_effective_rank_mergeability_score": -1.9683787822723389,
        "task_vector_cosine_similarity": -9.587102890014648,
        "task_vector_l2_distance": -10.13046932220459,
        "task_vector_dot_product": 12.66232967376709,
        "weight_space_angle": 0.3732554614543915,
        "task_vector_magnitude_ratio": -10.247685432434082,
        "singular_value_overlap": 2.2822329998016357,
        "subspace_overlap": -19.43990135192871,
        "right_subspace_overlap": 3.1440911293029785,
        "encoder_gradient_cosine_similarity": 2.092855453491211,
        "encoder_gradient_l2_distance": -11.071854591369629,
        "encoder_gradient_dot_product": 5.231098175048828,
        "input_gradient_cosine_similarity": 1.3134642839431763,
        "input_gradient_l2_distance": -11.608409881591797,
        "input_gradient_dot_product": -6.005901336669922
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5322329389677694,
      "val_r": 0.47704444768233634,
      "n_iterations": 489,
      "coefficients": {
        "right_subspace_overlap_top_k": -40.916839599609375,
        "right_subspace_overlap_bottom_k": -43.80784606933594,
        "interaction_matrix_overlap_top_k": 132.64141845703125,
        "interaction_matrix_overlap_bottom_k": -30.936235427856445,
        "effective_rank": 15.859237670898438,
        "effective_rank_mergeability_score": -47.339195251464844,
        "stable_rank": -57.85771942138672,
        "spectral_gap": -50.49928665161133,
        "singular_value_ratio": -21.69800567626953,
        "layerwise_effective_rank": -74.0440673828125,
        "layerwise_effective_rank_mergeability_score": 4.171014785766602,
        "task_vector_cosine_similarity": 26.61461067199707,
        "task_vector_l2_distance": -39.42531967163086,
        "task_vector_dot_product": 18.969587326049805,
        "weight_space_angle": -30.335405349731445,
        "task_vector_magnitude_ratio": 25.252365112304688,
        "singular_value_overlap": 15.85074520111084,
        "subspace_overlap": 64.42965698242188,
        "right_subspace_overlap": 61.1020622253418,
        "encoder_gradient_cosine_similarity": 93.99760437011719,
        "encoder_gradient_l2_distance": -26.77532958984375,
        "encoder_gradient_dot_product": 94.71672821044922,
        "input_gradient_cosine_similarity": 22.287900924682617,
        "input_gradient_l2_distance": -47.12602615356445,
        "input_gradient_dot_product": -64.13469696044922
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7494386847265531,
      "val_r": 0.4877860126036708,
      "n_iterations": 961,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.1700059473514557,
        "right_subspace_overlap_bottom_k": -0.8499748110771179,
        "interaction_matrix_overlap_top_k": -0.26428574323654175,
        "interaction_matrix_overlap_bottom_k": 0.8789678812026978,
        "effective_rank": 0.2148408740758896,
        "effective_rank_mergeability_score": -0.28579601645469666,
        "stable_rank": -0.6074293255805969,
        "spectral_gap": 0.1639944463968277,
        "singular_value_ratio": 0.5880624651908875,
        "layerwise_effective_rank": 0.5493453741073608,
        "layerwise_effective_rank_mergeability_score": 0.5326855778694153,
        "task_vector_cosine_similarity": 0.2570246756076813,
        "task_vector_l2_distance": -0.0690900981426239,
        "task_vector_dot_product": 0.09940598905086517,
        "weight_space_angle": 0.21297915279865265,
        "task_vector_magnitude_ratio": -0.336761474609375,
        "singular_value_overlap": -0.021205950528383255,
        "subspace_overlap": -0.11029504984617233,
        "right_subspace_overlap": 0.14213325083255768,
        "encoder_gradient_cosine_similarity": 0.017892614006996155,
        "encoder_gradient_l2_distance": -0.12681050598621368,
        "encoder_gradient_dot_product": 0.045677512884140015,
        "input_gradient_cosine_similarity": 0.0061901467852294445,
        "input_gradient_l2_distance": -0.15176402032375336,
        "input_gradient_dot_product": -0.05604821816086769
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6383136787414607,
      "val_r": 0.1403309935427412,
      "n_iterations": 690,
      "coefficients": {
        "right_subspace_overlap_top_k": 29.902870178222656,
        "right_subspace_overlap_bottom_k": 19.41661262512207,
        "interaction_matrix_overlap_top_k": 83.57173919677734,
        "interaction_matrix_overlap_bottom_k": -33.63555145263672,
        "effective_rank": -31.877775192260742,
        "effective_rank_mergeability_score": -77.27506256103516,
        "stable_rank": -59.65348434448242,
        "spectral_gap": 9.711835861206055,
        "singular_value_ratio": 29.917593002319336,
        "layerwise_effective_rank": 40.555171966552734,
        "layerwise_effective_rank_mergeability_score": 92.78167724609375,
        "task_vector_cosine_similarity": 42.78835678100586,
        "task_vector_l2_distance": -59.73001480102539,
        "task_vector_dot_product": 9.277902603149414,
        "weight_space_angle": 15.56783676147461,
        "task_vector_magnitude_ratio": 24.410852432250977,
        "singular_value_overlap": -43.37433624267578,
        "subspace_overlap": 28.526386260986328,
        "right_subspace_overlap": 8.433370590209961,
        "encoder_gradient_cosine_similarity": 70.0314712524414,
        "encoder_gradient_l2_distance": -125.55601501464844,
        "encoder_gradient_dot_product": 7.3838276863098145,
        "input_gradient_cosine_similarity": -18.20299530029297,
        "input_gradient_l2_distance": -48.299495697021484,
        "input_gradient_dot_product": -13.674935340881348
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6183491544259063,
      "val_r": 0.5173764726094082,
      "n_iterations": 616,
      "coefficients": {
        "right_subspace_overlap_top_k": -16.66564178466797,
        "right_subspace_overlap_bottom_k": 16.813312530517578,
        "interaction_matrix_overlap_top_k": 15.425193786621094,
        "interaction_matrix_overlap_bottom_k": -0.6418673396110535,
        "effective_rank": 27.20210838317871,
        "effective_rank_mergeability_score": -14.536968231201172,
        "stable_rank": 9.939421653747559,
        "spectral_gap": -19.14881706237793,
        "singular_value_ratio": -33.53507614135742,
        "layerwise_effective_rank": -18.383085250854492,
        "layerwise_effective_rank_mergeability_score": 51.29327392578125,
        "task_vector_cosine_similarity": 35.048030853271484,
        "task_vector_l2_distance": -48.63999938964844,
        "task_vector_dot_product": 57.016441345214844,
        "weight_space_angle": 15.380653381347656,
        "task_vector_magnitude_ratio": -0.17484396696090698,
        "singular_value_overlap": -39.81974411010742,
        "subspace_overlap": 42.38469314575195,
        "right_subspace_overlap": -29.200830459594727,
        "encoder_gradient_cosine_similarity": 49.011695861816406,
        "encoder_gradient_l2_distance": 20.13153076171875,
        "encoder_gradient_dot_product": -4.508090972900391,
        "input_gradient_cosine_similarity": 35.12202072143555,
        "input_gradient_l2_distance": -147.3697052001953,
        "input_gradient_dot_product": -1.1461009979248047
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}