{
  "excluded_metrics": [
    "task_vector_cosine_similarity",
    "task_vector_dot_product",
    "task_vector_l2_distance",
    "task_vector_magnitude_ratio",
    "weight_space_angle"
  ],
  "n_metrics_used": 24,
  "metrics_used": [
    "right_subspace_overlap_top_k",
    "right_subspace_overlap_bottom_k",
    "interaction_matrix_overlap_top_k",
    "interaction_matrix_overlap_bottom_k",
    "effective_rank",
    "effective_rank_mergeability_score",
    "stable_rank",
    "spectral_gap",
    "singular_value_ratio",
    "layerwise_effective_rank",
    "layerwise_effective_rank_mergeability_score",
    "singular_value_overlap",
    "subspace_overlap",
    "right_subspace_overlap",
    "activation_l2_distance",
    "activation_cosine_similarity",
    "activation_magnitude_ratio",
    "activation_dot_product",
    "encoder_gradient_cosine_similarity",
    "encoder_gradient_l2_distance",
    "encoder_gradient_dot_product",
    "input_gradient_cosine_similarity",
    "input_gradient_l2_distance",
    "input_gradient_dot_product"
  ],
  "methods": {
    "weight_avg": {
      "aggregate_metrics": {
        "train_r": 0.24321332424059944,
        "train_p": 1.3356030775018332e-44,
        "val_r": 0.16969554671155934,
        "val_p": 0.0012686993272305021
      },
      "per_fold_stats": {
        "train_r_mean": 0.6737788837351036,
        "train_r_std": 0.16036575846408999,
        "val_r_mean": 0.5032944983265961,
        "val_r_std": 0.24533633061389143
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 29.923198699951172,
        "right_subspace_overlap_bottom_k": -10.144109725952148,
        "interaction_matrix_overlap_top_k": 12.671030044555664,
        "interaction_matrix_overlap_bottom_k": -0.8807390332221985,
        "effective_rank": 0.29870548844337463,
        "effective_rank_mergeability_score": -1.990128755569458,
        "stable_rank": -5.9369049072265625,
        "spectral_gap": -5.73242712020874,
        "singular_value_ratio": -15.533482551574707,
        "layerwise_effective_rank": -2.445176362991333,
        "layerwise_effective_rank_mergeability_score": -5.340041637420654,
        "singular_value_overlap": 4.114165782928467,
        "subspace_overlap": 5.891267776489258,
        "right_subspace_overlap": 5.781153202056885,
        "activation_l2_distance": -9.188437461853027,
        "activation_cosine_similarity": 21.343982696533203,
        "activation_magnitude_ratio": -10.236796379089355,
        "activation_dot_product": 14.112627029418945,
        "encoder_gradient_cosine_similarity": 20.656883239746094,
        "encoder_gradient_l2_distance": -20.630489349365234,
        "encoder_gradient_dot_product": 5.564703941345215,
        "input_gradient_cosine_similarity": 22.066795349121094,
        "input_gradient_l2_distance": -25.119680404663086,
        "input_gradient_dot_product": -28.24483871459961
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 67.34864044189453,
        "right_subspace_overlap_bottom_k": 18.757143020629883,
        "interaction_matrix_overlap_top_k": 24.30814552307129,
        "interaction_matrix_overlap_bottom_k": 57.056427001953125,
        "effective_rank": 17.388412475585938,
        "effective_rank_mergeability_score": 29.018451690673828,
        "stable_rank": 33.6640739440918,
        "spectral_gap": 28.734027862548828,
        "singular_value_ratio": 75.260009765625,
        "layerwise_effective_rank": 16.16051483154297,
        "layerwise_effective_rank_mergeability_score": 57.31739807128906,
        "singular_value_overlap": 10.781160354614258,
        "subspace_overlap": 15.491127967834473,
        "right_subspace_overlap": 21.175626754760742,
        "activation_l2_distance": 19.662403106689453,
        "activation_cosine_similarity": 53.65087890625,
        "activation_magnitude_ratio": 22.500125885009766,
        "activation_dot_product": 25.764963150024414,
        "encoder_gradient_cosine_similarity": 46.81007766723633,
        "encoder_gradient_l2_distance": 19.402572631835938,
        "encoder_gradient_dot_product": 12.72139835357666,
        "input_gradient_cosine_similarity": 67.79020690917969,
        "input_gradient_l2_distance": 22.032320022583008,
        "input_gradient_dot_product": 59.38526153564453
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7121420910281249,
          "val_r": 0.5031965450847742,
          "n_iterations": 977,
          "coefficients": {
            "right_subspace_overlap_top_k": 35.53596496582031,
            "right_subspace_overlap_bottom_k": -19.701066970825195,
            "interaction_matrix_overlap_top_k": -2.7738521099090576,
            "interaction_matrix_overlap_bottom_k": 0.5659106373786926,
            "effective_rank": -8.596423149108887,
            "effective_rank_mergeability_score": 3.937828540802002,
            "stable_rank": -7.490433216094971,
            "spectral_gap": 5.257785797119141,
            "singular_value_ratio": 7.523526668548584,
            "layerwise_effective_rank": 12.240213394165039,
            "layerwise_effective_rank_mergeability_score": -2.605897903442383,
            "singular_value_overlap": -0.8168977499008179,
            "subspace_overlap": -6.567772388458252,
            "right_subspace_overlap": 5.598260402679443,
            "activation_l2_distance": 4.064518928527832,
            "activation_cosine_similarity": 32.83512878417969,
            "activation_magnitude_ratio": -8.837263107299805,
            "activation_dot_product": 1.9137041568756104,
            "encoder_gradient_cosine_similarity": 5.976358890533447,
            "encoder_gradient_l2_distance": -5.630343914031982,
            "encoder_gradient_dot_product": 6.704716205596924,
            "input_gradient_cosine_similarity": 10.443083763122559,
            "input_gradient_l2_distance": -44.40338897705078,
            "input_gradient_dot_product": -24.175195693969727
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7161444051404551,
          "val_r": 0.8040140366427124,
          "n_iterations": 979,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.5078394412994385,
            "right_subspace_overlap_bottom_k": -5.487580299377441,
            "interaction_matrix_overlap_top_k": 3.3367135524749756,
            "interaction_matrix_overlap_bottom_k": -8.533060073852539,
            "effective_rank": 3.072209358215332,
            "effective_rank_mergeability_score": 7.508904933929443,
            "stable_rank": 2.0721728801727295,
            "spectral_gap": 18.27300262451172,
            "singular_value_ratio": 16.549415588378906,
            "layerwise_effective_rank": -8.61815071105957,
            "layerwise_effective_rank_mergeability_score": -6.847635746002197,
            "singular_value_overlap": 3.5723516941070557,
            "subspace_overlap": -3.769291639328003,
            "right_subspace_overlap": 14.920522689819336,
            "activation_l2_distance": -8.849101066589355,
            "activation_cosine_similarity": 1.6945377588272095,
            "activation_magnitude_ratio": -1.827242136001587,
            "activation_dot_product": 13.829036712646484,
            "encoder_gradient_cosine_similarity": 4.935365676879883,
            "encoder_gradient_l2_distance": -29.951974868774414,
            "encoder_gradient_dot_product": 4.715671539306641,
            "input_gradient_cosine_similarity": 4.4250288009643555,
            "input_gradient_l2_distance": -17.157360076904297,
            "input_gradient_dot_product": -10.372819900512695
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7264945881000596,
          "val_r": 0.7122515302116154,
          "n_iterations": 685,
          "coefficients": {
            "right_subspace_overlap_top_k": 10.600981712341309,
            "right_subspace_overlap_bottom_k": -16.713817596435547,
            "interaction_matrix_overlap_top_k": 24.072681427001953,
            "interaction_matrix_overlap_bottom_k": -16.683923721313477,
            "effective_rank": -2.1806037425994873,
            "effective_rank_mergeability_score": 10.108807563781738,
            "stable_rank": -3.294917345046997,
            "spectral_gap": 4.818902969360352,
            "singular_value_ratio": 9.169554710388184,
            "layerwise_effective_rank": -7.836231708526611,
            "layerwise_effective_rank_mergeability_score": -9.69926643371582,
            "singular_value_overlap": 2.4161126613616943,
            "subspace_overlap": 9.4708251953125,
            "right_subspace_overlap": 14.486412048339844,
            "activation_l2_distance": 1.059071660041809,
            "activation_cosine_similarity": 23.213523864746094,
            "activation_magnitude_ratio": -7.008007049560547,
            "activation_dot_product": 17.1151123046875,
            "encoder_gradient_cosine_similarity": 8.495945930480957,
            "encoder_gradient_l2_distance": -40.81058883666992,
            "encoder_gradient_dot_product": 7.379431247711182,
            "input_gradient_cosine_similarity": 12.342602729797363,
            "input_gradient_l2_distance": -24.949092864990234,
            "input_gradient_dot_product": -24.575773239135742
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.2989723700349547,
          "val_r": 0.202461301381188,
          "n_iterations": 822,
          "coefficients": {
            "right_subspace_overlap_top_k": 311.9278564453125,
            "right_subspace_overlap_bottom_k": 45.13705062866211,
            "interaction_matrix_overlap_top_k": 105.15354919433594,
            "interaction_matrix_overlap_bottom_k": 231.79421997070312,
            "effective_rank": -50.411582946777344,
            "effective_rank_mergeability_score": -109.51924896240234,
            "stable_rank": -148.86453247070312,
            "spectral_gap": -126.84222412109375,
            "singular_value_ratio": -341.222412109375,
            "layerwise_effective_rank": -37.82576370239258,
            "layerwise_effective_rank_mergeability_score": -245.3921661376953,
            "singular_value_overlap": 47.64558410644531,
            "subspace_overlap": -11.218626976013184,
            "right_subspace_overlap": -52.072044372558594,
            "activation_l2_distance": -45.746456146240234,
            "activation_cosine_similarity": 250.0570068359375,
            "activation_magnitude_ratio": -94.69527435302734,
            "activation_dot_product": 121.43932342529297,
            "encoder_gradient_cosine_similarity": 219.2974090576172,
            "encoder_gradient_l2_distance": -1.9678473472595215,
            "encoder_gradient_dot_product": -26.97553253173828,
            "input_gradient_cosine_similarity": 316.4059753417969,
            "input_gradient_l2_distance": -73.4978256225586,
            "input_gradient_dot_product": -281.6084289550781
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7275762120087739,
          "val_r": 0.7122774142914976,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.74330997467041,
            "right_subspace_overlap_bottom_k": -11.175572395324707,
            "interaction_matrix_overlap_top_k": -2.095107078552246,
            "interaction_matrix_overlap_bottom_k": -4.09853982925415,
            "effective_rank": -2.9909744262695312,
            "effective_rank_mergeability_score": 1.4379851818084717,
            "stable_rank": 0.6595509052276611,
            "spectral_gap": 3.330216646194458,
            "singular_value_ratio": 4.384298801422119,
            "layerwise_effective_rank": 2.417710065841675,
            "layerwise_effective_rank_mergeability_score": 2.4904303550720215,
            "singular_value_overlap": 1.328108310699463,
            "subspace_overlap": -1.498388648033142,
            "right_subspace_overlap": 13.948307037353516,
            "activation_l2_distance": -2.338834047317505,
            "activation_cosine_similarity": 8.606063842773438,
            "activation_magnitude_ratio": -1.063188910484314,
            "activation_dot_product": 6.316108226776123,
            "encoder_gradient_cosine_similarity": 4.851066589355469,
            "encoder_gradient_l2_distance": -15.326361656188965,
            "encoder_gradient_dot_product": 4.251776695251465,
            "input_gradient_cosine_similarity": 4.29746150970459,
            "input_gradient_l2_distance": -16.542911529541016,
            "input_gradient_dot_product": -9.933989524841309
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.13459628869023982,
          "val_r": 0.059729777568229156,
          "n_iterations": 51,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.3807962238788605,
            "right_subspace_overlap_bottom_k": -0.5065087080001831,
            "interaction_matrix_overlap_top_k": -0.3801059126853943,
            "interaction_matrix_overlap_bottom_k": -0.6223934292793274,
            "effective_rank": 0.471926212310791,
            "effective_rank_mergeability_score": 0.5102970004081726,
            "stable_rank": -0.36171892285346985,
            "spectral_gap": 0.5695211887359619,
            "singular_value_ratio": -0.2251194417476654,
            "layerwise_effective_rank": -0.3297889828681946,
            "layerwise_effective_rank_mergeability_score": 0.3796103894710541,
            "singular_value_overlap": 0.12687671184539795,
            "subspace_overlap": 0.1779066026210785,
            "right_subspace_overlap": -0.42596760392189026,
            "activation_l2_distance": 0.5048025846481323,
            "activation_cosine_similarity": 0.45081713795661926,
            "activation_magnitude_ratio": -0.3131135404109955,
            "activation_dot_product": 0.012651152908802032,
            "encoder_gradient_cosine_similarity": 0.4039915204048157,
            "encoder_gradient_l2_distance": -0.12845169007778168,
            "encoder_gradient_dot_product": -0.0031546251848340034,
            "input_gradient_cosine_similarity": 0.42448848485946655,
            "input_gradient_l2_distance": -0.025794606655836105,
            "input_gradient_dot_product": -0.03583447262644768
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.6917316526095062,
          "val_r": 0.45839049914647345,
          "n_iterations": 893,
          "coefficients": {
            "right_subspace_overlap_top_k": 77.24364471435547,
            "right_subspace_overlap_bottom_k": -24.72637367248535,
            "interaction_matrix_overlap_top_k": 29.249021530151367,
            "interaction_matrix_overlap_bottom_k": -65.5291976928711,
            "effective_rank": 0.4337623119354248,
            "effective_rank_mergeability_score": -4.642549991607666,
            "stable_rank": 17.224390029907227,
            "spectral_gap": 4.602863311767578,
            "singular_value_ratio": -6.579765319824219,
            "layerwise_effective_rank": 17.633310317993164,
            "layerwise_effective_rank_mergeability_score": 41.494720458984375,
            "singular_value_overlap": -2.2937068939208984,
            "subspace_overlap": -2.3058359622955322,
            "right_subspace_overlap": -5.820679187774658,
            "activation_l2_distance": -31.986656188964844,
            "activation_cosine_similarity": 1.4521076679229736,
            "activation_magnitude_ratio": 0.835326075553894,
            "activation_dot_product": 4.030367374420166,
            "encoder_gradient_cosine_similarity": 45.46967315673828,
            "encoder_gradient_l2_distance": -36.74824905395508,
            "encoder_gradient_dot_product": 38.60593032836914,
            "input_gradient_cosine_similarity": -0.1472739428281784,
            "input_gradient_l2_distance": -63.123722076416016,
            "input_gradient_dot_product": -33.3727912902832
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7818637858192218,
          "val_r": 0.4260946254949668,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.45489510893821716,
            "right_subspace_overlap_bottom_k": -3.1078853607177734,
            "interaction_matrix_overlap_top_k": -1.5976710319519043,
            "interaction_matrix_overlap_bottom_k": 2.990208864212036,
            "effective_rank": 0.6338799595832825,
            "effective_rank_mergeability_score": -0.6311330795288086,
            "stable_rank": -0.75898277759552,
            "spectral_gap": 0.31910276412963867,
            "singular_value_ratio": 0.4269951581954956,
            "layerwise_effective_rank": 0.06873010098934174,
            "layerwise_effective_rank_mergeability_score": 0.6910304427146912,
            "singular_value_overlap": -0.0967569500207901,
            "subspace_overlap": 0.39181092381477356,
            "right_subspace_overlap": 0.8015221953392029,
            "activation_l2_distance": 0.3543247878551483,
            "activation_cosine_similarity": 0.7631135582923889,
            "activation_magnitude_ratio": -0.010478322394192219,
            "activation_dot_product": -0.1634347289800644,
            "encoder_gradient_cosine_similarity": 0.07551097869873047,
            "encoder_gradient_l2_distance": -0.5330403447151184,
            "encoder_gradient_dot_product": -0.029729001224040985,
            "input_gradient_cosine_similarity": 0.09932780265808105,
            "input_gradient_l2_distance": -0.20978917181491852,
            "input_gradient_dot_product": 0.06730777770280838
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.7478160560521236,
          "val_r": 0.217864174673657,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": -0.7945609092712402,
            "right_subspace_overlap_bottom_k": -25.162765502929688,
            "interaction_matrix_overlap_top_k": 7.995614528656006,
            "interaction_matrix_overlap_bottom_k": -3.7278048992156982,
            "effective_rank": -14.561978340148926,
            "effective_rank_mergeability_score": 14.486581802368164,
            "stable_rank": 11.727489471435547,
            "spectral_gap": -9.584914207458496,
            "singular_value_ratio": 6.56268310546875,
            "layerwise_effective_rank": -7.465231895446777,
            "layerwise_effective_rank_mergeability_score": 3.791034698486328,
            "singular_value_overlap": 2.8713247776031494,
            "subspace_overlap": 13.105937957763672,
            "right_subspace_overlap": 16.71063232421875,
            "activation_l2_distance": 0.6444698572158813,
            "activation_cosine_similarity": 20.6313419342041,
            "activation_magnitude_ratio": 4.034377098083496,
            "activation_dot_product": 4.431493282318115,
            "encoder_gradient_cosine_similarity": 13.93678092956543,
            "encoder_gradient_l2_distance": -15.592002868652344,
            "encoder_gradient_dot_product": 5.297479629516602,
            "input_gradient_cosine_similarity": 5.657290458679199,
            "input_gradient_l2_distance": -34.834327697753906,
            "input_gradient_dot_product": -19.16243553161621
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6705820876292603,
          "val_r": 0.5014903964166735,
          "n_iterations": 729,
          "coefficients": {
            "right_subspace_overlap_top_k": 26.607677459716797,
            "right_subspace_overlap_bottom_k": -11.914787292480469,
            "interaction_matrix_overlap_top_k": 30.35012435913086,
            "interaction_matrix_overlap_bottom_k": -33.19498062133789,
            "effective_rank": 3.809415340423584,
            "effective_rank_mergeability_score": 13.329366683959961,
            "stable_rank": 11.024301528930664,
            "spectral_gap": -9.303595542907715,
            "singular_value_ratio": -12.750418663024902,
            "layerwise_effective_rank": -18.13887596130371,
            "layerwise_effective_rank_mergeability_score": 3.674454927444458,
            "singular_value_overlap": 7.348223686218262,
            "subspace_overlap": 27.71588134765625,
            "right_subspace_overlap": 12.961286544799805,
            "activation_l2_distance": 11.432286262512207,
            "activation_cosine_similarity": -5.223141670227051,
            "activation_magnitude_ratio": -3.2267568111419678,
            "activation_dot_product": 16.9110050201416,
            "encoder_gradient_cosine_similarity": 26.364097595214844,
            "encoder_gradient_l2_distance": -31.817142486572266,
            "encoder_gradient_dot_product": 8.793128967285156,
            "input_gradient_cosine_similarity": 17.054567337036133,
            "input_gradient_l2_distance": -49.823219299316406,
            "input_gradient_dot_product": -40.98501968383789
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7722742329162947,
          "val_r": 0.2889026577503253,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.47611141204834,
            "right_subspace_overlap_bottom_k": -4.303760528564453,
            "interaction_matrix_overlap_top_k": 0.27359703183174133,
            "interaction_matrix_overlap_bottom_k": 1.1805673837661743,
            "effective_rank": 1.3466981649398804,
            "effective_rank_mergeability_score": 1.497442364692688,
            "stable_rank": -0.2796474099159241,
            "spectral_gap": 1.0534954071044922,
            "singular_value_ratio": 0.9219269752502441,
            "layerwise_effective_rank": -1.5359278917312622,
            "layerwise_effective_rank_mergeability_score": -1.125542402267456,
            "singular_value_overlap": 0.6607012748718262,
            "subspace_overlap": -3.660885810852051,
            "right_subspace_overlap": 2.4284980297088623,
            "activation_l2_distance": 1.1305280923843384,
            "activation_cosine_similarity": 6.780707359313965,
            "activation_magnitude_ratio": -0.5891835689544678,
            "activation_dot_product": 0.012958774343132973,
            "encoder_gradient_cosine_similarity": 0.6359961032867432,
            "encoder_gradient_l2_distance": -5.805887222290039,
            "encoder_gradient_dot_product": 0.5492598414421082,
            "input_gradient_cosine_similarity": 1.0021209716796875,
            "input_gradient_l2_distance": -3.4920358657836914,
            "input_gradient_dot_product": -1.1587938070297241
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7397700561386569,
          "val_r": 0.749096718583626,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 6.768495559692383,
            "right_subspace_overlap_bottom_k": 1.582855224609375,
            "interaction_matrix_overlap_top_k": -5.130660057067871,
            "interaction_matrix_overlap_bottom_k": -9.417582511901855,
            "effective_rank": -0.8531336188316345,
            "effective_rank_mergeability_score": 4.893632888793945,
            "stable_rank": -1.129515290260315,
            "spectral_gap": 0.16712096333503723,
            "singular_value_ratio": 1.7824628353118896,
            "layerwise_effective_rank": 2.404609441757202,
            "layerwise_effective_rank_mergeability_score": -1.640493392944336,
            "singular_value_overlap": 0.9443963766098022,
            "subspace_overlap": -0.09792424738407135,
            "right_subspace_overlap": 7.7312211990356445,
            "activation_l2_distance": 2.129016399383545,
            "activation_cosine_similarity": 8.574955940246582,
            "activation_magnitude_ratio": -1.305867075920105,
            "activation_dot_product": 3.7000293731689453,
            "encoder_gradient_cosine_similarity": 2.6545679569244385,
            "encoder_gradient_l2_distance": -12.875205039978027,
            "encoder_gradient_dot_product": 0.9881574511528015,
            "input_gradient_cosine_similarity": 2.785982370376587,
            "input_gradient_l2_distance": -9.402982711791992,
            "input_gradient_dot_product": -4.2554168701171875
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7966875251616099,
          "val_r": 0.7626395555446668,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.5480037927627563,
            "right_subspace_overlap_bottom_k": -2.8323919773101807,
            "interaction_matrix_overlap_top_k": -1.2335162162780762,
            "interaction_matrix_overlap_bottom_k": 2.737562656402588,
            "effective_rank": 1.184205412864685,
            "effective_rank_mergeability_score": -0.41716742515563965,
            "stable_rank": -0.8158910870552063,
            "spectral_gap": -0.9980124831199646,
            "singular_value_ratio": -0.8607582449913025,
            "layerwise_effective_rank": 0.6119584441184998,
            "layerwise_effective_rank_mergeability_score": 1.533812165260315,
            "singular_value_overlap": -0.11926592141389847,
            "subspace_overlap": 0.37090468406677246,
            "right_subspace_overlap": 0.4189610481262207,
            "activation_l2_distance": 0.8216736316680908,
            "activation_cosine_similarity": 1.214774489402771,
            "activation_magnitude_ratio": 0.017830798402428627,
            "activation_dot_product": -0.19170476496219635,
            "encoder_gradient_cosine_similarity": 0.09833906590938568,
            "encoder_gradient_l2_distance": -0.48587435483932495,
            "encoder_gradient_dot_product": 0.03301704674959183,
            "input_gradient_cosine_similarity": 0.07800602912902832,
            "input_gradient_l2_distance": -0.5263983011245728,
            "input_gradient_dot_product": -0.19041362404823303
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7282262860523483,
          "val_r": 0.7153304585547655,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 13.79046630859375,
            "right_subspace_overlap_bottom_k": -3.930928945541382,
            "interaction_matrix_overlap_top_k": 7.266302585601807,
            "interaction_matrix_overlap_bottom_k": -6.84897518157959,
            "effective_rank": -2.666510820388794,
            "effective_rank_mergeability_score": 8.496403694152832,
            "stable_rank": 10.62496566772461,
            "spectral_gap": 4.915859222412109,
            "singular_value_ratio": 6.081844806671143,
            "layerwise_effective_rank": -2.370492696762085,
            "layerwise_effective_rank_mergeability_score": 3.3401083946228027,
            "singular_value_overlap": 1.2967160940170288,
            "subspace_overlap": 5.1389594078063965,
            "right_subspace_overlap": -8.335824012756348,
            "activation_l2_distance": -7.945807456970215,
            "activation_cosine_similarity": 5.257299900054932,
            "activation_magnitude_ratio": -2.3196468353271484,
            "activation_dot_product": 7.135577201843262,
            "encoder_gradient_cosine_similarity": 5.248079776763916,
            "encoder_gradient_l2_distance": -27.4298095703125,
            "encoder_gradient_dot_product": 1.8447003364562988,
            "input_gradient_cosine_similarity": 3.3921825885772705,
            "input_gradient_l2_distance": -9.769912719726562,
            "input_gradient_dot_product": -11.212986946105957
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7358682269909206,
          "val_r": 0.7996104084270184,
          "n_iterations": 898,
          "coefficients": {
            "right_subspace_overlap_top_k": -0.2283237725496292,
            "right_subspace_overlap_bottom_k": -17.9476318359375,
            "interaction_matrix_overlap_top_k": 4.741369247436523,
            "interaction_matrix_overlap_bottom_k": 1.8543000221252441,
            "effective_rank": 1.9163018465042114,
            "effective_rank_mergeability_score": 7.818216323852539,
            "stable_rank": 11.073718070983887,
            "spectral_gap": 6.993395805358887,
            "singular_value_ratio": 2.345874547958374,
            "layerwise_effective_rank": -14.792780876159668,
            "layerwise_effective_rank_mergeability_score": -9.5382661819458,
            "singular_value_overlap": 2.371358633041382,
            "subspace_overlap": -1.5721869468688965,
            "right_subspace_overlap": 15.363202095031738,
            "activation_l2_distance": 3.214367151260376,
            "activation_cosine_similarity": 17.003461837768555,
            "activation_magnitude_ratio": -1.524810791015625,
            "activation_dot_product": 4.8718342781066895,
            "encoder_gradient_cosine_similarity": 4.106510639190674,
            "encoder_gradient_l2_distance": -28.54589080810547,
            "encoder_gradient_dot_product": 3.6236655712127686,
            "input_gradient_cosine_similarity": 4.402499675750732,
            "input_gradient_l2_distance": -9.796453475952148,
            "input_gradient_dot_product": -6.755390167236328
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.7053617323157264,
          "val_r": 0.08280884063300056,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 7.120969295501709,
            "right_subspace_overlap_bottom_k": 8.792340278625488,
            "interaction_matrix_overlap_top_k": 3.2975170612335205,
            "interaction_matrix_overlap_bottom_k": -26.540075302124023,
            "effective_rank": -8.847957611083984,
            "effective_rank_mergeability_score": -9.152019500732422,
            "stable_rank": 2.232511043548584,
            "spectral_gap": -4.4024224281311035,
            "singular_value_ratio": 8.383139610290527,
            "layerwise_effective_rank": -24.907569885253906,
            "layerwise_effective_rank_mergeability_score": 2.193969249725342,
            "singular_value_overlap": 16.426998138427734,
            "subspace_overlap": 13.433082580566406,
            "right_subspace_overlap": 11.641752243041992,
            "activation_l2_distance": 15.777573585510254,
            "activation_cosine_similarity": 33.853614807128906,
            "activation_magnitude_ratio": -7.972553253173828,
            "activation_dot_product": 19.330171585083008,
            "encoder_gradient_cosine_similarity": 16.470516204833984,
            "encoder_gradient_l2_distance": -14.133688926696777,
            "encoder_gradient_dot_product": 8.256880760192871,
            "input_gradient_cosine_similarity": 6.45627498626709,
            "input_gradient_l2_distance": -41.669002532958984,
            "input_gradient_dot_product": -35.04356384277344
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7031081246212492,
          "val_r": 0.6777928525671546,
          "n_iterations": 936,
          "coefficients": {
            "right_subspace_overlap_top_k": 21.675466537475586,
            "right_subspace_overlap_bottom_k": -38.74187088012695,
            "interaction_matrix_overlap_top_k": -7.921904563903809,
            "interaction_matrix_overlap_bottom_k": -20.29034996032715,
            "effective_rank": 4.279170989990234,
            "effective_rank_mergeability_score": -5.2115960121154785,
            "stable_rank": -13.442952156066895,
            "spectral_gap": 12.543571472167969,
            "singular_value_ratio": 18.98656463623047,
            "layerwise_effective_rank": 34.61944580078125,
            "layerwise_effective_rank_mergeability_score": 39.31643295288086,
            "singular_value_overlap": -0.2811890244483948,
            "subspace_overlap": -0.7209911346435547,
            "right_subspace_overlap": 61.54486846923828,
            "activation_l2_distance": -40.64036560058594,
            "activation_cosine_similarity": 9.944061279296875,
            "activation_magnitude_ratio": -23.496051788330078,
            "activation_dot_product": 3.8622426986694336,
            "encoder_gradient_cosine_similarity": 15.758731842041016,
            "encoder_gradient_l2_distance": -84.12553405761719,
            "encoder_gradient_dot_product": 14.233826637268066,
            "input_gradient_cosine_similarity": 11.472973823547363,
            "input_gradient_l2_distance": -6.3558454513549805,
            "input_gradient_dot_product": -6.010327339172363
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7234326801791722,
          "val_r": 0.5375351522138571,
          "n_iterations": 921,
          "coefficients": {
            "right_subspace_overlap_top_k": 2.975987195968628,
            "right_subspace_overlap_bottom_k": -14.666023254394531,
            "interaction_matrix_overlap_top_k": 17.922163009643555,
            "interaction_matrix_overlap_bottom_k": -0.4834803640842438,
            "effective_rank": 2.579922676086426,
            "effective_rank_mergeability_score": 6.366745948791504,
            "stable_rank": 2.1546642780303955,
            "spectral_gap": -8.220237731933594,
            "singular_value_ratio": -4.353963851928711,
            "layerwise_effective_rank": -1.3584836721420288,
            "layerwise_effective_rank_mergeability_score": 7.297514915466309,
            "singular_value_overlap": 3.753061056137085,
            "subspace_overlap": -5.499792098999023,
            "right_subspace_overlap": 1.2686349153518677,
            "activation_l2_distance": -0.27518177032470703,
            "activation_cosine_similarity": 8.389434814453125,
            "activation_magnitude_ratio": 1.0905474424362183,
            "activation_dot_product": 12.342170715332031,
            "encoder_gradient_cosine_similarity": 5.830009937286377,
            "encoder_gradient_l2_distance": -22.52074432373047,
            "encoder_gradient_dot_product": 7.294764041900635,
            "input_gradient_cosine_similarity": 4.528866291046143,
            "input_gradient_l2_distance": -15.764089584350586,
            "input_gradient_dot_product": -9.654119491577148
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5912258864706917,
          "val_r": 0.1792967169451582,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 41.83648681640625,
            "right_subspace_overlap_bottom_k": -6.080262184143066,
            "interaction_matrix_overlap_top_k": 30.228759765625,
            "interaction_matrix_overlap_bottom_k": -65.8370590209961,
            "effective_rank": 44.729454040527344,
            "effective_rank_mergeability_score": -39.94880676269531,
            "stable_rank": -12.333821296691895,
            "spectral_gap": -8.300590515136719,
            "singular_value_ratio": -21.25279998779297,
            "layerwise_effective_rank": -17.49350357055664,
            "layerwise_effective_rank_mergeability_score": 46.13560485839844,
            "singular_value_overlap": -2.346085786819458,
            "subspace_overlap": 56.8310432434082,
            "right_subspace_overlap": 28.480024337768555,
            "activation_l2_distance": -55.73516082763672,
            "activation_cosine_similarity": -10.430456161499023,
            "activation_magnitude_ratio": -49.125022888183594,
            "activation_dot_product": 24.27330207824707,
            "encoder_gradient_cosine_similarity": 19.36042022705078,
            "encoder_gradient_l2_distance": -6.39532470703125,
            "encoder_gradient_dot_product": 31.838321685791016,
            "input_gradient_cosine_similarity": 21.615358352661133,
            "input_gradient_l2_distance": -25.0025577545166,
            "input_gradient_dot_product": -24.04884910583496
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7717033867426828,
          "val_r": 0.6751063044005635,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 25.291929244995117,
            "right_subspace_overlap_bottom_k": -51.39521789550781,
            "interaction_matrix_overlap_top_k": 10.666016578674316,
            "interaction_matrix_overlap_bottom_k": 3.0698773860931396,
            "effective_rank": 32.62632369995117,
            "effective_rank_mergeability_score": 49.327728271484375,
            "stable_rank": 1.2405662536621094,
            "spectral_gap": -9.841392517089844,
            "singular_value_ratio": -6.542737007141113,
            "layerwise_effective_rank": 23.77329444885254,
            "layerwise_effective_rank_mergeability_score": 17.7097225189209,
            "singular_value_overlap": -2.5245978832244873,
            "subspace_overlap": 28.100698471069336,
            "right_subspace_overlap": -26.026538848876953,
            "activation_l2_distance": -31.383840560913086,
            "activation_cosine_similarity": 11.8113431930542,
            "activation_magnitude_ratio": -7.3995680809021,
            "activation_dot_product": 21.08059310913086,
            "encoder_gradient_cosine_similarity": 13.168323516845703,
            "encoder_gradient_l2_distance": -31.78582191467285,
            "encoder_gradient_dot_product": -6.108211517333984,
            "input_gradient_cosine_similarity": 14.59909725189209,
            "input_gradient_l2_distance": -56.04694747924805,
            "input_gradient_dot_product": -22.412038803100586
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "arithmetic": {
      "aggregate_metrics": {
        "train_r": 0.3318268083032877,
        "train_p": 1.1434878501278425e-83,
        "val_r": 0.26481052279597517,
        "val_p": 3.696237311518426e-07
      },
      "per_fold_stats": {
        "train_r_mean": 0.5145121386564082,
        "train_r_std": 0.08159380308796446,
        "val_r_mean": 0.3935141877602133,
        "val_r_std": 0.1800244871190147
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 14.119417190551758,
        "right_subspace_overlap_bottom_k": -5.767834663391113,
        "interaction_matrix_overlap_top_k": 12.556540489196777,
        "interaction_matrix_overlap_bottom_k": 11.321340560913086,
        "effective_rank": 4.034346580505371,
        "effective_rank_mergeability_score": 4.600121974945068,
        "stable_rank": -2.1511895656585693,
        "spectral_gap": 5.348729133605957,
        "singular_value_ratio": -2.1478819847106934,
        "layerwise_effective_rank": -5.67301082611084,
        "layerwise_effective_rank_mergeability_score": 0.07685728371143341,
        "singular_value_overlap": -20.46152114868164,
        "subspace_overlap": 17.619558334350586,
        "right_subspace_overlap": 12.905008316040039,
        "activation_l2_distance": -7.2193284034729,
        "activation_cosine_similarity": 15.962809562683105,
        "activation_magnitude_ratio": -5.314408302307129,
        "activation_dot_product": 7.48459005355835,
        "encoder_gradient_cosine_similarity": 8.19008731842041,
        "encoder_gradient_l2_distance": -29.133434295654297,
        "encoder_gradient_dot_product": 6.477674961090088,
        "input_gradient_cosine_similarity": 9.75427532196045,
        "input_gradient_l2_distance": -29.107894897460938,
        "input_gradient_dot_product": -22.47701072692871
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 12.30291748046875,
        "right_subspace_overlap_bottom_k": 15.38562297821045,
        "interaction_matrix_overlap_top_k": 17.342649459838867,
        "interaction_matrix_overlap_bottom_k": 15.661320686340332,
        "effective_rank": 11.577472686767578,
        "effective_rank_mergeability_score": 12.088871002197266,
        "stable_rank": 10.299169540405273,
        "spectral_gap": 9.567400932312012,
        "singular_value_ratio": 11.56169605255127,
        "layerwise_effective_rank": 21.21300506591797,
        "layerwise_effective_rank_mergeability_score": 17.80553436279297,
        "singular_value_overlap": 14.74803352355957,
        "subspace_overlap": 20.141372680664062,
        "right_subspace_overlap": 14.255441665649414,
        "activation_l2_distance": 10.894170761108398,
        "activation_cosine_similarity": 10.45805549621582,
        "activation_magnitude_ratio": 9.391753196716309,
        "activation_dot_product": 13.484771728515625,
        "encoder_gradient_cosine_similarity": 8.023262023925781,
        "encoder_gradient_l2_distance": 18.099227905273438,
        "encoder_gradient_dot_product": 6.375010013580322,
        "input_gradient_cosine_similarity": 7.414261817932129,
        "input_gradient_l2_distance": 11.51064682006836,
        "input_gradient_dot_product": 23.355955123901367
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.482610333252911,
          "val_r": 0.3822349686679651,
          "n_iterations": 616,
          "coefficients": {
            "right_subspace_overlap_top_k": 28.34377670288086,
            "right_subspace_overlap_bottom_k": -6.758167743682861,
            "interaction_matrix_overlap_top_k": 2.1974804401397705,
            "interaction_matrix_overlap_bottom_k": 26.167280197143555,
            "effective_rank": -25.3055419921875,
            "effective_rank_mergeability_score": -0.06970669329166412,
            "stable_rank": 2.0768160820007324,
            "spectral_gap": 10.609889030456543,
            "singular_value_ratio": -15.570098876953125,
            "layerwise_effective_rank": 19.285282135009766,
            "layerwise_effective_rank_mergeability_score": -14.283636093139648,
            "singular_value_overlap": -40.228179931640625,
            "subspace_overlap": 19.201799392700195,
            "right_subspace_overlap": 23.516876220703125,
            "activation_l2_distance": 4.390182971954346,
            "activation_cosine_similarity": 25.535503387451172,
            "activation_magnitude_ratio": -12.857666015625,
            "activation_dot_product": 22.97817611694336,
            "encoder_gradient_cosine_similarity": -3.4038660526275635,
            "encoder_gradient_l2_distance": -54.63661193847656,
            "encoder_gradient_dot_product": -9.435650825500488,
            "input_gradient_cosine_similarity": 19.667007446289062,
            "input_gradient_l2_distance": -15.899869918823242,
            "input_gradient_dot_product": -4.523545742034912
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5285297628054565,
          "val_r": 0.3652038125920084,
          "n_iterations": 934,
          "coefficients": {
            "right_subspace_overlap_top_k": -8.858386993408203,
            "right_subspace_overlap_bottom_k": 11.86046028137207,
            "interaction_matrix_overlap_top_k": 0.03186450153589249,
            "interaction_matrix_overlap_bottom_k": -8.442291259765625,
            "effective_rank": 17.81745719909668,
            "effective_rank_mergeability_score": -6.170420169830322,
            "stable_rank": -5.609588146209717,
            "spectral_gap": 12.92708969116211,
            "singular_value_ratio": -1.8408864736557007,
            "layerwise_effective_rank": 5.404196739196777,
            "layerwise_effective_rank_mergeability_score": 16.846141815185547,
            "singular_value_overlap": -9.980436325073242,
            "subspace_overlap": 2.3371832370758057,
            "right_subspace_overlap": 26.350269317626953,
            "activation_l2_distance": -5.13045597076416,
            "activation_cosine_similarity": 13.943649291992188,
            "activation_magnitude_ratio": -4.350587368011475,
            "activation_dot_product": -6.09344482421875,
            "encoder_gradient_cosine_similarity": -0.059561219066381454,
            "encoder_gradient_l2_distance": -21.988927841186523,
            "encoder_gradient_dot_product": 7.90430212020874,
            "input_gradient_cosine_similarity": 1.4288681745529175,
            "input_gradient_l2_distance": -23.848438262939453,
            "input_gradient_dot_product": -13.479629516601562
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.49898530233874716,
          "val_r": 0.41813261194714546,
          "n_iterations": 605,
          "coefficients": {
            "right_subspace_overlap_top_k": 25.524658203125,
            "right_subspace_overlap_bottom_k": -14.113786697387695,
            "interaction_matrix_overlap_top_k": 21.242164611816406,
            "interaction_matrix_overlap_bottom_k": 20.982080459594727,
            "effective_rank": 7.344912528991699,
            "effective_rank_mergeability_score": 6.645753383636475,
            "stable_rank": 5.196351528167725,
            "spectral_gap": -6.92702579498291,
            "singular_value_ratio": -10.779349327087402,
            "layerwise_effective_rank": -16.43260955810547,
            "layerwise_effective_rank_mergeability_score": 8.427144050598145,
            "singular_value_overlap": -31.681917190551758,
            "subspace_overlap": 15.04929256439209,
            "right_subspace_overlap": 17.055652618408203,
            "activation_l2_distance": -9.144969940185547,
            "activation_cosine_similarity": 12.484496116638184,
            "activation_magnitude_ratio": -10.983078002929688,
            "activation_dot_product": 13.177202224731445,
            "encoder_gradient_cosine_similarity": 6.781496524810791,
            "encoder_gradient_l2_distance": -24.65355110168457,
            "encoder_gradient_dot_product": 9.719962120056152,
            "input_gradient_cosine_similarity": 15.923280715942383,
            "input_gradient_l2_distance": -31.223512649536133,
            "input_gradient_dot_product": -28.617162704467773
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5196210575704936,
          "val_r": 0.2750394992299855,
          "n_iterations": 735,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.340874195098877,
            "right_subspace_overlap_bottom_k": 2.994988441467285,
            "interaction_matrix_overlap_top_k": 14.656915664672852,
            "interaction_matrix_overlap_bottom_k": 4.70757532119751,
            "effective_rank": 3.534442901611328,
            "effective_rank_mergeability_score": 11.049209594726562,
            "stable_rank": -0.5490593314170837,
            "spectral_gap": 5.831988334655762,
            "singular_value_ratio": -4.155269145965576,
            "layerwise_effective_rank": 6.531237602233887,
            "layerwise_effective_rank_mergeability_score": 2.484354257583618,
            "singular_value_overlap": -22.05815315246582,
            "subspace_overlap": 16.20134925842285,
            "right_subspace_overlap": 10.62297248840332,
            "activation_l2_distance": -3.6043739318847656,
            "activation_cosine_similarity": 14.773627281188965,
            "activation_magnitude_ratio": -6.1379876136779785,
            "activation_dot_product": -0.7032983303070068,
            "encoder_gradient_cosine_similarity": 5.747458457946777,
            "encoder_gradient_l2_distance": -29.81177520751953,
            "encoder_gradient_dot_product": 3.2874717712402344,
            "input_gradient_cosine_similarity": 9.025246620178223,
            "input_gradient_l2_distance": -19.40557289123535,
            "input_gradient_dot_product": -27.366289138793945
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4396848478732758,
          "val_r": 0.4737826451449773,
          "n_iterations": 456,
          "coefficients": {
            "right_subspace_overlap_top_k": 18.220327377319336,
            "right_subspace_overlap_bottom_k": 20.856287002563477,
            "interaction_matrix_overlap_top_k": 38.07107925415039,
            "interaction_matrix_overlap_bottom_k": -13.365461349487305,
            "effective_rank": 28.445430755615234,
            "effective_rank_mergeability_score": 40.02216720581055,
            "stable_rank": -20.184350967407227,
            "spectral_gap": -7.051898002624512,
            "singular_value_ratio": 6.042202472686768,
            "layerwise_effective_rank": -40.888912200927734,
            "layerwise_effective_rank_mergeability_score": -31.90715980529785,
            "singular_value_overlap": -39.59371566772461,
            "subspace_overlap": 83.71076965332031,
            "right_subspace_overlap": 32.01662063598633,
            "activation_l2_distance": -36.72880554199219,
            "activation_cosine_similarity": 15.9818754196167,
            "activation_magnitude_ratio": -16.849868774414062,
            "activation_dot_product": 38.59208679199219,
            "encoder_gradient_cosine_similarity": 17.595367431640625,
            "encoder_gradient_l2_distance": -38.2269172668457,
            "encoder_gradient_dot_product": 6.2207932472229,
            "input_gradient_cosine_similarity": 30.94353485107422,
            "input_gradient_l2_distance": -47.711647033691406,
            "input_gradient_dot_product": -83.21305847167969
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.4981021774068783,
          "val_r": 0.6956005543086647,
          "n_iterations": 569,
          "coefficients": {
            "right_subspace_overlap_top_k": 4.1641974449157715,
            "right_subspace_overlap_bottom_k": 1.679530143737793,
            "interaction_matrix_overlap_top_k": 16.596498489379883,
            "interaction_matrix_overlap_bottom_k": 15.221346855163574,
            "effective_rank": -2.5924952030181885,
            "effective_rank_mergeability_score": 4.120330810546875,
            "stable_rank": -3.154924154281616,
            "spectral_gap": -3.739504814147949,
            "singular_value_ratio": -2.0339760780334473,
            "layerwise_effective_rank": -2.9591028690338135,
            "layerwise_effective_rank_mergeability_score": 13.21554946899414,
            "singular_value_overlap": -27.692180633544922,
            "subspace_overlap": 14.29337215423584,
            "right_subspace_overlap": 17.899545669555664,
            "activation_l2_distance": -6.349045753479004,
            "activation_cosine_similarity": 11.502598762512207,
            "activation_magnitude_ratio": -6.000173568725586,
            "activation_dot_product": 17.22829818725586,
            "encoder_gradient_cosine_similarity": 11.314677238464355,
            "encoder_gradient_l2_distance": -30.582876205444336,
            "encoder_gradient_dot_product": 0.11348126828670502,
            "input_gradient_cosine_similarity": 12.212714195251465,
            "input_gradient_l2_distance": -22.432661056518555,
            "input_gradient_dot_product": -31.027801513671875
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.4648804040623954,
          "val_r": 0.23663304192174547,
          "n_iterations": 544,
          "coefficients": {
            "right_subspace_overlap_top_k": 34.36361312866211,
            "right_subspace_overlap_bottom_k": -23.328218460083008,
            "interaction_matrix_overlap_top_k": -25.751977920532227,
            "interaction_matrix_overlap_bottom_k": -3.939565658569336,
            "effective_rank": 10.442103385925293,
            "effective_rank_mergeability_score": -12.383810043334961,
            "stable_rank": -16.137964248657227,
            "spectral_gap": 3.465789794921875,
            "singular_value_ratio": 14.223567008972168,
            "layerwise_effective_rank": -47.29713439941406,
            "layerwise_effective_rank_mergeability_score": 0.6019549369812012,
            "singular_value_overlap": -45.6707649230957,
            "subspace_overlap": 50.73278045654297,
            "right_subspace_overlap": 39.72226333618164,
            "activation_l2_distance": -12.341073989868164,
            "activation_cosine_similarity": 52.859649658203125,
            "activation_magnitude_ratio": 26.619535446166992,
            "activation_dot_product": -1.1250113248825073,
            "encoder_gradient_cosine_similarity": 34.339195251464844,
            "encoder_gradient_l2_distance": -92.52062225341797,
            "encoder_gradient_dot_product": 11.629029273986816,
            "input_gradient_cosine_similarity": 10.070840835571289,
            "input_gradient_l2_distance": -43.461814880371094,
            "input_gradient_dot_product": 35.884849548339844
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.38390612253702466,
          "val_r": -0.018793645977256274,
          "n_iterations": 629,
          "coefficients": {
            "right_subspace_overlap_top_k": 30.16448402404785,
            "right_subspace_overlap_bottom_k": 11.402137756347656,
            "interaction_matrix_overlap_top_k": 6.709160327911377,
            "interaction_matrix_overlap_bottom_k": -2.312346935272217,
            "effective_rank": -7.781772613525391,
            "effective_rank_mergeability_score": -12.785612106323242,
            "stable_rank": -5.2906718254089355,
            "spectral_gap": 18.713550567626953,
            "singular_value_ratio": -16.37509536743164,
            "layerwise_effective_rank": -10.00205135345459,
            "layerwise_effective_rank_mergeability_score": -19.932491302490234,
            "singular_value_overlap": 13.144667625427246,
            "subspace_overlap": 18.183813095092773,
            "right_subspace_overlap": 24.552318572998047,
            "activation_l2_distance": -30.806888580322266,
            "activation_cosine_similarity": 3.9938464164733887,
            "activation_magnitude_ratio": -21.813020706176758,
            "activation_dot_product": 22.384389877319336,
            "encoder_gradient_cosine_similarity": 12.180599212646484,
            "encoder_gradient_l2_distance": -27.33077621459961,
            "encoder_gradient_dot_product": 13.756980895996094,
            "input_gradient_cosine_similarity": 7.270514488220215,
            "input_gradient_l2_distance": -30.77480697631836,
            "input_gradient_dot_product": 3.7465672492980957
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.5462877983803647,
          "val_r": 0.06638855348031472,
          "n_iterations": 830,
          "coefficients": {
            "right_subspace_overlap_top_k": 20.101545333862305,
            "right_subspace_overlap_bottom_k": -4.670459270477295,
            "interaction_matrix_overlap_top_k": 4.121395587921143,
            "interaction_matrix_overlap_bottom_k": 6.266798973083496,
            "effective_rank": -2.8596513271331787,
            "effective_rank_mergeability_score": 5.272651195526123,
            "stable_rank": 9.409390449523926,
            "spectral_gap": 2.3062052726745605,
            "singular_value_ratio": -1.1185762882232666,
            "layerwise_effective_rank": 5.742580890655518,
            "layerwise_effective_rank_mergeability_score": 17.171152114868164,
            "singular_value_overlap": -14.429375648498535,
            "subspace_overlap": 1.740536093711853,
            "right_subspace_overlap": -0.2518955171108246,
            "activation_l2_distance": -6.7803239822387695,
            "activation_cosine_similarity": 9.962695121765137,
            "activation_magnitude_ratio": -1.969326138496399,
            "activation_dot_product": -1.0783077478408813,
            "encoder_gradient_cosine_similarity": 8.140018463134766,
            "encoder_gradient_l2_distance": -18.73501205444336,
            "encoder_gradient_dot_product": 4.55377197265625,
            "input_gradient_cosine_similarity": 2.8606271743774414,
            "input_gradient_l2_distance": -23.582368850708008,
            "input_gradient_dot_product": -21.175888061523438
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5010041868451925,
          "val_r": 0.5157814776660087,
          "n_iterations": 590,
          "coefficients": {
            "right_subspace_overlap_top_k": 16.04686164855957,
            "right_subspace_overlap_bottom_k": -25.659870147705078,
            "interaction_matrix_overlap_top_k": 14.289681434631348,
            "interaction_matrix_overlap_bottom_k": 33.90150833129883,
            "effective_rank": -2.6856346130371094,
            "effective_rank_mergeability_score": 21.041484832763672,
            "stable_rank": 1.9588543176651,
            "spectral_gap": -16.521240234375,
            "singular_value_ratio": -25.391742706298828,
            "layerwise_effective_rank": 46.17119216918945,
            "layerwise_effective_rank_mergeability_score": 34.028411865234375,
            "singular_value_overlap": -38.65129089355469,
            "subspace_overlap": 11.58993911743164,
            "right_subspace_overlap": 35.79671859741211,
            "activation_l2_distance": -12.963349342346191,
            "activation_cosine_similarity": 5.564289093017578,
            "activation_magnitude_ratio": -8.938560485839844,
            "activation_dot_product": 0.9871547818183899,
            "encoder_gradient_cosine_similarity": 12.271106719970703,
            "encoder_gradient_l2_distance": -35.7931022644043,
            "encoder_gradient_dot_product": 10.447818756103516,
            "input_gradient_cosine_similarity": 3.3294365406036377,
            "input_gradient_l2_distance": -36.235660552978516,
            "input_gradient_dot_product": -43.58653259277344
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5026142442995892,
          "val_r": 0.2448288042192334,
          "n_iterations": 655,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.814764022827148,
            "right_subspace_overlap_bottom_k": 4.796172618865967,
            "interaction_matrix_overlap_top_k": 4.378621578216553,
            "interaction_matrix_overlap_bottom_k": 9.21117877960205,
            "effective_rank": -9.806722640991211,
            "effective_rank_mergeability_score": 10.59415054321289,
            "stable_rank": 1.4740495681762695,
            "spectral_gap": 17.9252872467041,
            "singular_value_ratio": 14.042969703674316,
            "layerwise_effective_rank": 0.4206969141960144,
            "layerwise_effective_rank_mergeability_score": -11.481852531433105,
            "singular_value_overlap": -11.41766357421875,
            "subspace_overlap": 14.315881729125977,
            "right_subspace_overlap": -8.579792022705078,
            "activation_l2_distance": -9.758255004882812,
            "activation_cosine_similarity": 13.69425106048584,
            "activation_magnitude_ratio": -3.3749330043792725,
            "activation_dot_product": 8.704119682312012,
            "encoder_gradient_cosine_similarity": 0.9208440780639648,
            "encoder_gradient_l2_distance": -25.763463973999023,
            "encoder_gradient_dot_product": -3.315430164337158,
            "input_gradient_cosine_similarity": 8.999175071716309,
            "input_gradient_l2_distance": -19.400890350341797,
            "input_gradient_dot_product": -15.395469665527344
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.48100809722913146,
          "val_r": 0.36786251413269044,
          "n_iterations": 739,
          "coefficients": {
            "right_subspace_overlap_top_k": 13.015987396240234,
            "right_subspace_overlap_bottom_k": 4.547016620635986,
            "interaction_matrix_overlap_top_k": 13.453898429870605,
            "interaction_matrix_overlap_bottom_k": 20.518047332763672,
            "effective_rank": 7.128629684448242,
            "effective_rank_mergeability_score": 12.557836532592773,
            "stable_rank": 2.2873053550720215,
            "spectral_gap": 8.063555717468262,
            "singular_value_ratio": -17.185102462768555,
            "layerwise_effective_rank": -15.286038398742676,
            "layerwise_effective_rank_mergeability_score": -26.548070907592773,
            "singular_value_overlap": -34.34156036376953,
            "subspace_overlap": 33.052371978759766,
            "right_subspace_overlap": 15.17734432220459,
            "activation_l2_distance": 0.6535686254501343,
            "activation_cosine_similarity": 12.855071067810059,
            "activation_magnitude_ratio": -17.180130004882812,
            "activation_dot_product": 26.13164520263672,
            "encoder_gradient_cosine_similarity": 10.391432762145996,
            "encoder_gradient_l2_distance": -22.156707763671875,
            "encoder_gradient_dot_product": 17.99951934814453,
            "input_gradient_cosine_similarity": 21.324935913085938,
            "input_gradient_l2_distance": -34.35320281982422,
            "input_gradient_dot_product": -51.10947036743164
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.500140525439878,
          "val_r": 0.5187006504067804,
          "n_iterations": 930,
          "coefficients": {
            "right_subspace_overlap_top_k": 22.205684661865234,
            "right_subspace_overlap_bottom_k": -7.976184844970703,
            "interaction_matrix_overlap_top_k": 6.913715362548828,
            "interaction_matrix_overlap_bottom_k": 17.038724899291992,
            "effective_rank": 7.991059303283691,
            "effective_rank_mergeability_score": -2.9873645305633545,
            "stable_rank": -5.410268306732178,
            "spectral_gap": 4.887261867523193,
            "singular_value_ratio": -2.815995454788208,
            "layerwise_effective_rank": 2.2783312797546387,
            "layerwise_effective_rank_mergeability_score": 6.687589645385742,
            "singular_value_overlap": -18.404014587402344,
            "subspace_overlap": 9.968561172485352,
            "right_subspace_overlap": -8.164932250976562,
            "activation_l2_distance": -5.236979961395264,
            "activation_cosine_similarity": 8.082941055297852,
            "activation_magnitude_ratio": -3.838413953781128,
            "activation_dot_product": 4.19374942779541,
            "encoder_gradient_cosine_similarity": 6.441166877746582,
            "encoder_gradient_l2_distance": -3.4438071250915527,
            "encoder_gradient_dot_product": 7.101759910583496,
            "input_gradient_cosine_similarity": 5.686378479003906,
            "input_gradient_l2_distance": -37.36528778076172,
            "input_gradient_dot_product": -12.835304260253906
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5221695048301316,
          "val_r": 0.6434024923215454,
          "n_iterations": 630,
          "coefficients": {
            "right_subspace_overlap_top_k": 14.548479080200195,
            "right_subspace_overlap_bottom_k": 1.6222083568572998,
            "interaction_matrix_overlap_top_k": 26.272836685180664,
            "interaction_matrix_overlap_bottom_k": -4.252975940704346,
            "effective_rank": -0.30378395318984985,
            "effective_rank_mergeability_score": 2.4934186935424805,
            "stable_rank": 7.9804229736328125,
            "spectral_gap": 1.635521411895752,
            "singular_value_ratio": -2.8908936977386475,
            "layerwise_effective_rank": 6.096875190734863,
            "layerwise_effective_rank_mergeability_score": 20.437593460083008,
            "singular_value_overlap": -26.513227462768555,
            "subspace_overlap": 3.9045755863189697,
            "right_subspace_overlap": 13.590985298156738,
            "activation_l2_distance": -10.31240463256836,
            "activation_cosine_similarity": 23.12145233154297,
            "activation_magnitude_ratio": -4.522274494171143,
            "activation_dot_product": -13.202826499938965,
            "encoder_gradient_cosine_similarity": 8.640678405761719,
            "encoder_gradient_l2_distance": -26.99661636352539,
            "encoder_gradient_dot_product": 15.403068542480469,
            "input_gradient_cosine_similarity": 5.481928825378418,
            "input_gradient_l2_distance": -33.71028518676758,
            "input_gradient_dot_product": -27.527109146118164
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4896686266088885,
          "val_r": 0.5829208081989534,
          "n_iterations": 846,
          "coefficients": {
            "right_subspace_overlap_top_k": 7.04617166519165,
            "right_subspace_overlap_bottom_k": 4.405786991119385,
            "interaction_matrix_overlap_top_k": 14.152901649475098,
            "interaction_matrix_overlap_bottom_k": -5.780767440795898,
            "effective_rank": -0.056106481701135635,
            "effective_rank_mergeability_score": 17.20401382446289,
            "stable_rank": 14.999956130981445,
            "spectral_gap": 14.905328750610352,
            "singular_value_ratio": 1.902814269065857,
            "layerwise_effective_rank": -1.3214912414550781,
            "layerwise_effective_rank_mergeability_score": -3.2099311351776123,
            "singular_value_overlap": -8.849286079406738,
            "subspace_overlap": 8.895751953125,
            "right_subspace_overlap": 3.338717222213745,
            "activation_l2_distance": -7.655126571655273,
            "activation_cosine_similarity": 16.51741600036621,
            "activation_magnitude_ratio": -3.9898011684417725,
            "activation_dot_product": 1.8398492336273193,
            "encoder_gradient_cosine_similarity": 3.919687032699585,
            "encoder_gradient_l2_distance": -31.066755294799805,
            "encoder_gradient_dot_product": 8.620369911193848,
            "input_gradient_cosine_similarity": 2.985475540161133,
            "input_gradient_l2_distance": -31.002521514892578,
            "input_gradient_dot_product": -26.804256439208984
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.46949247734394556,
          "val_r": 0.35973416354973664,
          "n_iterations": 487,
          "coefficients": {
            "right_subspace_overlap_top_k": 25.778474807739258,
            "right_subspace_overlap_bottom_k": -48.407371520996094,
            "interaction_matrix_overlap_top_k": 62.053794860839844,
            "interaction_matrix_overlap_bottom_k": 47.78425598144531,
            "effective_rank": 4.692432880401611,
            "effective_rank_mergeability_score": 3.9537241458892822,
            "stable_rank": -30.366424560546875,
            "spectral_gap": 6.540866374969482,
            "singular_value_ratio": 22.407272338867188,
            "layerwise_effective_rank": -46.3310661315918,
            "layerwise_effective_rank_mergeability_score": -34.59324264526367,
            "singular_value_overlap": -8.054335594177246,
            "subspace_overlap": 38.26561737060547,
            "right_subspace_overlap": -11.251408576965332,
            "activation_l2_distance": 12.184394836425781,
            "activation_cosine_similarity": 24.639284133911133,
            "activation_magnitude_ratio": -4.199883460998535,
            "activation_dot_product": 22.551513671875,
            "encoder_gradient_cosine_similarity": 13.91691780090332,
            "encoder_gradient_l2_distance": -25.372835159301758,
            "encoder_gradient_dot_product": 9.286083221435547,
            "input_gradient_cosine_similarity": 7.867395877838135,
            "input_gradient_l2_distance": -54.04069519042969,
            "input_gradient_dot_product": -38.30792236328125
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5048021903936567,
          "val_r": 0.3635926198699961,
          "n_iterations": 669,
          "coefficients": {
            "right_subspace_overlap_top_k": 24.011159896850586,
            "right_subspace_overlap_bottom_k": -14.26430606842041,
            "interaction_matrix_overlap_top_k": 29.115068435668945,
            "interaction_matrix_overlap_bottom_k": 13.114598274230957,
            "effective_rank": 15.155768394470215,
            "effective_rank_mergeability_score": 4.450618267059326,
            "stable_rank": -6.993777751922607,
            "spectral_gap": -2.653700590133667,
            "singular_value_ratio": -12.564436912536621,
            "layerwise_effective_rank": -6.9868550300598145,
            "layerwise_effective_rank_mergeability_score": 0.646597146987915,
            "singular_value_overlap": -21.136974334716797,
            "subspace_overlap": -1.5782440900802612,
            "right_subspace_overlap": 10.360011100769043,
            "activation_l2_distance": 4.645589828491211,
            "activation_cosine_similarity": 20.44314956665039,
            "activation_magnitude_ratio": -3.3144776821136475,
            "activation_dot_product": 8.726139068603516,
            "encoder_gradient_cosine_similarity": 10.63953971862793,
            "encoder_gradient_l2_distance": -26.117351531982422,
            "encoder_gradient_dot_product": 10.149064064025879,
            "input_gradient_cosine_similarity": 12.300726890563965,
            "input_gradient_l2_distance": -30.024229049682617,
            "input_gradient_dot_product": -37.1259880065918
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5644945640931007,
          "val_r": 0.4052663643434628,
          "n_iterations": 876,
          "coefficients": {
            "right_subspace_overlap_top_k": -9.83307933807373,
            "right_subspace_overlap_bottom_k": -20.709062576293945,
            "interaction_matrix_overlap_top_k": 1.8666051626205444,
            "interaction_matrix_overlap_bottom_k": 33.99951171875,
            "effective_rank": 21.884965896606445,
            "effective_rank_mergeability_score": -1.7419672012329102,
            "stable_rank": 7.296547889709473,
            "spectral_gap": 18.372098922729492,
            "singular_value_ratio": 4.518306255340576,
            "layerwise_effective_rank": -16.429763793945312,
            "layerwise_effective_rank_mergeability_score": 11.634916305541992,
            "singular_value_overlap": -13.58568000793457,
            "subspace_overlap": 15.590353965759277,
            "right_subspace_overlap": 11.03969669342041,
            "activation_l2_distance": -10.445063591003418,
            "activation_cosine_similarity": 17.563045501708984,
            "activation_magnitude_ratio": -3.359941005706787,
            "activation_dot_product": -13.574869155883789,
            "encoder_gradient_cosine_similarity": 2.923401117324829,
            "encoder_gradient_l2_distance": -27.17943572998047,
            "encoder_gradient_dot_product": 2.8247573375701904,
            "input_gradient_cosine_similarity": 12.160245895385742,
            "input_gradient_l2_distance": -26.762943267822266,
            "input_gradient_dot_product": -17.054109573364258
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.8233188948042487,
          "val_r": 0.662957108585699,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 1.6014306545257568,
            "right_subspace_overlap_bottom_k": -4.074592590332031,
            "interaction_matrix_overlap_top_k": -0.826973557472229,
            "interaction_matrix_overlap_bottom_k": 2.800565481185913,
            "effective_rank": 1.5456328392028809,
            "effective_rank_mergeability_score": -0.5030186176300049,
            "stable_rank": -1.75128173828125,
            "spectral_gap": -0.053071681410074234,
            "singular_value_ratio": 0.6120737195014954,
            "layerwise_effective_rank": 0.47056424617767334,
            "layerwise_effective_rank_mergeability_score": 1.9905920028686523,
            "singular_value_overlap": -0.38808542490005493,
            "subspace_overlap": -1.7078936100006104,
            "right_subspace_overlap": 2.7808899879455566,
            "activation_l2_distance": 1.3504196405410767,
            "activation_cosine_similarity": 2.7628636360168457,
            "activation_magnitude_ratio": -0.08436201512813568,
            "activation_dot_product": 0.06497076153755188,
            "encoder_gradient_cosine_similarity": 0.6199696063995361,
            "encoder_gradient_l2_distance": -3.2614006996154785,
            "encoder_gradient_dot_product": 0.5155867338180542,
            "input_gradient_cosine_similarity": 0.053047869354486465,
            "input_gradient_l2_distance": -2.3905837535858154,
            "input_gradient_dot_product": -1.127741813659668
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5689216550128565,
          "val_r": 0.31101471059460883,
          "n_iterations": 791,
          "coefficients": {
            "right_subspace_overlap_top_k": 2.787262439727783,
            "right_subspace_overlap_bottom_k": -9.559259414672852,
            "interaction_matrix_overlap_top_k": 1.5860812664031982,
            "interaction_matrix_overlap_bottom_k": 12.806756973266602,
            "effective_rank": 6.095808029174805,
            "effective_rank_mergeability_score": -10.761011123657227,
            "stable_rank": -0.2551737129688263,
            "spectral_gap": 17.736587524414062,
            "singular_value_ratio": 6.014580726623535,
            "layerwise_effective_rank": -1.9261447191238403,
            "layerwise_effective_rank_mergeability_score": 9.321532249450684,
            "singular_value_overlap": -9.698254585266113,
            "subspace_overlap": -1.3566738367080688,
            "right_subspace_overlap": 2.527284622192383,
            "activation_l2_distance": -0.3536030054092407,
            "activation_cosine_similarity": 12.974482536315918,
            "activation_magnitude_ratio": 0.8567826151847839,
            "activation_dot_product": -2.089740037918091,
            "encoder_gradient_cosine_similarity": 0.4816034436225891,
            "encoder_gradient_l2_distance": -17.030179977416992,
            "encoder_gradient_dot_product": 2.7707583904266357,
            "input_gradient_cosine_similarity": 5.494122505187988,
            "input_gradient_l2_distance": -18.53087615966797,
            "input_gradient_dot_product": -8.894416809082031
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "tsv": {
      "aggregate_metrics": {
        "train_r": 0.28567495517533215,
        "train_p": 1.4593879409336424e-61,
        "val_r": 0.14568159931877056,
        "val_p": 0.005753077140043521
      },
      "per_fold_stats": {
        "train_r_mean": 0.7441484014528033,
        "train_r_std": 0.09382002159424227,
        "val_r_mean": 0.5915126984908212,
        "val_r_std": 0.16260935649852143
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 3.3161540031433105,
        "right_subspace_overlap_bottom_k": -27.092483520507812,
        "interaction_matrix_overlap_top_k": 41.90476989746094,
        "interaction_matrix_overlap_bottom_k": -4.802565574645996,
        "effective_rank": -5.052855014801025,
        "effective_rank_mergeability_score": 14.695791244506836,
        "stable_rank": -7.6664838790893555,
        "spectral_gap": -15.222320556640625,
        "singular_value_ratio": 7.169997215270996,
        "layerwise_effective_rank": -8.384817123413086,
        "layerwise_effective_rank_mergeability_score": -10.571024894714355,
        "singular_value_overlap": 20.35552978515625,
        "subspace_overlap": 9.691378593444824,
        "right_subspace_overlap": 9.217711448669434,
        "activation_l2_distance": -24.106435775756836,
        "activation_cosine_similarity": 5.551836967468262,
        "activation_magnitude_ratio": -4.51003360748291,
        "activation_dot_product": 29.411157608032227,
        "encoder_gradient_cosine_similarity": 9.732672691345215,
        "encoder_gradient_l2_distance": -28.891748428344727,
        "encoder_gradient_dot_product": -1.629195213317871,
        "input_gradient_cosine_similarity": 15.343626022338867,
        "input_gradient_l2_distance": -19.00566291809082,
        "input_gradient_dot_product": -8.456148147583008
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 45.141624450683594,
        "right_subspace_overlap_bottom_k": 47.7766227722168,
        "interaction_matrix_overlap_top_k": 104.62875366210938,
        "interaction_matrix_overlap_bottom_k": 20.835735321044922,
        "effective_rank": 29.36737632751465,
        "effective_rank_mergeability_score": 75.30974578857422,
        "stable_rank": 38.110862731933594,
        "spectral_gap": 44.092041015625,
        "singular_value_ratio": 35.189849853515625,
        "layerwise_effective_rank": 26.099443435668945,
        "layerwise_effective_rank_mergeability_score": 90.06269836425781,
        "singular_value_overlap": 30.289445877075195,
        "subspace_overlap": 19.819482803344727,
        "right_subspace_overlap": 47.5316047668457,
        "activation_l2_distance": 48.272247314453125,
        "activation_cosine_similarity": 24.80201530456543,
        "activation_magnitude_ratio": 40.826541900634766,
        "activation_dot_product": 45.41999053955078,
        "encoder_gradient_cosine_similarity": 27.47447395324707,
        "encoder_gradient_l2_distance": 37.78289794921875,
        "encoder_gradient_dot_product": 17.118532180786133,
        "input_gradient_cosine_similarity": 26.607271194458008,
        "input_gradient_l2_distance": 29.676898956298828,
        "input_gradient_dot_product": 14.37448787689209
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7374980889456173,
          "val_r": 0.41600436632638527,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 40.41664505004883,
            "right_subspace_overlap_bottom_k": -15.073270797729492,
            "interaction_matrix_overlap_top_k": 5.760771751403809,
            "interaction_matrix_overlap_bottom_k": -4.398040294647217,
            "effective_rank": 28.3582820892334,
            "effective_rank_mergeability_score": -18.779197692871094,
            "stable_rank": -31.44269561767578,
            "spectral_gap": 27.0040283203125,
            "singular_value_ratio": 32.85797119140625,
            "layerwise_effective_rank": -19.623628616333008,
            "layerwise_effective_rank_mergeability_score": 6.474867343902588,
            "singular_value_overlap": 15.187405586242676,
            "subspace_overlap": -26.320110321044922,
            "right_subspace_overlap": -0.25081759691238403,
            "activation_l2_distance": 4.064082145690918,
            "activation_cosine_similarity": 14.512115478515625,
            "activation_magnitude_ratio": -4.761567115783691,
            "activation_dot_product": 24.373695373535156,
            "encoder_gradient_cosine_similarity": 3.0195415019989014,
            "encoder_gradient_l2_distance": -37.235591888427734,
            "encoder_gradient_dot_product": -7.38693380355835,
            "input_gradient_cosine_similarity": -1.8948602676391602,
            "input_gradient_l2_distance": -20.35753631591797,
            "input_gradient_dot_product": -13.506656646728516
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.8383059942097896,
          "val_r": 0.72809583251584,
          "n_iterations": 972,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.04446364566683769,
            "right_subspace_overlap_bottom_k": -1.323655366897583,
            "interaction_matrix_overlap_top_k": -0.5420386791229248,
            "interaction_matrix_overlap_bottom_k": 1.2514384984970093,
            "effective_rank": 0.3202945291996002,
            "effective_rank_mergeability_score": -0.4731675386428833,
            "stable_rank": -0.6406416893005371,
            "spectral_gap": 0.25184473395347595,
            "singular_value_ratio": 0.37967437505722046,
            "layerwise_effective_rank": 0.3027866780757904,
            "layerwise_effective_rank_mergeability_score": 0.5622750520706177,
            "singular_value_overlap": 0.006170673295855522,
            "subspace_overlap": 0.06039559468626976,
            "right_subspace_overlap": 0.4646780490875244,
            "activation_l2_distance": 0.2859630584716797,
            "activation_cosine_similarity": 0.43322300910949707,
            "activation_magnitude_ratio": 0.004515196196734905,
            "activation_dot_product": -0.06492716819047928,
            "encoder_gradient_cosine_similarity": 0.02419627085328102,
            "encoder_gradient_l2_distance": -0.2044024020433426,
            "encoder_gradient_dot_product": 0.027923068031668663,
            "input_gradient_cosine_similarity": 0.013690070249140263,
            "input_gradient_l2_distance": -0.17120708525180817,
            "input_gradient_dot_product": -0.01390120480209589
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7802591583635948,
          "val_r": 0.7476138311504754,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.2125580310821533,
            "right_subspace_overlap_bottom_k": -9.853775024414062,
            "interaction_matrix_overlap_top_k": 2.078845739364624,
            "interaction_matrix_overlap_bottom_k": 0.7608920931816101,
            "effective_rank": 4.428793907165527,
            "effective_rank_mergeability_score": -2.115644693374634,
            "stable_rank": -2.968055248260498,
            "spectral_gap": 5.0213165283203125,
            "singular_value_ratio": 7.3710551261901855,
            "layerwise_effective_rank": -0.9665985703468323,
            "layerwise_effective_rank_mergeability_score": 6.6432061195373535,
            "singular_value_overlap": 1.880854845046997,
            "subspace_overlap": 0.02649400196969509,
            "right_subspace_overlap": 6.161594390869141,
            "activation_l2_distance": -4.966587066650391,
            "activation_cosine_similarity": 2.5561773777008057,
            "activation_magnitude_ratio": -2.125331401824951,
            "activation_dot_product": 2.267437219619751,
            "encoder_gradient_cosine_similarity": 0.9286357760429382,
            "encoder_gradient_l2_distance": -9.315266609191895,
            "encoder_gradient_dot_product": -0.10228590667247772,
            "input_gradient_cosine_similarity": 2.1145665645599365,
            "input_gradient_l2_distance": -9.071244239807129,
            "input_gradient_dot_product": -2.9684343338012695
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.8299122491481804,
          "val_r": 0.8141604210978313,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.8312404155731201,
            "right_subspace_overlap_bottom_k": -4.800971984863281,
            "interaction_matrix_overlap_top_k": -3.2685413360595703,
            "interaction_matrix_overlap_bottom_k": 4.212291717529297,
            "effective_rank": 1.6230412721633911,
            "effective_rank_mergeability_score": -2.6565966606140137,
            "stable_rank": -3.598100185394287,
            "spectral_gap": -0.401001513004303,
            "singular_value_ratio": 0.358318030834198,
            "layerwise_effective_rank": 1.128957986831665,
            "layerwise_effective_rank_mergeability_score": 2.4536187648773193,
            "singular_value_overlap": 0.0428723581135273,
            "subspace_overlap": 0.40113532543182373,
            "right_subspace_overlap": 2.4038429260253906,
            "activation_l2_distance": 1.8159470558166504,
            "activation_cosine_similarity": 2.6011745929718018,
            "activation_magnitude_ratio": -0.03288964554667473,
            "activation_dot_product": -0.4656289219856262,
            "encoder_gradient_cosine_similarity": 0.1801685243844986,
            "encoder_gradient_l2_distance": -0.8974834084510803,
            "encoder_gradient_dot_product": 0.06134781986474991,
            "input_gradient_cosine_similarity": 0.03124108538031578,
            "input_gradient_l2_distance": -0.8467810750007629,
            "input_gradient_dot_product": -0.17857396602630615
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7446381261287824,
          "val_r": 0.7006762908022628,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 16.21272850036621,
            "right_subspace_overlap_bottom_k": -9.579460144042969,
            "interaction_matrix_overlap_top_k": 3.017984628677368,
            "interaction_matrix_overlap_bottom_k": -5.483421325683594,
            "effective_rank": -7.645815372467041,
            "effective_rank_mergeability_score": 5.600058555603027,
            "stable_rank": 8.311503410339355,
            "spectral_gap": -1.451088786125183,
            "singular_value_ratio": -1.5232964754104614,
            "layerwise_effective_rank": -0.10458706319332123,
            "layerwise_effective_rank_mergeability_score": -3.206059455871582,
            "singular_value_overlap": 7.886322975158691,
            "subspace_overlap": 5.529664516448975,
            "right_subspace_overlap": -6.844853401184082,
            "activation_l2_distance": 0.4266088008880615,
            "activation_cosine_similarity": 8.665726661682129,
            "activation_magnitude_ratio": -0.9669709205627441,
            "activation_dot_product": 7.49919319152832,
            "encoder_gradient_cosine_similarity": 3.5541179180145264,
            "encoder_gradient_l2_distance": -18.52302360534668,
            "encoder_gradient_dot_product": -0.043505601584911346,
            "input_gradient_cosine_similarity": 3.6460607051849365,
            "input_gradient_l2_distance": -9.190518379211426,
            "input_gradient_dot_product": -4.78877067565918
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.7690415021697049,
          "val_r": 0.7274810331144873,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 7.133244514465332,
            "right_subspace_overlap_bottom_k": -9.658954620361328,
            "interaction_matrix_overlap_top_k": 2.5783019065856934,
            "interaction_matrix_overlap_bottom_k": -6.093449115753174,
            "effective_rank": 3.510601282119751,
            "effective_rank_mergeability_score": 0.8061385750770569,
            "stable_rank": 1.492677927017212,
            "spectral_gap": 2.8382856845855713,
            "singular_value_ratio": 3.8996872901916504,
            "layerwise_effective_rank": -6.35392951965332,
            "layerwise_effective_rank_mergeability_score": 1.9603509902954102,
            "singular_value_overlap": 4.638339519500732,
            "subspace_overlap": -2.286855459213257,
            "right_subspace_overlap": 8.978087425231934,
            "activation_l2_distance": -4.63250207901001,
            "activation_cosine_similarity": 6.664045810699463,
            "activation_magnitude_ratio": -2.0336835384368896,
            "activation_dot_product": 4.741621494293213,
            "encoder_gradient_cosine_similarity": 4.851641654968262,
            "encoder_gradient_l2_distance": -12.664204597473145,
            "encoder_gradient_dot_product": 1.466078519821167,
            "input_gradient_cosine_similarity": 3.2171428203582764,
            "input_gradient_l2_distance": -8.422534942626953,
            "input_gradient_dot_product": -5.631503105163574
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.7639768017862987,
          "val_r": 0.6894112803061293,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.288342237472534,
            "right_subspace_overlap_bottom_k": -8.280232429504395,
            "interaction_matrix_overlap_top_k": 1.9487673044204712,
            "interaction_matrix_overlap_bottom_k": -2.8243775367736816,
            "effective_rank": 3.048292398452759,
            "effective_rank_mergeability_score": -6.5289225578308105,
            "stable_rank": -5.274056911468506,
            "spectral_gap": 0.6570937633514404,
            "singular_value_ratio": 2.1134212017059326,
            "layerwise_effective_rank": -0.4945640563964844,
            "layerwise_effective_rank_mergeability_score": 6.700590133666992,
            "singular_value_overlap": 3.936520576477051,
            "subspace_overlap": -3.2283313274383545,
            "right_subspace_overlap": 6.881446361541748,
            "activation_l2_distance": 2.3743040561676025,
            "activation_cosine_similarity": 7.237292289733887,
            "activation_magnitude_ratio": -0.12999314069747925,
            "activation_dot_product": 3.6554160118103027,
            "encoder_gradient_cosine_similarity": 2.278597593307495,
            "encoder_gradient_l2_distance": -8.353442192077637,
            "encoder_gradient_dot_product": 2.576129198074341,
            "input_gradient_cosine_similarity": 0.9364966154098511,
            "input_gradient_l2_distance": -7.816174030303955,
            "input_gradient_dot_product": -3.7040581703186035
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.800553918128157,
          "val_r": 0.4409971441556559,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.9347283840179443,
            "right_subspace_overlap_bottom_k": -0.9470694065093994,
            "interaction_matrix_overlap_top_k": -0.5516523718833923,
            "interaction_matrix_overlap_bottom_k": 0.4022236466407776,
            "effective_rank": 0.04642748460173607,
            "effective_rank_mergeability_score": -0.551649272441864,
            "stable_rank": -0.36694034934043884,
            "spectral_gap": 0.5238763689994812,
            "singular_value_ratio": 0.5883870124816895,
            "layerwise_effective_rank": 0.24738557636737823,
            "layerwise_effective_rank_mergeability_score": 0.5526418685913086,
            "singular_value_overlap": 0.06617379188537598,
            "subspace_overlap": -0.4169482886791229,
            "right_subspace_overlap": 0.43005648255348206,
            "activation_l2_distance": 0.2115102857351303,
            "activation_cosine_similarity": 0.7218717336654663,
            "activation_magnitude_ratio": -0.05652294680476189,
            "activation_dot_product": -0.2238234579563141,
            "encoder_gradient_cosine_similarity": 0.1173773854970932,
            "encoder_gradient_l2_distance": -0.6121653318405151,
            "encoder_gradient_dot_product": 0.013588456436991692,
            "input_gradient_cosine_similarity": 0.08903530240058899,
            "input_gradient_l2_distance": -0.23049917817115784,
            "input_gradient_dot_product": 0.016740325838327408
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.8636284103264029,
          "val_r": 0.39119638408691,
          "n_iterations": 421,
          "coefficients": {
            "right_subspace_overlap_top_k": -0.11404532194137573,
            "right_subspace_overlap_bottom_k": -0.8294604420661926,
            "interaction_matrix_overlap_top_k": -0.3121929466724396,
            "interaction_matrix_overlap_bottom_k": 0.8096815347671509,
            "effective_rank": 0.16513997316360474,
            "effective_rank_mergeability_score": 0.14475463330745697,
            "stable_rank": 0.060751721262931824,
            "spectral_gap": 0.25848710536956787,
            "singular_value_ratio": 0.2982265055179596,
            "layerwise_effective_rank": -0.1171981543302536,
            "layerwise_effective_rank_mergeability_score": 0.04227873310446739,
            "singular_value_overlap": -0.00351183139719069,
            "subspace_overlap": 0.06719641387462616,
            "right_subspace_overlap": 0.3965240716934204,
            "activation_l2_distance": 0.14638009667396545,
            "activation_cosine_similarity": 0.2537095844745636,
            "activation_magnitude_ratio": 0.0055742813274264336,
            "activation_dot_product": -0.06309990584850311,
            "encoder_gradient_cosine_similarity": 0.022072969004511833,
            "encoder_gradient_l2_distance": -0.09548326581716537,
            "encoder_gradient_dot_product": -0.00737382285296917,
            "input_gradient_cosine_similarity": 0.017131740227341652,
            "input_gradient_l2_distance": -0.11875122785568237,
            "input_gradient_dot_product": -0.02711227908730507
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7287347152875535,
          "val_r": 0.3276800641204435,
          "n_iterations": 833,
          "coefficients": {
            "right_subspace_overlap_top_k": 38.138519287109375,
            "right_subspace_overlap_bottom_k": -44.631107330322266,
            "interaction_matrix_overlap_top_k": 20.93419647216797,
            "interaction_matrix_overlap_bottom_k": -2.8537817001342773,
            "effective_rank": -20.620960235595703,
            "effective_rank_mergeability_score": -5.920535564422607,
            "stable_rank": 2.7238917350769043,
            "spectral_gap": -15.060051918029785,
            "singular_value_ratio": -3.2428507804870605,
            "layerwise_effective_rank": 4.166965007781982,
            "layerwise_effective_rank_mergeability_score": 14.677207946777344,
            "singular_value_overlap": 14.566093444824219,
            "subspace_overlap": 5.924966335296631,
            "right_subspace_overlap": 1.0184274911880493,
            "activation_l2_distance": 9.143299102783203,
            "activation_cosine_similarity": -4.536867618560791,
            "activation_magnitude_ratio": 5.44098424911499,
            "activation_dot_product": 0.008327553980052471,
            "encoder_gradient_cosine_similarity": 15.420088768005371,
            "encoder_gradient_l2_distance": -16.34712791442871,
            "encoder_gradient_dot_product": 5.081700801849365,
            "input_gradient_cosine_similarity": 8.965580940246582,
            "input_gradient_l2_distance": -20.516521453857422,
            "input_gradient_dot_product": -11.482324600219727
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.8344215616949631,
          "val_r": 0.36288035457435835,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.4408797025680542,
            "right_subspace_overlap_bottom_k": -1.5537883043289185,
            "interaction_matrix_overlap_top_k": -0.6196475028991699,
            "interaction_matrix_overlap_bottom_k": 1.3515328168869019,
            "effective_rank": 0.3957357108592987,
            "effective_rank_mergeability_score": -0.1555272936820984,
            "stable_rank": -0.5792864561080933,
            "spectral_gap": -0.16348783671855927,
            "singular_value_ratio": -0.032125502824783325,
            "layerwise_effective_rank": 0.7186047434806824,
            "layerwise_effective_rank_mergeability_score": 0.8045985102653503,
            "singular_value_overlap": 0.08842268586158752,
            "subspace_overlap": -0.18033336102962494,
            "right_subspace_overlap": 0.39315855503082275,
            "activation_l2_distance": 0.14219343662261963,
            "activation_cosine_similarity": 0.4416012465953827,
            "activation_magnitude_ratio": -0.025892535224556923,
            "activation_dot_product": 0.004402498248964548,
            "encoder_gradient_cosine_similarity": 0.023142969235777855,
            "encoder_gradient_l2_distance": -0.32454514503479004,
            "encoder_gradient_dot_product": -0.01529600564390421,
            "input_gradient_cosine_similarity": 0.03833598271012306,
            "input_gradient_l2_distance": -0.17925657331943512,
            "input_gradient_dot_product": -0.0146969398483634
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6298606639633286,
          "val_r": 0.6637772735650551,
          "n_iterations": 630,
          "coefficients": {
            "right_subspace_overlap_top_k": 72.85150146484375,
            "right_subspace_overlap_bottom_k": -88.92841339111328,
            "interaction_matrix_overlap_top_k": 44.38877868652344,
            "interaction_matrix_overlap_bottom_k": -27.983449935913086,
            "effective_rank": -16.448562622070312,
            "effective_rank_mergeability_score": 7.417191028594971,
            "stable_rank": 25.51403045654297,
            "spectral_gap": -60.60149002075195,
            "singular_value_ratio": -88.2607192993164,
            "layerwise_effective_rank": 24.990421295166016,
            "layerwise_effective_rank_mergeability_score": 9.43873405456543,
            "singular_value_overlap": 93.72869110107422,
            "subspace_overlap": 53.79498291015625,
            "right_subspace_overlap": 103.78233337402344,
            "activation_l2_distance": -110.6910171508789,
            "activation_cosine_similarity": -25.460372924804688,
            "activation_magnitude_ratio": -72.17383575439453,
            "activation_dot_product": 59.15968322753906,
            "encoder_gradient_cosine_similarity": 89.03006744384766,
            "encoder_gradient_l2_distance": -111.34906768798828,
            "encoder_gradient_dot_product": 40.40751266479492,
            "input_gradient_cosine_similarity": 42.406070709228516,
            "input_gradient_l2_distance": -12.856526374816895,
            "input_gradient_dot_product": -51.15900802612305
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.5085185585137801,
          "val_r": 0.34638313268128906,
          "n_iterations": 498,
          "coefficients": {
            "right_subspace_overlap_top_k": -171.44093322753906,
            "right_subspace_overlap_bottom_k": -204.38497924804688,
            "interaction_matrix_overlap_top_k": 481.8224182128906,
            "interaction_matrix_overlap_bottom_k": -52.84648895263672,
            "effective_rank": -28.7302188873291,
            "effective_rank_mergeability_score": 339.37213134765625,
            "stable_rank": -162.6066131591797,
            "spectral_gap": -192.4249267578125,
            "singular_value_ratio": 87.62493133544922,
            "layerwise_effective_rank": -71.11528778076172,
            "layerwise_effective_rank_mergeability_score": -393.4107971191406,
            "singular_value_overlap": 45.78190612792969,
            "subspace_overlap": 45.772945404052734,
            "right_subspace_overlap": 172.59219360351562,
            "activation_l2_distance": -178.35488891601562,
            "activation_cosine_similarity": 100.29986572265625,
            "activation_magnitude_ratio": 138.09471130371094,
            "activation_dot_product": 168.52503967285156,
            "encoder_gradient_cosine_similarity": 34.00831604003906,
            "encoder_gradient_l2_distance": -70.12694549560547,
            "encoder_gradient_dot_product": -50.263671875,
            "input_gradient_cosine_similarity": 84.9127197265625,
            "input_gradient_l2_distance": -128.7242889404297,
            "input_gradient_dot_product": 6.619918346405029
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.8096551077674361,
          "val_r": 0.8026984586879916,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 1.3803812265396118,
            "right_subspace_overlap_bottom_k": -1.3359135389328003,
            "interaction_matrix_overlap_top_k": -0.6971014142036438,
            "interaction_matrix_overlap_bottom_k": 0.6739107966423035,
            "effective_rank": 0.502382218837738,
            "effective_rank_mergeability_score": 0.17593912780284882,
            "stable_rank": 0.20385505259037018,
            "spectral_gap": 0.15584228932857513,
            "singular_value_ratio": 0.09402189403772354,
            "layerwise_effective_rank": -0.12591306865215302,
            "layerwise_effective_rank_mergeability_score": 0.47500067949295044,
            "singular_value_overlap": 0.07009761035442352,
            "subspace_overlap": -0.991852879524231,
            "right_subspace_overlap": 0.8128015398979187,
            "activation_l2_distance": 0.32034438848495483,
            "activation_cosine_similarity": 0.9543534517288208,
            "activation_magnitude_ratio": -0.06712817400693893,
            "activation_dot_product": -0.08808905631303787,
            "encoder_gradient_cosine_similarity": 0.1298855096101761,
            "encoder_gradient_l2_distance": -1.0352933406829834,
            "encoder_gradient_dot_product": 0.05844561755657196,
            "input_gradient_cosine_similarity": 0.14015832543373108,
            "input_gradient_l2_distance": -0.5205288529396057,
            "input_gradient_dot_product": -0.28572142124176025
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6462677926420337,
          "val_r": 0.6644283710120356,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 18.9144344329834,
            "right_subspace_overlap_bottom_k": 6.461788177490234,
            "interaction_matrix_overlap_top_k": 71.96820068359375,
            "interaction_matrix_overlap_bottom_k": 2.4048352241516113,
            "effective_rank": 49.8218994140625,
            "effective_rank_mergeability_score": 1.4989858865737915,
            "stable_rank": -17.028331756591797,
            "spectral_gap": -32.11189270019531,
            "singular_value_ratio": -7.4616899490356445,
            "layerwise_effective_rank": -36.909549713134766,
            "layerwise_effective_rank_mergeability_score": 41.54302215576172,
            "singular_value_overlap": 29.743173599243164,
            "subspace_overlap": 15.14294719696045,
            "right_subspace_overlap": -66.50062561035156,
            "activation_l2_distance": -11.594281196594238,
            "activation_cosine_similarity": 17.48607063293457,
            "activation_magnitude_ratio": -31.355714797973633,
            "activation_dot_product": 64.25263977050781,
            "encoder_gradient_cosine_similarity": 20.132619857788086,
            "encoder_gradient_l2_distance": -46.674808502197266,
            "encoder_gradient_dot_product": -18.189743041992188,
            "input_gradient_cosine_similarity": 8.265043258666992,
            "input_gradient_l2_distance": -62.628074645996094,
            "input_gradient_dot_product": -16.182388305664062
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.6666756438037058,
          "val_r": 0.4200877925657561,
          "n_iterations": 709,
          "coefficients": {
            "right_subspace_overlap_top_k": -16.48417091369629,
            "right_subspace_overlap_bottom_k": -5.182394504547119,
            "interaction_matrix_overlap_top_k": 69.00476837158203,
            "interaction_matrix_overlap_bottom_k": -61.3601188659668,
            "effective_rank": 20.454896926879883,
            "effective_rank_mergeability_score": 28.054227828979492,
            "stable_rank": 31.76280975341797,
            "spectral_gap": -2.156209707260132,
            "singular_value_ratio": 77.3218765258789,
            "layerwise_effective_rank": -61.87644577026367,
            "layerwise_effective_rank_mergeability_score": 67.87799072265625,
            "singular_value_overlap": 75.51193237304688,
            "subspace_overlap": 36.487152099609375,
            "right_subspace_overlap": -2.380192279815674,
            "activation_l2_distance": -85.78472137451172,
            "activation_cosine_similarity": -29.78803825378418,
            "activation_magnitude_ratio": -3.166142702102661,
            "activation_dot_product": 69.02513122558594,
            "encoder_gradient_cosine_similarity": -59.05473327636719,
            "encoder_gradient_l2_distance": -130.15673828125,
            "encoder_gradient_dot_product": 5.767667770385742,
            "input_gradient_cosine_similarity": 15.713849067687988,
            "input_gradient_l2_distance": -45.1771354675293,
            "input_gradient_dot_product": 6.582747459411621
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7694198762172766,
          "val_r": 0.7208386029045378,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 12.070721626281738,
            "right_subspace_overlap_bottom_k": -16.965320587158203,
            "interaction_matrix_overlap_top_k": 5.423648834228516,
            "interaction_matrix_overlap_bottom_k": -1.2820093631744385,
            "effective_rank": 1.2441725730895996,
            "effective_rank_mergeability_score": -3.196380138397217,
            "stable_rank": -4.461429119110107,
            "spectral_gap": -2.2416696548461914,
            "singular_value_ratio": 4.319924354553223,
            "layerwise_effective_rank": -4.668702125549316,
            "layerwise_effective_rank_mergeability_score": 3.1652607917785645,
            "singular_value_overlap": 5.062388896942139,
            "subspace_overlap": -4.562244892120361,
            "right_subspace_overlap": 7.475691318511963,
            "activation_l2_distance": 3.24541974067688,
            "activation_cosine_similarity": 12.587871551513672,
            "activation_magnitude_ratio": -1.7853903770446777,
            "activation_dot_product": 2.9890050888061523,
            "encoder_gradient_cosine_similarity": 5.041551113128662,
            "encoder_gradient_l2_distance": -9.839753150939941,
            "encoder_gradient_dot_product": 3.1399199962615967,
            "input_gradient_cosine_similarity": 3.140817403793335,
            "input_gradient_l2_distance": -11.843501091003418,
            "input_gradient_dot_product": -7.061460018157959
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5637147988506106,
          "val_r": 0.5631597005728042,
          "n_iterations": 510,
          "coefficients": {
            "right_subspace_overlap_top_k": 45.08248519897461,
            "right_subspace_overlap_bottom_k": -57.912044525146484,
            "interaction_matrix_overlap_top_k": 79.36224365234375,
            "interaction_matrix_overlap_bottom_k": 21.149381637573242,
            "effective_rank": -105.19337463378906,
            "effective_rank_mergeability_score": -30.343460083007812,
            "stable_rank": -15.16292667388916,
            "spectral_gap": -26.930904388427734,
            "singular_value_ratio": 50.3669548034668,
            "layerwise_effective_rank": -41.60940933227539,
            "layerwise_effective_rank_mergeability_score": -25.945220947265625,
            "singular_value_overlap": 90.9689712524414,
            "subspace_overlap": 30.078872680664062,
            "right_subspace_overlap": -14.556699752807617,
            "activation_l2_distance": -71.81240844726562,
            "activation_cosine_similarity": 12.166325569152832,
            "activation_magnitude_ratio": -87.40615844726562,
            "activation_dot_product": 77.47400665283203,
            "encoder_gradient_cosine_similarity": 58.610958099365234,
            "encoder_gradient_l2_distance": -29.589693069458008,
            "encoder_gradient_dot_product": 16.660470962524414,
            "input_gradient_cosine_similarity": 79.6991958618164,
            "input_gradient_l2_distance": -18.148202896118164,
            "input_gradient_dot_product": -36.01232147216797
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.8434457231260044,
          "val_r": 0.7271269105603172,
          "n_iterations": 706,
          "coefficients": {
            "right_subspace_overlap_top_k": -0.13304565846920013,
            "right_subspace_overlap_bottom_k": -1.2029260396957397,
            "interaction_matrix_overlap_top_k": -0.45061200857162476,
            "interaction_matrix_overlap_bottom_k": 1.1096901893615723,
            "effective_rank": 0.5815706253051758,
            "effective_rank_mergeability_score": -0.34386831521987915,
            "stable_rank": -0.8374372720718384,
            "spectral_gap": 0.006933585740625858,
            "singular_value_ratio": 0.19082386791706085,
            "layerwise_effective_rank": 0.4711660146713257,
            "layerwise_effective_rank_mergeability_score": 0.7101552486419678,
            "singular_value_overlap": 0.013651767745614052,
            "subspace_overlap": 0.004583925008773804,
            "right_subspace_overlap": 0.6246241331100464,
            "activation_l2_distance": 0.23236966133117676,
            "activation_cosine_similarity": 0.3585260808467865,
            "activation_magnitude_ratio": 0.01025149691849947,
            "activation_dot_product": -0.030817853286862373,
            "encoder_gradient_cosine_similarity": 0.029342228546738625,
            "encoder_gradient_l2_distance": -0.18432177603244781,
            "encoder_gradient_dot_product": 0.007556144148111343,
            "input_gradient_cosine_similarity": 0.02197553589940071,
            "input_gradient_l2_distance": -0.15786153078079224,
            "input_gradient_dot_product": -0.032805152237415314
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7544393379828417,
          "val_r": 0.5755567250158616,
          "n_iterations": 840,
          "coefficients": {
            "right_subspace_overlap_top_k": -6.45759916305542,
            "right_subspace_overlap_bottom_k": -65.86769104003906,
            "interaction_matrix_overlap_top_k": 56.24829864501953,
            "interaction_matrix_overlap_bottom_k": 34.947933197021484,
            "effective_rank": -36.91969680786133,
            "effective_rank_mergeability_score": -18.08863639831543,
            "stable_rank": 21.567323684692383,
            "spectral_gap": -7.6213765144348145,
            "singular_value_ratio": -23.864633560180664,
            "layerwise_effective_rank": 44.24318313598633,
            "layerwise_effective_rank_mergeability_score": 47.059783935546875,
            "singular_value_overlap": 17.93414878845215,
            "subspace_overlap": 38.522926330566406,
            "right_subspace_overlap": -37.52804946899414,
            "activation_l2_distance": -36.700748443603516,
            "activation_cosine_similarity": -17.117942810058594,
            "activation_magnitude_ratio": -27.669479370117188,
            "activation_dot_product": 105.18399047851562,
            "encoder_gradient_cosine_similarity": 16.305883407592773,
            "encoder_gradient_l2_distance": -74.30558013916016,
            "encoder_gradient_dot_product": -31.84343147277832,
            "input_gradient_cosine_similarity": 55.39829635620117,
            "input_gradient_l2_distance": -23.136110305786133,
            "input_gradient_dot_product": -29.292633056640625
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "isotropic": {
      "aggregate_metrics": {
        "train_r": 0.25727099015489063,
        "train_p": 7.130998351725342e-50,
        "val_r": 0.0009795966766641424,
        "val_p": 0.9852638920607066
      },
      "per_fold_stats": {
        "train_r_mean": 0.42936340306508713,
        "train_r_std": 0.0810609833585073,
        "val_r_mean": 0.3137737044104799,
        "val_r_std": 0.14728447151934837
      },
      "average_coefficients": {
        "right_subspace_overlap_top_k": 11.649996757507324,
        "right_subspace_overlap_bottom_k": 34.1492919921875,
        "interaction_matrix_overlap_top_k": 20.721921920776367,
        "interaction_matrix_overlap_bottom_k": 25.3687744140625,
        "effective_rank": -2.1606807708740234,
        "effective_rank_mergeability_score": 14.109103202819824,
        "stable_rank": -6.3288092613220215,
        "spectral_gap": 19.968759536743164,
        "singular_value_ratio": -1.0466731786727905,
        "layerwise_effective_rank": 4.553788661956787,
        "layerwise_effective_rank_mergeability_score": -0.8343027234077454,
        "singular_value_overlap": -33.686927795410156,
        "subspace_overlap": 13.653875350952148,
        "right_subspace_overlap": 23.551822662353516,
        "activation_l2_distance": -21.098356246948242,
        "activation_cosine_similarity": 10.338589668273926,
        "activation_magnitude_ratio": -13.575243949890137,
        "activation_dot_product": -22.958171844482422,
        "encoder_gradient_cosine_similarity": 8.615370750427246,
        "encoder_gradient_l2_distance": -35.867462158203125,
        "encoder_gradient_dot_product": 4.456513404846191,
        "input_gradient_cosine_similarity": 17.097152709960938,
        "input_gradient_l2_distance": -35.59779357910156,
        "input_gradient_dot_product": -34.08332061767578
      },
      "coefficient_std": {
        "right_subspace_overlap_top_k": 20.296411514282227,
        "right_subspace_overlap_bottom_k": 27.330020904541016,
        "interaction_matrix_overlap_top_k": 23.23905372619629,
        "interaction_matrix_overlap_bottom_k": 27.155546188354492,
        "effective_rank": 35.07756805419922,
        "effective_rank_mergeability_score": 26.944433212280273,
        "stable_rank": 25.312644958496094,
        "spectral_gap": 27.12713623046875,
        "singular_value_ratio": 30.362823486328125,
        "layerwise_effective_rank": 21.185985565185547,
        "layerwise_effective_rank_mergeability_score": 15.452764511108398,
        "singular_value_overlap": 19.33830451965332,
        "subspace_overlap": 26.032541275024414,
        "right_subspace_overlap": 32.62809753417969,
        "activation_l2_distance": 24.20085334777832,
        "activation_cosine_similarity": 26.4206485748291,
        "activation_magnitude_ratio": 26.45641326904297,
        "activation_dot_product": 29.326196670532227,
        "encoder_gradient_cosine_similarity": 12.887967109680176,
        "encoder_gradient_l2_distance": 25.502674102783203,
        "encoder_gradient_dot_product": 21.77952766418457,
        "input_gradient_cosine_similarity": 11.798457145690918,
        "input_gradient_l2_distance": 23.741247177124023,
        "input_gradient_dot_product": 19.329442977905273
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.46979573810238956,
          "val_r": 0.338952369833496,
          "n_iterations": 569,
          "coefficients": {
            "right_subspace_overlap_top_k": 23.97238540649414,
            "right_subspace_overlap_bottom_k": 29.194351196289062,
            "interaction_matrix_overlap_top_k": 17.94818878173828,
            "interaction_matrix_overlap_bottom_k": 17.28635597229004,
            "effective_rank": -15.134220123291016,
            "effective_rank_mergeability_score": 16.686498641967773,
            "stable_rank": 4.5886430740356445,
            "spectral_gap": 36.08311080932617,
            "singular_value_ratio": 6.396190643310547,
            "layerwise_effective_rank": 47.34772491455078,
            "layerwise_effective_rank_mergeability_score": 17.393320083618164,
            "singular_value_overlap": -62.586971282958984,
            "subspace_overlap": 22.976734161376953,
            "right_subspace_overlap": 9.640213966369629,
            "activation_l2_distance": -24.940523147583008,
            "activation_cosine_similarity": 14.707571029663086,
            "activation_magnitude_ratio": -11.384641647338867,
            "activation_dot_product": -17.32496452331543,
            "encoder_gradient_cosine_similarity": -8.665376663208008,
            "encoder_gradient_l2_distance": -51.55845260620117,
            "encoder_gradient_dot_product": -21.718379974365234,
            "input_gradient_cosine_similarity": 22.906417846679688,
            "input_gradient_l2_distance": -34.99213409423828,
            "input_gradient_dot_product": -37.82466125488281
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4602230624615796,
          "val_r": 0.3625107033079123,
          "n_iterations": 604,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.7537693977355957,
            "right_subspace_overlap_bottom_k": 14.371106147766113,
            "interaction_matrix_overlap_top_k": 24.455995559692383,
            "interaction_matrix_overlap_bottom_k": 21.478757858276367,
            "effective_rank": 1.9670764207839966,
            "effective_rank_mergeability_score": 10.366402626037598,
            "stable_rank": -2.7474441528320312,
            "spectral_gap": 23.865812301635742,
            "singular_value_ratio": 3.880199670791626,
            "layerwise_effective_rank": 6.157888412475586,
            "layerwise_effective_rank_mergeability_score": -9.185694694519043,
            "singular_value_overlap": -23.149019241333008,
            "subspace_overlap": 5.929421424865723,
            "right_subspace_overlap": -12.410135269165039,
            "activation_l2_distance": -7.199288368225098,
            "activation_cosine_similarity": 6.733505725860596,
            "activation_magnitude_ratio": -7.699024200439453,
            "activation_dot_product": -9.027274131774902,
            "encoder_gradient_cosine_similarity": -2.58949613571167,
            "encoder_gradient_l2_distance": -17.294437408447266,
            "encoder_gradient_dot_product": 4.326783180236816,
            "input_gradient_cosine_similarity": 10.073469161987305,
            "input_gradient_l2_distance": -22.961097717285156,
            "input_gradient_dot_product": -22.099655151367188
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.3794461142892105,
          "val_r": 0.2483521996278329,
          "n_iterations": 417,
          "coefficients": {
            "right_subspace_overlap_top_k": -2.7118642330169678,
            "right_subspace_overlap_bottom_k": 84.15865325927734,
            "interaction_matrix_overlap_top_k": 81.01242065429688,
            "interaction_matrix_overlap_bottom_k": -21.186899185180664,
            "effective_rank": -12.172431945800781,
            "effective_rank_mergeability_score": -21.43813133239746,
            "stable_rank": -51.31786346435547,
            "spectral_gap": 55.970542907714844,
            "singular_value_ratio": 5.3521037101745605,
            "layerwise_effective_rank": 28.13033676147461,
            "layerwise_effective_rank_mergeability_score": -18.407222747802734,
            "singular_value_overlap": -18.410829544067383,
            "subspace_overlap": 60.269920349121094,
            "right_subspace_overlap": 54.414066314697266,
            "activation_l2_distance": -58.64801025390625,
            "activation_cosine_similarity": 11.139493942260742,
            "activation_magnitude_ratio": -53.108829498291016,
            "activation_dot_product": -80.69512176513672,
            "encoder_gradient_cosine_similarity": 4.7522759437561035,
            "encoder_gradient_l2_distance": -37.519683837890625,
            "encoder_gradient_dot_product": 31.39511489868164,
            "input_gradient_cosine_similarity": 36.4407844543457,
            "input_gradient_l2_distance": -30.021881103515625,
            "input_gradient_dot_product": -46.40047836303711
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4421929922388805,
          "val_r": 0.39406486231040067,
          "n_iterations": 603,
          "coefficients": {
            "right_subspace_overlap_top_k": 17.355365753173828,
            "right_subspace_overlap_bottom_k": 14.378504753112793,
            "interaction_matrix_overlap_top_k": 10.396254539489746,
            "interaction_matrix_overlap_bottom_k": 2.1700000762939453,
            "effective_rank": 12.658023834228516,
            "effective_rank_mergeability_score": 22.681196212768555,
            "stable_rank": -7.365971088409424,
            "spectral_gap": 13.907086372375488,
            "singular_value_ratio": 10.471515655517578,
            "layerwise_effective_rank": -1.238071322441101,
            "layerwise_effective_rank_mergeability_score": 8.139994621276855,
            "singular_value_overlap": -48.12273406982422,
            "subspace_overlap": 47.324546813964844,
            "right_subspace_overlap": 27.161867141723633,
            "activation_l2_distance": -25.9833927154541,
            "activation_cosine_similarity": 29.79199981689453,
            "activation_magnitude_ratio": -14.001786231994629,
            "activation_dot_product": -52.08904266357422,
            "encoder_gradient_cosine_similarity": 3.912843704223633,
            "encoder_gradient_l2_distance": -42.650245666503906,
            "encoder_gradient_dot_product": 22.450387954711914,
            "input_gradient_cosine_similarity": 24.668703079223633,
            "input_gradient_l2_distance": -39.548500061035156,
            "input_gradient_dot_product": -35.47105407714844
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.38276022582963476,
          "val_r": 0.3081010031950796,
          "n_iterations": 475,
          "coefficients": {
            "right_subspace_overlap_top_k": 25.277692794799805,
            "right_subspace_overlap_bottom_k": -14.299094200134277,
            "interaction_matrix_overlap_top_k": -7.595681667327881,
            "interaction_matrix_overlap_bottom_k": 68.19696807861328,
            "effective_rank": -33.69648742675781,
            "effective_rank_mergeability_score": 27.47527313232422,
            "stable_rank": -42.43592834472656,
            "spectral_gap": 29.531532287597656,
            "singular_value_ratio": 60.18963623046875,
            "layerwise_effective_rank": 5.780750274658203,
            "layerwise_effective_rank_mergeability_score": -41.560115814208984,
            "singular_value_overlap": -44.64156723022461,
            "subspace_overlap": 30.1988468170166,
            "right_subspace_overlap": 37.48487091064453,
            "activation_l2_distance": -14.74904727935791,
            "activation_cosine_similarity": 13.98790454864502,
            "activation_magnitude_ratio": -1.5310003757476807,
            "activation_dot_product": -23.74994468688965,
            "encoder_gradient_cosine_similarity": 10.117646217346191,
            "encoder_gradient_l2_distance": -66.71602630615234,
            "encoder_gradient_dot_product": -15.408079147338867,
            "input_gradient_cosine_similarity": 17.79145622253418,
            "input_gradient_l2_distance": 5.573187828063965,
            "input_gradient_dot_product": -24.225910186767578
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.3949547279027246,
          "val_r": 0.4511864319448954,
          "n_iterations": 438,
          "coefficients": {
            "right_subspace_overlap_top_k": 37.78691864013672,
            "right_subspace_overlap_bottom_k": 23.237815856933594,
            "interaction_matrix_overlap_top_k": -28.129459381103516,
            "interaction_matrix_overlap_bottom_k": 86.78421783447266,
            "effective_rank": 35.746055603027344,
            "effective_rank_mergeability_score": 82.93053436279297,
            "stable_rank": 19.864032745361328,
            "spectral_gap": 33.519859313964844,
            "singular_value_ratio": 12.763982772827148,
            "layerwise_effective_rank": -24.520980834960938,
            "layerwise_effective_rank_mergeability_score": -11.397705078125,
            "singular_value_overlap": -18.247467041015625,
            "subspace_overlap": 52.35498046875,
            "right_subspace_overlap": 55.422611236572266,
            "activation_l2_distance": -83.43352508544922,
            "activation_cosine_similarity": 1.5081106424331665,
            "activation_magnitude_ratio": -84.55077362060547,
            "activation_dot_product": -77.0965576171875,
            "encoder_gradient_cosine_similarity": 41.216129302978516,
            "encoder_gradient_l2_distance": 9.578646659851074,
            "encoder_gradient_dot_product": -12.242634773254395,
            "input_gradient_cosine_similarity": -6.257050514221191,
            "input_gradient_l2_distance": -100.20965576171875,
            "input_gradient_dot_product": -45.631507873535156
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.4941370630308177,
          "val_r": 0.09608779832622288,
          "n_iterations": 595,
          "coefficients": {
            "right_subspace_overlap_top_k": 42.21785354614258,
            "right_subspace_overlap_bottom_k": 21.72258949279785,
            "interaction_matrix_overlap_top_k": 7.037164211273193,
            "interaction_matrix_overlap_bottom_k": 23.771852493286133,
            "effective_rank": 29.25082778930664,
            "effective_rank_mergeability_score": 22.007278442382812,
            "stable_rank": -4.7875657081604,
            "spectral_gap": 29.655988693237305,
            "singular_value_ratio": 9.410063743591309,
            "layerwise_effective_rank": -38.167808532714844,
            "layerwise_effective_rank_mergeability_score": -17.30375099182129,
            "singular_value_overlap": -70.01484680175781,
            "subspace_overlap": 0.2286325991153717,
            "right_subspace_overlap": 7.519412994384766,
            "activation_l2_distance": -4.6738505363464355,
            "activation_cosine_similarity": 51.429229736328125,
            "activation_magnitude_ratio": 23.489835739135742,
            "activation_dot_product": -63.303985595703125,
            "encoder_gradient_cosine_similarity": 12.424308776855469,
            "encoder_gradient_l2_distance": -45.55799102783203,
            "encoder_gradient_dot_product": 21.73341178894043,
            "input_gradient_cosine_similarity": 23.800308227539062,
            "input_gradient_l2_distance": -57.91584014892578,
            "input_gradient_dot_product": -22.975618362426758
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.45976303417878306,
          "val_r": 0.1961409334054561,
          "n_iterations": 1000,
          "coefficients": {
            "right_subspace_overlap_top_k": 0.023010091856122017,
            "right_subspace_overlap_bottom_k": -0.42687609791755676,
            "interaction_matrix_overlap_top_k": 0.7812134027481079,
            "interaction_matrix_overlap_bottom_k": 1.9277104139328003,
            "effective_rank": 2.0342745780944824,
            "effective_rank_mergeability_score": 0.4068702757358551,
            "stable_rank": 0.5137621164321899,
            "spectral_gap": 1.3838332891464233,
            "singular_value_ratio": -0.1724242866039276,
            "layerwise_effective_rank": 0.37482741475105286,
            "layerwise_effective_rank_mergeability_score": 1.707295536994934,
            "singular_value_overlap": -1.9705241918563843,
            "subspace_overlap": 0.913504958152771,
            "right_subspace_overlap": -0.007917307317256927,
            "activation_l2_distance": -1.773064374923706,
            "activation_cosine_similarity": 1.2111581563949585,
            "activation_magnitude_ratio": -0.756436288356781,
            "activation_dot_product": -3.056039810180664,
            "encoder_gradient_cosine_similarity": 0.1280798614025116,
            "encoder_gradient_l2_distance": -1.090460181236267,
            "encoder_gradient_dot_product": 0.09625506401062012,
            "input_gradient_cosine_similarity": 0.21609137952327728,
            "input_gradient_l2_distance": -1.2043458223342896,
            "input_gradient_dot_product": -0.25990623235702515
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.44850777758719695,
          "val_r": 0.04771284145232177,
          "n_iterations": 521,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.93059253692627,
            "right_subspace_overlap_bottom_k": 24.583871841430664,
            "interaction_matrix_overlap_top_k": 21.873687744140625,
            "interaction_matrix_overlap_bottom_k": 5.531846523284912,
            "effective_rank": -6.752991676330566,
            "effective_rank_mergeability_score": 33.286190032958984,
            "stable_rank": -7.012603282928467,
            "spectral_gap": -5.662708282470703,
            "singular_value_ratio": 4.281495094299316,
            "layerwise_effective_rank": 15.589825630187988,
            "layerwise_effective_rank_mergeability_score": 10.474573135375977,
            "singular_value_overlap": -40.02949523925781,
            "subspace_overlap": 22.641496658325195,
            "right_subspace_overlap": 17.908733367919922,
            "activation_l2_distance": -22.678186416625977,
            "activation_cosine_similarity": 17.4051513671875,
            "activation_magnitude_ratio": -7.117465019226074,
            "activation_dot_product": -46.49014663696289,
            "encoder_gradient_cosine_similarity": 26.58070182800293,
            "encoder_gradient_l2_distance": -30.390758514404297,
            "encoder_gradient_dot_product": 21.32163429260254,
            "input_gradient_cosine_similarity": 2.978970527648926,
            "input_gradient_l2_distance": -34.159671783447266,
            "input_gradient_dot_product": -33.09768295288086
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.4399117742293768,
          "val_r": 0.4170922740076364,
          "n_iterations": 563,
          "coefficients": {
            "right_subspace_overlap_top_k": 15.444375038146973,
            "right_subspace_overlap_bottom_k": 44.11532974243164,
            "interaction_matrix_overlap_top_k": 16.940567016601562,
            "interaction_matrix_overlap_bottom_k": 17.822551727294922,
            "effective_rank": -29.48676872253418,
            "effective_rank_mergeability_score": 10.830028533935547,
            "stable_rank": 39.97486114501953,
            "spectral_gap": 76.67321014404297,
            "singular_value_ratio": 51.67594909667969,
            "layerwise_effective_rank": -14.302372932434082,
            "layerwise_effective_rank_mergeability_score": -3.837223768234253,
            "singular_value_overlap": -30.162437438964844,
            "subspace_overlap": -18.739665985107422,
            "right_subspace_overlap": 45.01473617553711,
            "activation_l2_distance": -36.67196273803711,
            "activation_cosine_similarity": -4.120615482330322,
            "activation_magnitude_ratio": -22.240224838256836,
            "activation_dot_product": -25.388446807861328,
            "encoder_gradient_cosine_similarity": 9.833162307739258,
            "encoder_gradient_l2_distance": -32.83637237548828,
            "encoder_gradient_dot_product": 18.619789123535156,
            "input_gradient_cosine_similarity": -1.407348394393921,
            "input_gradient_l2_distance": -48.00542068481445,
            "input_gradient_dot_product": -78.74835205078125
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.45199755082894433,
          "val_r": 0.40381550180025655,
          "n_iterations": 502,
          "coefficients": {
            "right_subspace_overlap_top_k": 2.9033381938934326,
            "right_subspace_overlap_bottom_k": 9.47927474975586,
            "interaction_matrix_overlap_top_k": 8.988037109375,
            "interaction_matrix_overlap_bottom_k": 27.559396743774414,
            "effective_rank": -17.586946487426758,
            "effective_rank_mergeability_score": 1.8171942234039307,
            "stable_rank": 14.799571990966797,
            "spectral_gap": 4.701232433319092,
            "singular_value_ratio": -17.79917335510254,
            "layerwise_effective_rank": 19.700664520263672,
            "layerwise_effective_rank_mergeability_score": 5.86049747467041,
            "singular_value_overlap": -25.10976791381836,
            "subspace_overlap": 1.460201382637024,
            "right_subspace_overlap": 10.945161819458008,
            "activation_l2_distance": -3.699244976043701,
            "activation_cosine_similarity": 18.440561294555664,
            "activation_magnitude_ratio": -7.668326377868652,
            "activation_dot_product": -18.665002822875977,
            "encoder_gradient_cosine_similarity": -4.756895542144775,
            "encoder_gradient_l2_distance": -9.940494537353516,
            "encoder_gradient_dot_product": 0.3771572709083557,
            "input_gradient_cosine_similarity": 19.08604621887207,
            "input_gradient_l2_distance": -21.37872886657715,
            "input_gradient_dot_product": -18.516618728637695
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.4063415446816754,
          "val_r": 0.35974223641573433,
          "n_iterations": 507,
          "coefficients": {
            "right_subspace_overlap_top_k": 40.298336029052734,
            "right_subspace_overlap_bottom_k": 29.989171981811523,
            "interaction_matrix_overlap_top_k": -5.169058799743652,
            "interaction_matrix_overlap_bottom_k": 64.34332275390625,
            "effective_rank": 16.091611862182617,
            "effective_rank_mergeability_score": 30.90460777282715,
            "stable_rank": -8.322002410888672,
            "spectral_gap": 0.3884178400039673,
            "singular_value_ratio": -38.447242736816406,
            "layerwise_effective_rank": 32.210472106933594,
            "layerwise_effective_rank_mergeability_score": 2.3757429122924805,
            "singular_value_overlap": -1.7474082708358765,
            "subspace_overlap": 10.34628963470459,
            "right_subspace_overlap": -23.81633186340332,
            "activation_l2_distance": -0.8883248567581177,
            "activation_cosine_similarity": 30.882099151611328,
            "activation_magnitude_ratio": -32.45075988769531,
            "activation_dot_product": -27.414575576782227,
            "encoder_gradient_cosine_similarity": -0.026741307228803635,
            "encoder_gradient_l2_distance": -41.99982833862305,
            "encoder_gradient_dot_product": 9.731099128723145,
            "input_gradient_cosine_similarity": 11.4453125,
            "input_gradient_l2_distance": -48.337581634521484,
            "input_gradient_dot_product": -49.38956069946289
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.3687533393814055,
          "val_r": 0.27852153847816385,
          "n_iterations": 553,
          "coefficients": {
            "right_subspace_overlap_top_k": 3.466433525085449,
            "right_subspace_overlap_bottom_k": 67.83865356445312,
            "interaction_matrix_overlap_top_k": 49.94436264038086,
            "interaction_matrix_overlap_bottom_k": 59.65804672241211,
            "effective_rank": -23.707704544067383,
            "effective_rank_mergeability_score": -54.36846923828125,
            "stable_rank": 11.848012924194336,
            "spectral_gap": 51.69320297241211,
            "singular_value_ratio": -24.316648483276367,
            "layerwise_effective_rank": 19.451618194580078,
            "layerwise_effective_rank_mergeability_score": 29.093839645385742,
            "singular_value_overlap": -12.033036231994629,
            "subspace_overlap": -38.29495620727539,
            "right_subspace_overlap": -25.492273330688477,
            "activation_l2_distance": 16.39139175415039,
            "activation_cosine_similarity": 77.45496368408203,
            "activation_magnitude_ratio": -56.10853576660156,
            "activation_dot_product": -49.722068786621094,
            "encoder_gradient_cosine_similarity": 33.8871955871582,
            "encoder_gradient_l2_distance": -97.4527587890625,
            "encoder_gradient_dot_product": 8.327323913574219,
            "input_gradient_cosine_similarity": 19.240535736083984,
            "input_gradient_l2_distance": -41.1217155456543,
            "input_gradient_dot_product": -24.680152893066406
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.35919680251261393,
          "val_r": 0.5894442101791246,
          "n_iterations": 303,
          "coefficients": {
            "right_subspace_overlap_top_k": -16.410951614379883,
            "right_subspace_overlap_bottom_k": 81.03678894042969,
            "interaction_matrix_overlap_top_k": 42.27745056152344,
            "interaction_matrix_overlap_bottom_k": 17.62109375,
            "effective_rank": 114.89959716796875,
            "effective_rank_mergeability_score": 57.00475311279297,
            "stable_rank": -32.58989334106445,
            "spectral_gap": -31.696826934814453,
            "singular_value_ratio": -84.35101318359375,
            "layerwise_effective_rank": -27.775333404541016,
            "layerwise_effective_rank_mergeability_score": -6.897517681121826,
            "singular_value_overlap": -58.33610534667969,
            "subspace_overlap": -13.934611320495605,
            "right_subspace_overlap": 78.520263671875,
            "activation_l2_distance": -52.31865310668945,
            "activation_cosine_similarity": -24.300621032714844,
            "activation_magnitude_ratio": -14.803442001342773,
            "activation_dot_product": -10.841208457946777,
            "encoder_gradient_cosine_similarity": -2.254340887069702,
            "encoder_gradient_l2_distance": -71.46804809570312,
            "encoder_gradient_dot_product": 25.194156646728516,
            "input_gradient_cosine_similarity": 26.20003890991211,
            "input_gradient_l2_distance": 2.2926950454711914,
            "input_gradient_dot_product": 3.9269959926605225
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.2673664886066269,
          "val_r": 0.3808156455637258,
          "n_iterations": 606,
          "coefficients": {
            "right_subspace_overlap_top_k": 6.143454551696777,
            "right_subspace_overlap_bottom_k": 82.4398193359375,
            "interaction_matrix_overlap_top_k": 29.96533203125,
            "interaction_matrix_overlap_bottom_k": 2.3256497383117676,
            "effective_rank": -64.46756744384766,
            "effective_rank_mergeability_score": -8.196802139282227,
            "stable_rank": -65.5322036743164,
            "spectral_gap": -34.33961868286133,
            "singular_value_ratio": -23.733867645263672,
            "layerwise_effective_rank": 18.925174713134766,
            "layerwise_effective_rank_mergeability_score": 23.63319969177246,
            "singular_value_overlap": -22.140737533569336,
            "subspace_overlap": 53.08012771606445,
            "right_subspace_overlap": 99.69469451904297,
            "activation_l2_distance": -37.061614990234375,
            "activation_cosine_similarity": -19.45453453063965,
            "activation_magnitude_ratio": -13.738645553588867,
            "activation_dot_product": 15.18479061126709,
            "encoder_gradient_cosine_similarity": 21.5302677154541,
            "encoder_gradient_l2_distance": 7.403499603271484,
            "encoder_gradient_dot_product": -39.81175231933594,
            "input_gradient_cosine_similarity": 31.922622680664062,
            "input_gradient_l2_distance": -19.873441696166992,
            "input_gradient_dot_product": -42.9005241394043
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.3951693172952636,
          "val_r": 0.3846924410985273,
          "n_iterations": 576,
          "coefficients": {
            "right_subspace_overlap_top_k": 9.337300300598145,
            "right_subspace_overlap_bottom_k": 27.165311813354492,
            "interaction_matrix_overlap_top_k": 21.39183235168457,
            "interaction_matrix_overlap_bottom_k": 31.298091888427734,
            "effective_rank": -28.13469886779785,
            "effective_rank_mergeability_score": 11.144755363464355,
            "stable_rank": 2.716564655303955,
            "spectral_gap": 40.0201416015625,
            "singular_value_ratio": 34.665740966796875,
            "layerwise_effective_rank": 6.074166774749756,
            "layerwise_effective_rank_mergeability_score": 5.992241859436035,
            "singular_value_overlap": -48.275970458984375,
            "subspace_overlap": -14.583415031433105,
            "right_subspace_overlap": 49.43265914916992,
            "activation_l2_distance": 5.978150844573975,
            "activation_cosine_similarity": 24.906951904296875,
            "activation_magnitude_ratio": -5.613810062408447,
            "activation_dot_product": -7.502982139587402,
            "encoder_gradient_cosine_similarity": -5.451595306396484,
            "encoder_gradient_l2_distance": -28.208993911743164,
            "encoder_gradient_dot_product": -43.13862228393555,
            "input_gradient_cosine_similarity": 23.822080612182617,
            "input_gradient_l2_distance": -58.74522399902344,
            "input_gradient_dot_product": -53.29322052001953
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.38576117830802437,
          "val_r": 0.3738107323155557,
          "n_iterations": 405,
          "coefficients": {
            "right_subspace_overlap_top_k": 10.10191822052002,
            "right_subspace_overlap_bottom_k": 56.86296844482422,
            "interaction_matrix_overlap_top_k": 51.88310241699219,
            "interaction_matrix_overlap_bottom_k": 32.76401901245117,
            "effective_rank": -4.260359287261963,
            "effective_rank_mergeability_score": 3.063633441925049,
            "stable_rank": 11.038808822631836,
            "spectral_gap": 15.563023567199707,
            "singular_value_ratio": -15.716529846191406,
            "layerwise_effective_rank": -24.115097045898438,
            "layerwise_effective_rank_mergeability_score": -4.898578643798828,
            "singular_value_overlap": -38.755802154541016,
            "subspace_overlap": 9.587625503540039,
            "right_subspace_overlap": -0.18561439216136932,
            "activation_l2_distance": -15.460369110107422,
            "activation_cosine_similarity": -26.01104164123535,
            "activation_magnitude_ratio": 2.908951997756958,
            "activation_dot_product": 18.5849609375,
            "encoder_gradient_cosine_similarity": 9.681266784667969,
            "encoder_gradient_l2_distance": -30.832170486450195,
            "encoder_gradient_dot_product": 14.634305000305176,
            "input_gradient_cosine_similarity": 14.958735466003418,
            "input_gradient_l2_distance": -32.92957305908203,
            "input_gradient_dot_product": -57.471778869628906
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.45635313943387434,
          "val_r": 0.13872280707832646,
          "n_iterations": 643,
          "coefficients": {
            "right_subspace_overlap_top_k": 30.319732666015625,
            "right_subspace_overlap_bottom_k": 40.77039337158203,
            "interaction_matrix_overlap_top_k": 28.44640350341797,
            "interaction_matrix_overlap_bottom_k": 6.9890241622924805,
            "effective_rank": 6.501036643981934,
            "effective_rank_mergeability_score": 14.372530937194824,
            "stable_rank": -26.00762367248535,
            "spectral_gap": 18.121007919311523,
            "singular_value_ratio": -2.32293438911438,
            "layerwise_effective_rank": 14.17103385925293,
            "layerwise_effective_rank_mergeability_score": 1.967625379562378,
            "singular_value_overlap": -51.66890335083008,
            "subspace_overlap": 35.096431732177734,
            "right_subspace_overlap": -7.414251804351807,
            "activation_l2_distance": -27.333160400390625,
            "activation_cosine_similarity": 0.38295748829841614,
            "activation_magnitude_ratio": 7.129226207733154,
            "activation_dot_product": -5.118483066558838,
            "encoder_gradient_cosine_similarity": 6.703526973724365,
            "encoder_gradient_l2_distance": -40.34563064575195,
            "encoder_gradient_dot_product": 3.0843594074249268,
            "input_gradient_cosine_similarity": 27.30048942565918,
            "input_gradient_l2_distance": -53.88762664794922,
            "input_gradient_dot_product": -26.25958251953125
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7075522216576059,
          "val_r": 0.4976647660198655,
          "n_iterations": 856,
          "coefficients": {
            "right_subspace_overlap_top_k": 22.010971069335938,
            "right_subspace_overlap_bottom_k": 7.632535457611084,
            "interaction_matrix_overlap_top_k": 19.31400489807129,
            "interaction_matrix_overlap_bottom_k": -7.665547847747803,
            "effective_rank": -1.883679747581482,
            "effective_rank_mergeability_score": 11.876880645751953,
            "stable_rank": -4.3805718421936035,
            "spectral_gap": -0.6980230808258057,
            "singular_value_ratio": 0.3923068642616272,
            "layerwise_effective_rank": 4.131041526794434,
            "layerwise_effective_rank_mergeability_score": 2.466278076171875,
            "singular_value_overlap": -14.192687034606934,
            "subspace_overlap": -6.545577049255371,
            "right_subspace_overlap": 7.701757431030273,
            "activation_l2_distance": 8.830185890197754,
            "activation_cosine_similarity": 21.284833908081055,
            "activation_magnitude_ratio": -9.440481185913086,
            "activation_dot_product": 3.4666202068328857,
            "encoder_gradient_cosine_similarity": 8.918931007385254,
            "encoder_gradient_l2_distance": -36.4274787902832,
            "encoder_gradient_dot_product": -1.9242652654647827,
            "input_gradient_cosine_similarity": 5.118567943572998,
            "input_gradient_l2_distance": -23.149394989013672,
            "input_gradient_dot_product": -15.838983535766602
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4170839687451148,
          "val_r": 0.008042791849064812,
          "n_iterations": 432,
          "coefficients": {
            "right_subspace_overlap_top_k": -48.22069549560547,
            "right_subspace_overlap_bottom_k": 38.73475646972656,
            "interaction_matrix_overlap_top_k": 22.67664909362793,
            "interaction_matrix_overlap_bottom_k": 48.699039459228516,
            "effective_rank": -25.078266143798828,
            "effective_rank_mergeability_score": 9.330804824829102,
            "stable_rank": 20.579208374023438,
            "spectral_gap": 40.694374084472656,
            "singular_value_ratio": -13.552813529968262,
            "layerwise_effective_rank": 3.1499087810516357,
            "layerwise_effective_rank_mergeability_score": -12.302857398986816,
            "singular_value_overlap": -44.142147064208984,
            "subspace_overlap": 12.766984939575195,
            "right_subspace_overlap": 39.50187683105469,
            "activation_l2_distance": -35.654632568359375,
            "activation_cosine_similarity": -40.60790252685547,
            "activation_magnitude_ratio": 37.1812858581543,
            "activation_dot_product": 21.08609390258789,
            "encoder_gradient_cosine_similarity": 6.365538120269775,
            "encoder_gradient_l2_distance": -52.041622161865234,
            "encoder_gradient_dot_product": 42.08221435546875,
            "input_gradient_cosine_similarity": 31.6368408203125,
            "input_gradient_l2_distance": -51.37989807128906,
            "input_gradient_dot_product": -50.508155822753906
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    }
  }
}