{
  "aggregate_metrics": {
    "train_r": 0.24321332424059944,
    "train_p": 1.3356030775018332e-44,
    "val_r": 0.16969554671155934,
    "val_p": 0.0012686993272305021
  },
  "per_fold_stats": {
    "train_r_mean": 0.6737788837351036,
    "train_r_std": 0.16036575846408999,
    "val_r_mean": 0.5032944983265961,
    "val_r_std": 0.24533633061389143
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 29.923198699951172,
    "right_subspace_overlap_bottom_k": -10.144109725952148,
    "interaction_matrix_overlap_top_k": 12.671030044555664,
    "interaction_matrix_overlap_bottom_k": -0.8807390332221985,
    "effective_rank": 0.29870548844337463,
    "effective_rank_mergeability_score": -1.990128755569458,
    "stable_rank": -5.9369049072265625,
    "spectral_gap": -5.73242712020874,
    "singular_value_ratio": -15.533482551574707,
    "layerwise_effective_rank": -2.445176362991333,
    "layerwise_effective_rank_mergeability_score": -5.340041637420654,
    "singular_value_overlap": 4.114165782928467,
    "subspace_overlap": 5.891267776489258,
    "right_subspace_overlap": 5.781153202056885,
    "activation_l2_distance": -9.188437461853027,
    "activation_cosine_similarity": 21.343982696533203,
    "activation_magnitude_ratio": -10.236796379089355,
    "activation_dot_product": 14.112627029418945,
    "encoder_gradient_cosine_similarity": 20.656883239746094,
    "encoder_gradient_l2_distance": -20.630489349365234,
    "encoder_gradient_dot_product": 5.564703941345215,
    "input_gradient_cosine_similarity": 22.066795349121094,
    "input_gradient_l2_distance": -25.119680404663086,
    "input_gradient_dot_product": -28.24483871459961
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 67.34864044189453,
    "right_subspace_overlap_bottom_k": 18.757143020629883,
    "interaction_matrix_overlap_top_k": 24.30814552307129,
    "interaction_matrix_overlap_bottom_k": 57.056427001953125,
    "effective_rank": 17.388412475585938,
    "effective_rank_mergeability_score": 29.018451690673828,
    "stable_rank": 33.6640739440918,
    "spectral_gap": 28.734027862548828,
    "singular_value_ratio": 75.260009765625,
    "layerwise_effective_rank": 16.16051483154297,
    "layerwise_effective_rank_mergeability_score": 57.31739807128906,
    "singular_value_overlap": 10.781160354614258,
    "subspace_overlap": 15.491127967834473,
    "right_subspace_overlap": 21.175626754760742,
    "activation_l2_distance": 19.662403106689453,
    "activation_cosine_similarity": 53.65087890625,
    "activation_magnitude_ratio": 22.500125885009766,
    "activation_dot_product": 25.764963150024414,
    "encoder_gradient_cosine_similarity": 46.81007766723633,
    "encoder_gradient_l2_distance": 19.402572631835938,
    "encoder_gradient_dot_product": 12.72139835357666,
    "input_gradient_cosine_similarity": 67.79020690917969,
    "input_gradient_l2_distance": 22.032320022583008,
    "input_gradient_dot_product": 59.38526153564453
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7121420910281249,
      "val_r": 0.5031965450847742,
      "n_iterations": 977,
      "coefficients": {
        "right_subspace_overlap_top_k": 35.53596496582031,
        "right_subspace_overlap_bottom_k": -19.701066970825195,
        "interaction_matrix_overlap_top_k": -2.7738521099090576,
        "interaction_matrix_overlap_bottom_k": 0.5659106373786926,
        "effective_rank": -8.596423149108887,
        "effective_rank_mergeability_score": 3.937828540802002,
        "stable_rank": -7.490433216094971,
        "spectral_gap": 5.257785797119141,
        "singular_value_ratio": 7.523526668548584,
        "layerwise_effective_rank": 12.240213394165039,
        "layerwise_effective_rank_mergeability_score": -2.605897903442383,
        "singular_value_overlap": -0.8168977499008179,
        "subspace_overlap": -6.567772388458252,
        "right_subspace_overlap": 5.598260402679443,
        "activation_l2_distance": 4.064518928527832,
        "activation_cosine_similarity": 32.83512878417969,
        "activation_magnitude_ratio": -8.837263107299805,
        "activation_dot_product": 1.9137041568756104,
        "encoder_gradient_cosine_similarity": 5.976358890533447,
        "encoder_gradient_l2_distance": -5.630343914031982,
        "encoder_gradient_dot_product": 6.704716205596924,
        "input_gradient_cosine_similarity": 10.443083763122559,
        "input_gradient_l2_distance": -44.40338897705078,
        "input_gradient_dot_product": -24.175195693969727
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7161444051404551,
      "val_r": 0.8040140366427124,
      "n_iterations": 979,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.5078394412994385,
        "right_subspace_overlap_bottom_k": -5.487580299377441,
        "interaction_matrix_overlap_top_k": 3.3367135524749756,
        "interaction_matrix_overlap_bottom_k": -8.533060073852539,
        "effective_rank": 3.072209358215332,
        "effective_rank_mergeability_score": 7.508904933929443,
        "stable_rank": 2.0721728801727295,
        "spectral_gap": 18.27300262451172,
        "singular_value_ratio": 16.549415588378906,
        "layerwise_effective_rank": -8.61815071105957,
        "layerwise_effective_rank_mergeability_score": -6.847635746002197,
        "singular_value_overlap": 3.5723516941070557,
        "subspace_overlap": -3.769291639328003,
        "right_subspace_overlap": 14.920522689819336,
        "activation_l2_distance": -8.849101066589355,
        "activation_cosine_similarity": 1.6945377588272095,
        "activation_magnitude_ratio": -1.827242136001587,
        "activation_dot_product": 13.829036712646484,
        "encoder_gradient_cosine_similarity": 4.935365676879883,
        "encoder_gradient_l2_distance": -29.951974868774414,
        "encoder_gradient_dot_product": 4.715671539306641,
        "input_gradient_cosine_similarity": 4.4250288009643555,
        "input_gradient_l2_distance": -17.157360076904297,
        "input_gradient_dot_product": -10.372819900512695
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7264945881000596,
      "val_r": 0.7122515302116154,
      "n_iterations": 685,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.600981712341309,
        "right_subspace_overlap_bottom_k": -16.713817596435547,
        "interaction_matrix_overlap_top_k": 24.072681427001953,
        "interaction_matrix_overlap_bottom_k": -16.683923721313477,
        "effective_rank": -2.1806037425994873,
        "effective_rank_mergeability_score": 10.108807563781738,
        "stable_rank": -3.294917345046997,
        "spectral_gap": 4.818902969360352,
        "singular_value_ratio": 9.169554710388184,
        "layerwise_effective_rank": -7.836231708526611,
        "layerwise_effective_rank_mergeability_score": -9.69926643371582,
        "singular_value_overlap": 2.4161126613616943,
        "subspace_overlap": 9.4708251953125,
        "right_subspace_overlap": 14.486412048339844,
        "activation_l2_distance": 1.059071660041809,
        "activation_cosine_similarity": 23.213523864746094,
        "activation_magnitude_ratio": -7.008007049560547,
        "activation_dot_product": 17.1151123046875,
        "encoder_gradient_cosine_similarity": 8.495945930480957,
        "encoder_gradient_l2_distance": -40.81058883666992,
        "encoder_gradient_dot_product": 7.379431247711182,
        "input_gradient_cosine_similarity": 12.342602729797363,
        "input_gradient_l2_distance": -24.949092864990234,
        "input_gradient_dot_product": -24.575773239135742
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.2989723700349547,
      "val_r": 0.202461301381188,
      "n_iterations": 822,
      "coefficients": {
        "right_subspace_overlap_top_k": 311.9278564453125,
        "right_subspace_overlap_bottom_k": 45.13705062866211,
        "interaction_matrix_overlap_top_k": 105.15354919433594,
        "interaction_matrix_overlap_bottom_k": 231.79421997070312,
        "effective_rank": -50.411582946777344,
        "effective_rank_mergeability_score": -109.51924896240234,
        "stable_rank": -148.86453247070312,
        "spectral_gap": -126.84222412109375,
        "singular_value_ratio": -341.222412109375,
        "layerwise_effective_rank": -37.82576370239258,
        "layerwise_effective_rank_mergeability_score": -245.3921661376953,
        "singular_value_overlap": 47.64558410644531,
        "subspace_overlap": -11.218626976013184,
        "right_subspace_overlap": -52.072044372558594,
        "activation_l2_distance": -45.746456146240234,
        "activation_cosine_similarity": 250.0570068359375,
        "activation_magnitude_ratio": -94.69527435302734,
        "activation_dot_product": 121.43932342529297,
        "encoder_gradient_cosine_similarity": 219.2974090576172,
        "encoder_gradient_l2_distance": -1.9678473472595215,
        "encoder_gradient_dot_product": -26.97553253173828,
        "input_gradient_cosine_similarity": 316.4059753417969,
        "input_gradient_l2_distance": -73.4978256225586,
        "input_gradient_dot_product": -281.6084289550781
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7275762120087739,
      "val_r": 0.7122774142914976,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.74330997467041,
        "right_subspace_overlap_bottom_k": -11.175572395324707,
        "interaction_matrix_overlap_top_k": -2.095107078552246,
        "interaction_matrix_overlap_bottom_k": -4.09853982925415,
        "effective_rank": -2.9909744262695312,
        "effective_rank_mergeability_score": 1.4379851818084717,
        "stable_rank": 0.6595509052276611,
        "spectral_gap": 3.330216646194458,
        "singular_value_ratio": 4.384298801422119,
        "layerwise_effective_rank": 2.417710065841675,
        "layerwise_effective_rank_mergeability_score": 2.4904303550720215,
        "singular_value_overlap": 1.328108310699463,
        "subspace_overlap": -1.498388648033142,
        "right_subspace_overlap": 13.948307037353516,
        "activation_l2_distance": -2.338834047317505,
        "activation_cosine_similarity": 8.606063842773438,
        "activation_magnitude_ratio": -1.063188910484314,
        "activation_dot_product": 6.316108226776123,
        "encoder_gradient_cosine_similarity": 4.851066589355469,
        "encoder_gradient_l2_distance": -15.326361656188965,
        "encoder_gradient_dot_product": 4.251776695251465,
        "input_gradient_cosine_similarity": 4.29746150970459,
        "input_gradient_l2_distance": -16.542911529541016,
        "input_gradient_dot_product": -9.933989524841309
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.13459628869023982,
      "val_r": 0.059729777568229156,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.3807962238788605,
        "right_subspace_overlap_bottom_k": -0.5065087080001831,
        "interaction_matrix_overlap_top_k": -0.3801059126853943,
        "interaction_matrix_overlap_bottom_k": -0.6223934292793274,
        "effective_rank": 0.471926212310791,
        "effective_rank_mergeability_score": 0.5102970004081726,
        "stable_rank": -0.36171892285346985,
        "spectral_gap": 0.5695211887359619,
        "singular_value_ratio": -0.2251194417476654,
        "layerwise_effective_rank": -0.3297889828681946,
        "layerwise_effective_rank_mergeability_score": 0.3796103894710541,
        "singular_value_overlap": 0.12687671184539795,
        "subspace_overlap": 0.1779066026210785,
        "right_subspace_overlap": -0.42596760392189026,
        "activation_l2_distance": 0.5048025846481323,
        "activation_cosine_similarity": 0.45081713795661926,
        "activation_magnitude_ratio": -0.3131135404109955,
        "activation_dot_product": 0.012651152908802032,
        "encoder_gradient_cosine_similarity": 0.4039915204048157,
        "encoder_gradient_l2_distance": -0.12845169007778168,
        "encoder_gradient_dot_product": -0.0031546251848340034,
        "input_gradient_cosine_similarity": 0.42448848485946655,
        "input_gradient_l2_distance": -0.025794606655836105,
        "input_gradient_dot_product": -0.03583447262644768
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.6917316526095062,
      "val_r": 0.45839049914647345,
      "n_iterations": 893,
      "coefficients": {
        "right_subspace_overlap_top_k": 77.24364471435547,
        "right_subspace_overlap_bottom_k": -24.72637367248535,
        "interaction_matrix_overlap_top_k": 29.249021530151367,
        "interaction_matrix_overlap_bottom_k": -65.5291976928711,
        "effective_rank": 0.4337623119354248,
        "effective_rank_mergeability_score": -4.642549991607666,
        "stable_rank": 17.224390029907227,
        "spectral_gap": 4.602863311767578,
        "singular_value_ratio": -6.579765319824219,
        "layerwise_effective_rank": 17.633310317993164,
        "layerwise_effective_rank_mergeability_score": 41.494720458984375,
        "singular_value_overlap": -2.2937068939208984,
        "subspace_overlap": -2.3058359622955322,
        "right_subspace_overlap": -5.820679187774658,
        "activation_l2_distance": -31.986656188964844,
        "activation_cosine_similarity": 1.4521076679229736,
        "activation_magnitude_ratio": 0.835326075553894,
        "activation_dot_product": 4.030367374420166,
        "encoder_gradient_cosine_similarity": 45.46967315673828,
        "encoder_gradient_l2_distance": -36.74824905395508,
        "encoder_gradient_dot_product": 38.60593032836914,
        "input_gradient_cosine_similarity": -0.1472739428281784,
        "input_gradient_l2_distance": -63.123722076416016,
        "input_gradient_dot_product": -33.3727912902832
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7818637858192218,
      "val_r": 0.4260946254949668,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.45489510893821716,
        "right_subspace_overlap_bottom_k": -3.1078853607177734,
        "interaction_matrix_overlap_top_k": -1.5976710319519043,
        "interaction_matrix_overlap_bottom_k": 2.990208864212036,
        "effective_rank": 0.6338799595832825,
        "effective_rank_mergeability_score": -0.6311330795288086,
        "stable_rank": -0.75898277759552,
        "spectral_gap": 0.31910276412963867,
        "singular_value_ratio": 0.4269951581954956,
        "layerwise_effective_rank": 0.06873010098934174,
        "layerwise_effective_rank_mergeability_score": 0.6910304427146912,
        "singular_value_overlap": -0.0967569500207901,
        "subspace_overlap": 0.39181092381477356,
        "right_subspace_overlap": 0.8015221953392029,
        "activation_l2_distance": 0.3543247878551483,
        "activation_cosine_similarity": 0.7631135582923889,
        "activation_magnitude_ratio": -0.010478322394192219,
        "activation_dot_product": -0.1634347289800644,
        "encoder_gradient_cosine_similarity": 0.07551097869873047,
        "encoder_gradient_l2_distance": -0.5330403447151184,
        "encoder_gradient_dot_product": -0.029729001224040985,
        "input_gradient_cosine_similarity": 0.09932780265808105,
        "input_gradient_l2_distance": -0.20978917181491852,
        "input_gradient_dot_product": 0.06730777770280838
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7478160560521236,
      "val_r": 0.217864174673657,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.7945609092712402,
        "right_subspace_overlap_bottom_k": -25.162765502929688,
        "interaction_matrix_overlap_top_k": 7.995614528656006,
        "interaction_matrix_overlap_bottom_k": -3.7278048992156982,
        "effective_rank": -14.561978340148926,
        "effective_rank_mergeability_score": 14.486581802368164,
        "stable_rank": 11.727489471435547,
        "spectral_gap": -9.584914207458496,
        "singular_value_ratio": 6.56268310546875,
        "layerwise_effective_rank": -7.465231895446777,
        "layerwise_effective_rank_mergeability_score": 3.791034698486328,
        "singular_value_overlap": 2.8713247776031494,
        "subspace_overlap": 13.105937957763672,
        "right_subspace_overlap": 16.71063232421875,
        "activation_l2_distance": 0.6444698572158813,
        "activation_cosine_similarity": 20.6313419342041,
        "activation_magnitude_ratio": 4.034377098083496,
        "activation_dot_product": 4.431493282318115,
        "encoder_gradient_cosine_similarity": 13.93678092956543,
        "encoder_gradient_l2_distance": -15.592002868652344,
        "encoder_gradient_dot_product": 5.297479629516602,
        "input_gradient_cosine_similarity": 5.657290458679199,
        "input_gradient_l2_distance": -34.834327697753906,
        "input_gradient_dot_product": -19.16243553161621
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6705820876292603,
      "val_r": 0.5014903964166735,
      "n_iterations": 729,
      "coefficients": {
        "right_subspace_overlap_top_k": 26.607677459716797,
        "right_subspace_overlap_bottom_k": -11.914787292480469,
        "interaction_matrix_overlap_top_k": 30.35012435913086,
        "interaction_matrix_overlap_bottom_k": -33.19498062133789,
        "effective_rank": 3.809415340423584,
        "effective_rank_mergeability_score": 13.329366683959961,
        "stable_rank": 11.024301528930664,
        "spectral_gap": -9.303595542907715,
        "singular_value_ratio": -12.750418663024902,
        "layerwise_effective_rank": -18.13887596130371,
        "layerwise_effective_rank_mergeability_score": 3.674454927444458,
        "singular_value_overlap": 7.348223686218262,
        "subspace_overlap": 27.71588134765625,
        "right_subspace_overlap": 12.961286544799805,
        "activation_l2_distance": 11.432286262512207,
        "activation_cosine_similarity": -5.223141670227051,
        "activation_magnitude_ratio": -3.2267568111419678,
        "activation_dot_product": 16.9110050201416,
        "encoder_gradient_cosine_similarity": 26.364097595214844,
        "encoder_gradient_l2_distance": -31.817142486572266,
        "encoder_gradient_dot_product": 8.793128967285156,
        "input_gradient_cosine_similarity": 17.054567337036133,
        "input_gradient_l2_distance": -49.823219299316406,
        "input_gradient_dot_product": -40.98501968383789
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7722742329162947,
      "val_r": 0.2889026577503253,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.47611141204834,
        "right_subspace_overlap_bottom_k": -4.303760528564453,
        "interaction_matrix_overlap_top_k": 0.27359703183174133,
        "interaction_matrix_overlap_bottom_k": 1.1805673837661743,
        "effective_rank": 1.3466981649398804,
        "effective_rank_mergeability_score": 1.497442364692688,
        "stable_rank": -0.2796474099159241,
        "spectral_gap": 1.0534954071044922,
        "singular_value_ratio": 0.9219269752502441,
        "layerwise_effective_rank": -1.5359278917312622,
        "layerwise_effective_rank_mergeability_score": -1.125542402267456,
        "singular_value_overlap": 0.6607012748718262,
        "subspace_overlap": -3.660885810852051,
        "right_subspace_overlap": 2.4284980297088623,
        "activation_l2_distance": 1.1305280923843384,
        "activation_cosine_similarity": 6.780707359313965,
        "activation_magnitude_ratio": -0.5891835689544678,
        "activation_dot_product": 0.012958774343132973,
        "encoder_gradient_cosine_similarity": 0.6359961032867432,
        "encoder_gradient_l2_distance": -5.805887222290039,
        "encoder_gradient_dot_product": 0.5492598414421082,
        "input_gradient_cosine_similarity": 1.0021209716796875,
        "input_gradient_l2_distance": -3.4920358657836914,
        "input_gradient_dot_product": -1.1587938070297241
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7397700561386569,
      "val_r": 0.749096718583626,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.768495559692383,
        "right_subspace_overlap_bottom_k": 1.582855224609375,
        "interaction_matrix_overlap_top_k": -5.130660057067871,
        "interaction_matrix_overlap_bottom_k": -9.417582511901855,
        "effective_rank": -0.8531336188316345,
        "effective_rank_mergeability_score": 4.893632888793945,
        "stable_rank": -1.129515290260315,
        "spectral_gap": 0.16712096333503723,
        "singular_value_ratio": 1.7824628353118896,
        "layerwise_effective_rank": 2.404609441757202,
        "layerwise_effective_rank_mergeability_score": -1.640493392944336,
        "singular_value_overlap": 0.9443963766098022,
        "subspace_overlap": -0.09792424738407135,
        "right_subspace_overlap": 7.7312211990356445,
        "activation_l2_distance": 2.129016399383545,
        "activation_cosine_similarity": 8.574955940246582,
        "activation_magnitude_ratio": -1.305867075920105,
        "activation_dot_product": 3.7000293731689453,
        "encoder_gradient_cosine_similarity": 2.6545679569244385,
        "encoder_gradient_l2_distance": -12.875205039978027,
        "encoder_gradient_dot_product": 0.9881574511528015,
        "input_gradient_cosine_similarity": 2.785982370376587,
        "input_gradient_l2_distance": -9.402982711791992,
        "input_gradient_dot_product": -4.2554168701171875
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7966875251616099,
      "val_r": 0.7626395555446668,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5480037927627563,
        "right_subspace_overlap_bottom_k": -2.8323919773101807,
        "interaction_matrix_overlap_top_k": -1.2335162162780762,
        "interaction_matrix_overlap_bottom_k": 2.737562656402588,
        "effective_rank": 1.184205412864685,
        "effective_rank_mergeability_score": -0.41716742515563965,
        "stable_rank": -0.8158910870552063,
        "spectral_gap": -0.9980124831199646,
        "singular_value_ratio": -0.8607582449913025,
        "layerwise_effective_rank": 0.6119584441184998,
        "layerwise_effective_rank_mergeability_score": 1.533812165260315,
        "singular_value_overlap": -0.11926592141389847,
        "subspace_overlap": 0.37090468406677246,
        "right_subspace_overlap": 0.4189610481262207,
        "activation_l2_distance": 0.8216736316680908,
        "activation_cosine_similarity": 1.214774489402771,
        "activation_magnitude_ratio": 0.017830798402428627,
        "activation_dot_product": -0.19170476496219635,
        "encoder_gradient_cosine_similarity": 0.09833906590938568,
        "encoder_gradient_l2_distance": -0.48587435483932495,
        "encoder_gradient_dot_product": 0.03301704674959183,
        "input_gradient_cosine_similarity": 0.07800602912902832,
        "input_gradient_l2_distance": -0.5263983011245728,
        "input_gradient_dot_product": -0.19041362404823303
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7282262860523483,
      "val_r": 0.7153304585547655,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 13.79046630859375,
        "right_subspace_overlap_bottom_k": -3.930928945541382,
        "interaction_matrix_overlap_top_k": 7.266302585601807,
        "interaction_matrix_overlap_bottom_k": -6.84897518157959,
        "effective_rank": -2.666510820388794,
        "effective_rank_mergeability_score": 8.496403694152832,
        "stable_rank": 10.62496566772461,
        "spectral_gap": 4.915859222412109,
        "singular_value_ratio": 6.081844806671143,
        "layerwise_effective_rank": -2.370492696762085,
        "layerwise_effective_rank_mergeability_score": 3.3401083946228027,
        "singular_value_overlap": 1.2967160940170288,
        "subspace_overlap": 5.1389594078063965,
        "right_subspace_overlap": -8.335824012756348,
        "activation_l2_distance": -7.945807456970215,
        "activation_cosine_similarity": 5.257299900054932,
        "activation_magnitude_ratio": -2.3196468353271484,
        "activation_dot_product": 7.135577201843262,
        "encoder_gradient_cosine_similarity": 5.248079776763916,
        "encoder_gradient_l2_distance": -27.4298095703125,
        "encoder_gradient_dot_product": 1.8447003364562988,
        "input_gradient_cosine_similarity": 3.3921825885772705,
        "input_gradient_l2_distance": -9.769912719726562,
        "input_gradient_dot_product": -11.212986946105957
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7358682269909206,
      "val_r": 0.7996104084270184,
      "n_iterations": 898,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.2283237725496292,
        "right_subspace_overlap_bottom_k": -17.9476318359375,
        "interaction_matrix_overlap_top_k": 4.741369247436523,
        "interaction_matrix_overlap_bottom_k": 1.8543000221252441,
        "effective_rank": 1.9163018465042114,
        "effective_rank_mergeability_score": 7.818216323852539,
        "stable_rank": 11.073718070983887,
        "spectral_gap": 6.993395805358887,
        "singular_value_ratio": 2.345874547958374,
        "layerwise_effective_rank": -14.792780876159668,
        "layerwise_effective_rank_mergeability_score": -9.5382661819458,
        "singular_value_overlap": 2.371358633041382,
        "subspace_overlap": -1.5721869468688965,
        "right_subspace_overlap": 15.363202095031738,
        "activation_l2_distance": 3.214367151260376,
        "activation_cosine_similarity": 17.003461837768555,
        "activation_magnitude_ratio": -1.524810791015625,
        "activation_dot_product": 4.8718342781066895,
        "encoder_gradient_cosine_similarity": 4.106510639190674,
        "encoder_gradient_l2_distance": -28.54589080810547,
        "encoder_gradient_dot_product": 3.6236655712127686,
        "input_gradient_cosine_similarity": 4.402499675750732,
        "input_gradient_l2_distance": -9.796453475952148,
        "input_gradient_dot_product": -6.755390167236328
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7053617323157264,
      "val_r": 0.08280884063300056,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.120969295501709,
        "right_subspace_overlap_bottom_k": 8.792340278625488,
        "interaction_matrix_overlap_top_k": 3.2975170612335205,
        "interaction_matrix_overlap_bottom_k": -26.540075302124023,
        "effective_rank": -8.847957611083984,
        "effective_rank_mergeability_score": -9.152019500732422,
        "stable_rank": 2.232511043548584,
        "spectral_gap": -4.4024224281311035,
        "singular_value_ratio": 8.383139610290527,
        "layerwise_effective_rank": -24.907569885253906,
        "layerwise_effective_rank_mergeability_score": 2.193969249725342,
        "singular_value_overlap": 16.426998138427734,
        "subspace_overlap": 13.433082580566406,
        "right_subspace_overlap": 11.641752243041992,
        "activation_l2_distance": 15.777573585510254,
        "activation_cosine_similarity": 33.853614807128906,
        "activation_magnitude_ratio": -7.972553253173828,
        "activation_dot_product": 19.330171585083008,
        "encoder_gradient_cosine_similarity": 16.470516204833984,
        "encoder_gradient_l2_distance": -14.133688926696777,
        "encoder_gradient_dot_product": 8.256880760192871,
        "input_gradient_cosine_similarity": 6.45627498626709,
        "input_gradient_l2_distance": -41.669002532958984,
        "input_gradient_dot_product": -35.04356384277344
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7031081246212492,
      "val_r": 0.6777928525671546,
      "n_iterations": 936,
      "coefficients": {
        "right_subspace_overlap_top_k": 21.675466537475586,
        "right_subspace_overlap_bottom_k": -38.74187088012695,
        "interaction_matrix_overlap_top_k": -7.921904563903809,
        "interaction_matrix_overlap_bottom_k": -20.29034996032715,
        "effective_rank": 4.279170989990234,
        "effective_rank_mergeability_score": -5.2115960121154785,
        "stable_rank": -13.442952156066895,
        "spectral_gap": 12.543571472167969,
        "singular_value_ratio": 18.98656463623047,
        "layerwise_effective_rank": 34.61944580078125,
        "layerwise_effective_rank_mergeability_score": 39.31643295288086,
        "singular_value_overlap": -0.2811890244483948,
        "subspace_overlap": -0.7209911346435547,
        "right_subspace_overlap": 61.54486846923828,
        "activation_l2_distance": -40.64036560058594,
        "activation_cosine_similarity": 9.944061279296875,
        "activation_magnitude_ratio": -23.496051788330078,
        "activation_dot_product": 3.8622426986694336,
        "encoder_gradient_cosine_similarity": 15.758731842041016,
        "encoder_gradient_l2_distance": -84.12553405761719,
        "encoder_gradient_dot_product": 14.233826637268066,
        "input_gradient_cosine_similarity": 11.472973823547363,
        "input_gradient_l2_distance": -6.3558454513549805,
        "input_gradient_dot_product": -6.010327339172363
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7234326801791722,
      "val_r": 0.5375351522138571,
      "n_iterations": 921,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.975987195968628,
        "right_subspace_overlap_bottom_k": -14.666023254394531,
        "interaction_matrix_overlap_top_k": 17.922163009643555,
        "interaction_matrix_overlap_bottom_k": -0.4834803640842438,
        "effective_rank": 2.579922676086426,
        "effective_rank_mergeability_score": 6.366745948791504,
        "stable_rank": 2.1546642780303955,
        "spectral_gap": -8.220237731933594,
        "singular_value_ratio": -4.353963851928711,
        "layerwise_effective_rank": -1.3584836721420288,
        "layerwise_effective_rank_mergeability_score": 7.297514915466309,
        "singular_value_overlap": 3.753061056137085,
        "subspace_overlap": -5.499792098999023,
        "right_subspace_overlap": 1.2686349153518677,
        "activation_l2_distance": -0.27518177032470703,
        "activation_cosine_similarity": 8.389434814453125,
        "activation_magnitude_ratio": 1.0905474424362183,
        "activation_dot_product": 12.342170715332031,
        "encoder_gradient_cosine_similarity": 5.830009937286377,
        "encoder_gradient_l2_distance": -22.52074432373047,
        "encoder_gradient_dot_product": 7.294764041900635,
        "input_gradient_cosine_similarity": 4.528866291046143,
        "input_gradient_l2_distance": -15.764089584350586,
        "input_gradient_dot_product": -9.654119491577148
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5912258864706917,
      "val_r": 0.1792967169451582,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 41.83648681640625,
        "right_subspace_overlap_bottom_k": -6.080262184143066,
        "interaction_matrix_overlap_top_k": 30.228759765625,
        "interaction_matrix_overlap_bottom_k": -65.8370590209961,
        "effective_rank": 44.729454040527344,
        "effective_rank_mergeability_score": -39.94880676269531,
        "stable_rank": -12.333821296691895,
        "spectral_gap": -8.300590515136719,
        "singular_value_ratio": -21.25279998779297,
        "layerwise_effective_rank": -17.49350357055664,
        "layerwise_effective_rank_mergeability_score": 46.13560485839844,
        "singular_value_overlap": -2.346085786819458,
        "subspace_overlap": 56.8310432434082,
        "right_subspace_overlap": 28.480024337768555,
        "activation_l2_distance": -55.73516082763672,
        "activation_cosine_similarity": -10.430456161499023,
        "activation_magnitude_ratio": -49.125022888183594,
        "activation_dot_product": 24.27330207824707,
        "encoder_gradient_cosine_similarity": 19.36042022705078,
        "encoder_gradient_l2_distance": -6.39532470703125,
        "encoder_gradient_dot_product": 31.838321685791016,
        "input_gradient_cosine_similarity": 21.615358352661133,
        "input_gradient_l2_distance": -25.0025577545166,
        "input_gradient_dot_product": -24.04884910583496
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7717033867426828,
      "val_r": 0.6751063044005635,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.291929244995117,
        "right_subspace_overlap_bottom_k": -51.39521789550781,
        "interaction_matrix_overlap_top_k": 10.666016578674316,
        "interaction_matrix_overlap_bottom_k": 3.0698773860931396,
        "effective_rank": 32.62632369995117,
        "effective_rank_mergeability_score": 49.327728271484375,
        "stable_rank": 1.2405662536621094,
        "spectral_gap": -9.841392517089844,
        "singular_value_ratio": -6.542737007141113,
        "layerwise_effective_rank": 23.77329444885254,
        "layerwise_effective_rank_mergeability_score": 17.7097225189209,
        "singular_value_overlap": -2.5245978832244873,
        "subspace_overlap": 28.100698471069336,
        "right_subspace_overlap": -26.026538848876953,
        "activation_l2_distance": -31.383840560913086,
        "activation_cosine_similarity": 11.8113431930542,
        "activation_magnitude_ratio": -7.3995680809021,
        "activation_dot_product": 21.08059310913086,
        "encoder_gradient_cosine_similarity": 13.168323516845703,
        "encoder_gradient_l2_distance": -31.78582191467285,
        "encoder_gradient_dot_product": -6.108211517333984,
        "input_gradient_cosine_similarity": 14.59909725189209,
        "input_gradient_l2_distance": -56.04694747924805,
        "input_gradient_dot_product": -22.412038803100586
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}