{
  "aggregate_metrics": {
    "train_r": 0.25727099015489063,
    "train_p": 7.130998351725342e-50,
    "val_r": 0.0009795966766641424,
    "val_p": 0.9852638920607066
  },
  "per_fold_stats": {
    "train_r_mean": 0.42936340306508713,
    "train_r_std": 0.0810609833585073,
    "val_r_mean": 0.3137737044104799,
    "val_r_std": 0.14728447151934837
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 11.649996757507324,
    "right_subspace_overlap_bottom_k": 34.1492919921875,
    "interaction_matrix_overlap_top_k": 20.721921920776367,
    "interaction_matrix_overlap_bottom_k": 25.3687744140625,
    "effective_rank": -2.1606807708740234,
    "effective_rank_mergeability_score": 14.109103202819824,
    "stable_rank": -6.3288092613220215,
    "spectral_gap": 19.968759536743164,
    "singular_value_ratio": -1.0466731786727905,
    "layerwise_effective_rank": 4.553788661956787,
    "layerwise_effective_rank_mergeability_score": -0.8343027234077454,
    "singular_value_overlap": -33.686927795410156,
    "subspace_overlap": 13.653875350952148,
    "right_subspace_overlap": 23.551822662353516,
    "activation_l2_distance": -21.098356246948242,
    "activation_cosine_similarity": 10.338589668273926,
    "activation_magnitude_ratio": -13.575243949890137,
    "activation_dot_product": -22.958171844482422,
    "encoder_gradient_cosine_similarity": 8.615370750427246,
    "encoder_gradient_l2_distance": -35.867462158203125,
    "encoder_gradient_dot_product": 4.456513404846191,
    "input_gradient_cosine_similarity": 17.097152709960938,
    "input_gradient_l2_distance": -35.59779357910156,
    "input_gradient_dot_product": -34.08332061767578
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 20.296411514282227,
    "right_subspace_overlap_bottom_k": 27.330020904541016,
    "interaction_matrix_overlap_top_k": 23.23905372619629,
    "interaction_matrix_overlap_bottom_k": 27.155546188354492,
    "effective_rank": 35.07756805419922,
    "effective_rank_mergeability_score": 26.944433212280273,
    "stable_rank": 25.312644958496094,
    "spectral_gap": 27.12713623046875,
    "singular_value_ratio": 30.362823486328125,
    "layerwise_effective_rank": 21.185985565185547,
    "layerwise_effective_rank_mergeability_score": 15.452764511108398,
    "singular_value_overlap": 19.33830451965332,
    "subspace_overlap": 26.032541275024414,
    "right_subspace_overlap": 32.62809753417969,
    "activation_l2_distance": 24.20085334777832,
    "activation_cosine_similarity": 26.4206485748291,
    "activation_magnitude_ratio": 26.45641326904297,
    "activation_dot_product": 29.326196670532227,
    "encoder_gradient_cosine_similarity": 12.887967109680176,
    "encoder_gradient_l2_distance": 25.502674102783203,
    "encoder_gradient_dot_product": 21.77952766418457,
    "input_gradient_cosine_similarity": 11.798457145690918,
    "input_gradient_l2_distance": 23.741247177124023,
    "input_gradient_dot_product": 19.329442977905273
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.46979573810238956,
      "val_r": 0.338952369833496,
      "n_iterations": 569,
      "coefficients": {
        "right_subspace_overlap_top_k": 23.97238540649414,
        "right_subspace_overlap_bottom_k": 29.194351196289062,
        "interaction_matrix_overlap_top_k": 17.94818878173828,
        "interaction_matrix_overlap_bottom_k": 17.28635597229004,
        "effective_rank": -15.134220123291016,
        "effective_rank_mergeability_score": 16.686498641967773,
        "stable_rank": 4.5886430740356445,
        "spectral_gap": 36.08311080932617,
        "singular_value_ratio": 6.396190643310547,
        "layerwise_effective_rank": 47.34772491455078,
        "layerwise_effective_rank_mergeability_score": 17.393320083618164,
        "singular_value_overlap": -62.586971282958984,
        "subspace_overlap": 22.976734161376953,
        "right_subspace_overlap": 9.640213966369629,
        "activation_l2_distance": -24.940523147583008,
        "activation_cosine_similarity": 14.707571029663086,
        "activation_magnitude_ratio": -11.384641647338867,
        "activation_dot_product": -17.32496452331543,
        "encoder_gradient_cosine_similarity": -8.665376663208008,
        "encoder_gradient_l2_distance": -51.55845260620117,
        "encoder_gradient_dot_product": -21.718379974365234,
        "input_gradient_cosine_similarity": 22.906417846679688,
        "input_gradient_l2_distance": -34.99213409423828,
        "input_gradient_dot_product": -37.82466125488281
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4602230624615796,
      "val_r": 0.3625107033079123,
      "n_iterations": 604,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.7537693977355957,
        "right_subspace_overlap_bottom_k": 14.371106147766113,
        "interaction_matrix_overlap_top_k": 24.455995559692383,
        "interaction_matrix_overlap_bottom_k": 21.478757858276367,
        "effective_rank": 1.9670764207839966,
        "effective_rank_mergeability_score": 10.366402626037598,
        "stable_rank": -2.7474441528320312,
        "spectral_gap": 23.865812301635742,
        "singular_value_ratio": 3.880199670791626,
        "layerwise_effective_rank": 6.157888412475586,
        "layerwise_effective_rank_mergeability_score": -9.185694694519043,
        "singular_value_overlap": -23.149019241333008,
        "subspace_overlap": 5.929421424865723,
        "right_subspace_overlap": -12.410135269165039,
        "activation_l2_distance": -7.199288368225098,
        "activation_cosine_similarity": 6.733505725860596,
        "activation_magnitude_ratio": -7.699024200439453,
        "activation_dot_product": -9.027274131774902,
        "encoder_gradient_cosine_similarity": -2.58949613571167,
        "encoder_gradient_l2_distance": -17.294437408447266,
        "encoder_gradient_dot_product": 4.326783180236816,
        "input_gradient_cosine_similarity": 10.073469161987305,
        "input_gradient_l2_distance": -22.961097717285156,
        "input_gradient_dot_product": -22.099655151367188
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3794461142892105,
      "val_r": 0.2483521996278329,
      "n_iterations": 417,
      "coefficients": {
        "right_subspace_overlap_top_k": -2.7118642330169678,
        "right_subspace_overlap_bottom_k": 84.15865325927734,
        "interaction_matrix_overlap_top_k": 81.01242065429688,
        "interaction_matrix_overlap_bottom_k": -21.186899185180664,
        "effective_rank": -12.172431945800781,
        "effective_rank_mergeability_score": -21.43813133239746,
        "stable_rank": -51.31786346435547,
        "spectral_gap": 55.970542907714844,
        "singular_value_ratio": 5.3521037101745605,
        "layerwise_effective_rank": 28.13033676147461,
        "layerwise_effective_rank_mergeability_score": -18.407222747802734,
        "singular_value_overlap": -18.410829544067383,
        "subspace_overlap": 60.269920349121094,
        "right_subspace_overlap": 54.414066314697266,
        "activation_l2_distance": -58.64801025390625,
        "activation_cosine_similarity": 11.139493942260742,
        "activation_magnitude_ratio": -53.108829498291016,
        "activation_dot_product": -80.69512176513672,
        "encoder_gradient_cosine_similarity": 4.7522759437561035,
        "encoder_gradient_l2_distance": -37.519683837890625,
        "encoder_gradient_dot_product": 31.39511489868164,
        "input_gradient_cosine_similarity": 36.4407844543457,
        "input_gradient_l2_distance": -30.021881103515625,
        "input_gradient_dot_product": -46.40047836303711
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4421929922388805,
      "val_r": 0.39406486231040067,
      "n_iterations": 603,
      "coefficients": {
        "right_subspace_overlap_top_k": 17.355365753173828,
        "right_subspace_overlap_bottom_k": 14.378504753112793,
        "interaction_matrix_overlap_top_k": 10.396254539489746,
        "interaction_matrix_overlap_bottom_k": 2.1700000762939453,
        "effective_rank": 12.658023834228516,
        "effective_rank_mergeability_score": 22.681196212768555,
        "stable_rank": -7.365971088409424,
        "spectral_gap": 13.907086372375488,
        "singular_value_ratio": 10.471515655517578,
        "layerwise_effective_rank": -1.238071322441101,
        "layerwise_effective_rank_mergeability_score": 8.139994621276855,
        "singular_value_overlap": -48.12273406982422,
        "subspace_overlap": 47.324546813964844,
        "right_subspace_overlap": 27.161867141723633,
        "activation_l2_distance": -25.9833927154541,
        "activation_cosine_similarity": 29.79199981689453,
        "activation_magnitude_ratio": -14.001786231994629,
        "activation_dot_product": -52.08904266357422,
        "encoder_gradient_cosine_similarity": 3.912843704223633,
        "encoder_gradient_l2_distance": -42.650245666503906,
        "encoder_gradient_dot_product": 22.450387954711914,
        "input_gradient_cosine_similarity": 24.668703079223633,
        "input_gradient_l2_distance": -39.548500061035156,
        "input_gradient_dot_product": -35.47105407714844
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.38276022582963476,
      "val_r": 0.3081010031950796,
      "n_iterations": 475,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.277692794799805,
        "right_subspace_overlap_bottom_k": -14.299094200134277,
        "interaction_matrix_overlap_top_k": -7.595681667327881,
        "interaction_matrix_overlap_bottom_k": 68.19696807861328,
        "effective_rank": -33.69648742675781,
        "effective_rank_mergeability_score": 27.47527313232422,
        "stable_rank": -42.43592834472656,
        "spectral_gap": 29.531532287597656,
        "singular_value_ratio": 60.18963623046875,
        "layerwise_effective_rank": 5.780750274658203,
        "layerwise_effective_rank_mergeability_score": -41.560115814208984,
        "singular_value_overlap": -44.64156723022461,
        "subspace_overlap": 30.1988468170166,
        "right_subspace_overlap": 37.48487091064453,
        "activation_l2_distance": -14.74904727935791,
        "activation_cosine_similarity": 13.98790454864502,
        "activation_magnitude_ratio": -1.5310003757476807,
        "activation_dot_product": -23.74994468688965,
        "encoder_gradient_cosine_similarity": 10.117646217346191,
        "encoder_gradient_l2_distance": -66.71602630615234,
        "encoder_gradient_dot_product": -15.408079147338867,
        "input_gradient_cosine_similarity": 17.79145622253418,
        "input_gradient_l2_distance": 5.573187828063965,
        "input_gradient_dot_product": -24.225910186767578
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.3949547279027246,
      "val_r": 0.4511864319448954,
      "n_iterations": 438,
      "coefficients": {
        "right_subspace_overlap_top_k": 37.78691864013672,
        "right_subspace_overlap_bottom_k": 23.237815856933594,
        "interaction_matrix_overlap_top_k": -28.129459381103516,
        "interaction_matrix_overlap_bottom_k": 86.78421783447266,
        "effective_rank": 35.746055603027344,
        "effective_rank_mergeability_score": 82.93053436279297,
        "stable_rank": 19.864032745361328,
        "spectral_gap": 33.519859313964844,
        "singular_value_ratio": 12.763982772827148,
        "layerwise_effective_rank": -24.520980834960938,
        "layerwise_effective_rank_mergeability_score": -11.397705078125,
        "singular_value_overlap": -18.247467041015625,
        "subspace_overlap": 52.35498046875,
        "right_subspace_overlap": 55.422611236572266,
        "activation_l2_distance": -83.43352508544922,
        "activation_cosine_similarity": 1.5081106424331665,
        "activation_magnitude_ratio": -84.55077362060547,
        "activation_dot_product": -77.0965576171875,
        "encoder_gradient_cosine_similarity": 41.216129302978516,
        "encoder_gradient_l2_distance": 9.578646659851074,
        "encoder_gradient_dot_product": -12.242634773254395,
        "input_gradient_cosine_similarity": -6.257050514221191,
        "input_gradient_l2_distance": -100.20965576171875,
        "input_gradient_dot_product": -45.631507873535156
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.4941370630308177,
      "val_r": 0.09608779832622288,
      "n_iterations": 595,
      "coefficients": {
        "right_subspace_overlap_top_k": 42.21785354614258,
        "right_subspace_overlap_bottom_k": 21.72258949279785,
        "interaction_matrix_overlap_top_k": 7.037164211273193,
        "interaction_matrix_overlap_bottom_k": 23.771852493286133,
        "effective_rank": 29.25082778930664,
        "effective_rank_mergeability_score": 22.007278442382812,
        "stable_rank": -4.7875657081604,
        "spectral_gap": 29.655988693237305,
        "singular_value_ratio": 9.410063743591309,
        "layerwise_effective_rank": -38.167808532714844,
        "layerwise_effective_rank_mergeability_score": -17.30375099182129,
        "singular_value_overlap": -70.01484680175781,
        "subspace_overlap": 0.2286325991153717,
        "right_subspace_overlap": 7.519412994384766,
        "activation_l2_distance": -4.6738505363464355,
        "activation_cosine_similarity": 51.429229736328125,
        "activation_magnitude_ratio": 23.489835739135742,
        "activation_dot_product": -63.303985595703125,
        "encoder_gradient_cosine_similarity": 12.424308776855469,
        "encoder_gradient_l2_distance": -45.55799102783203,
        "encoder_gradient_dot_product": 21.73341178894043,
        "input_gradient_cosine_similarity": 23.800308227539062,
        "input_gradient_l2_distance": -57.91584014892578,
        "input_gradient_dot_product": -22.975618362426758
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.45976303417878306,
      "val_r": 0.1961409334054561,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.023010091856122017,
        "right_subspace_overlap_bottom_k": -0.42687609791755676,
        "interaction_matrix_overlap_top_k": 0.7812134027481079,
        "interaction_matrix_overlap_bottom_k": 1.9277104139328003,
        "effective_rank": 2.0342745780944824,
        "effective_rank_mergeability_score": 0.4068702757358551,
        "stable_rank": 0.5137621164321899,
        "spectral_gap": 1.3838332891464233,
        "singular_value_ratio": -0.1724242866039276,
        "layerwise_effective_rank": 0.37482741475105286,
        "layerwise_effective_rank_mergeability_score": 1.707295536994934,
        "singular_value_overlap": -1.9705241918563843,
        "subspace_overlap": 0.913504958152771,
        "right_subspace_overlap": -0.007917307317256927,
        "activation_l2_distance": -1.773064374923706,
        "activation_cosine_similarity": 1.2111581563949585,
        "activation_magnitude_ratio": -0.756436288356781,
        "activation_dot_product": -3.056039810180664,
        "encoder_gradient_cosine_similarity": 0.1280798614025116,
        "encoder_gradient_l2_distance": -1.090460181236267,
        "encoder_gradient_dot_product": 0.09625506401062012,
        "input_gradient_cosine_similarity": 0.21609137952327728,
        "input_gradient_l2_distance": -1.2043458223342896,
        "input_gradient_dot_product": -0.25990623235702515
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.44850777758719695,
      "val_r": 0.04771284145232177,
      "n_iterations": 521,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.93059253692627,
        "right_subspace_overlap_bottom_k": 24.583871841430664,
        "interaction_matrix_overlap_top_k": 21.873687744140625,
        "interaction_matrix_overlap_bottom_k": 5.531846523284912,
        "effective_rank": -6.752991676330566,
        "effective_rank_mergeability_score": 33.286190032958984,
        "stable_rank": -7.012603282928467,
        "spectral_gap": -5.662708282470703,
        "singular_value_ratio": 4.281495094299316,
        "layerwise_effective_rank": 15.589825630187988,
        "layerwise_effective_rank_mergeability_score": 10.474573135375977,
        "singular_value_overlap": -40.02949523925781,
        "subspace_overlap": 22.641496658325195,
        "right_subspace_overlap": 17.908733367919922,
        "activation_l2_distance": -22.678186416625977,
        "activation_cosine_similarity": 17.4051513671875,
        "activation_magnitude_ratio": -7.117465019226074,
        "activation_dot_product": -46.49014663696289,
        "encoder_gradient_cosine_similarity": 26.58070182800293,
        "encoder_gradient_l2_distance": -30.390758514404297,
        "encoder_gradient_dot_product": 21.32163429260254,
        "input_gradient_cosine_similarity": 2.978970527648926,
        "input_gradient_l2_distance": -34.159671783447266,
        "input_gradient_dot_product": -33.09768295288086
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4399117742293768,
      "val_r": 0.4170922740076364,
      "n_iterations": 563,
      "coefficients": {
        "right_subspace_overlap_top_k": 15.444375038146973,
        "right_subspace_overlap_bottom_k": 44.11532974243164,
        "interaction_matrix_overlap_top_k": 16.940567016601562,
        "interaction_matrix_overlap_bottom_k": 17.822551727294922,
        "effective_rank": -29.48676872253418,
        "effective_rank_mergeability_score": 10.830028533935547,
        "stable_rank": 39.97486114501953,
        "spectral_gap": 76.67321014404297,
        "singular_value_ratio": 51.67594909667969,
        "layerwise_effective_rank": -14.302372932434082,
        "layerwise_effective_rank_mergeability_score": -3.837223768234253,
        "singular_value_overlap": -30.162437438964844,
        "subspace_overlap": -18.739665985107422,
        "right_subspace_overlap": 45.01473617553711,
        "activation_l2_distance": -36.67196273803711,
        "activation_cosine_similarity": -4.120615482330322,
        "activation_magnitude_ratio": -22.240224838256836,
        "activation_dot_product": -25.388446807861328,
        "encoder_gradient_cosine_similarity": 9.833162307739258,
        "encoder_gradient_l2_distance": -32.83637237548828,
        "encoder_gradient_dot_product": 18.619789123535156,
        "input_gradient_cosine_similarity": -1.407348394393921,
        "input_gradient_l2_distance": -48.00542068481445,
        "input_gradient_dot_product": -78.74835205078125
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.45199755082894433,
      "val_r": 0.40381550180025655,
      "n_iterations": 502,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.9033381938934326,
        "right_subspace_overlap_bottom_k": 9.47927474975586,
        "interaction_matrix_overlap_top_k": 8.988037109375,
        "interaction_matrix_overlap_bottom_k": 27.559396743774414,
        "effective_rank": -17.586946487426758,
        "effective_rank_mergeability_score": 1.8171942234039307,
        "stable_rank": 14.799571990966797,
        "spectral_gap": 4.701232433319092,
        "singular_value_ratio": -17.79917335510254,
        "layerwise_effective_rank": 19.700664520263672,
        "layerwise_effective_rank_mergeability_score": 5.86049747467041,
        "singular_value_overlap": -25.10976791381836,
        "subspace_overlap": 1.460201382637024,
        "right_subspace_overlap": 10.945161819458008,
        "activation_l2_distance": -3.699244976043701,
        "activation_cosine_similarity": 18.440561294555664,
        "activation_magnitude_ratio": -7.668326377868652,
        "activation_dot_product": -18.665002822875977,
        "encoder_gradient_cosine_similarity": -4.756895542144775,
        "encoder_gradient_l2_distance": -9.940494537353516,
        "encoder_gradient_dot_product": 0.3771572709083557,
        "input_gradient_cosine_similarity": 19.08604621887207,
        "input_gradient_l2_distance": -21.37872886657715,
        "input_gradient_dot_product": -18.516618728637695
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4063415446816754,
      "val_r": 0.35974223641573433,
      "n_iterations": 507,
      "coefficients": {
        "right_subspace_overlap_top_k": 40.298336029052734,
        "right_subspace_overlap_bottom_k": 29.989171981811523,
        "interaction_matrix_overlap_top_k": -5.169058799743652,
        "interaction_matrix_overlap_bottom_k": 64.34332275390625,
        "effective_rank": 16.091611862182617,
        "effective_rank_mergeability_score": 30.90460777282715,
        "stable_rank": -8.322002410888672,
        "spectral_gap": 0.3884178400039673,
        "singular_value_ratio": -38.447242736816406,
        "layerwise_effective_rank": 32.210472106933594,
        "layerwise_effective_rank_mergeability_score": 2.3757429122924805,
        "singular_value_overlap": -1.7474082708358765,
        "subspace_overlap": 10.34628963470459,
        "right_subspace_overlap": -23.81633186340332,
        "activation_l2_distance": -0.8883248567581177,
        "activation_cosine_similarity": 30.882099151611328,
        "activation_magnitude_ratio": -32.45075988769531,
        "activation_dot_product": -27.414575576782227,
        "encoder_gradient_cosine_similarity": -0.026741307228803635,
        "encoder_gradient_l2_distance": -41.99982833862305,
        "encoder_gradient_dot_product": 9.731099128723145,
        "input_gradient_cosine_similarity": 11.4453125,
        "input_gradient_l2_distance": -48.337581634521484,
        "input_gradient_dot_product": -49.38956069946289
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3687533393814055,
      "val_r": 0.27852153847816385,
      "n_iterations": 553,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.466433525085449,
        "right_subspace_overlap_bottom_k": 67.83865356445312,
        "interaction_matrix_overlap_top_k": 49.94436264038086,
        "interaction_matrix_overlap_bottom_k": 59.65804672241211,
        "effective_rank": -23.707704544067383,
        "effective_rank_mergeability_score": -54.36846923828125,
        "stable_rank": 11.848012924194336,
        "spectral_gap": 51.69320297241211,
        "singular_value_ratio": -24.316648483276367,
        "layerwise_effective_rank": 19.451618194580078,
        "layerwise_effective_rank_mergeability_score": 29.093839645385742,
        "singular_value_overlap": -12.033036231994629,
        "subspace_overlap": -38.29495620727539,
        "right_subspace_overlap": -25.492273330688477,
        "activation_l2_distance": 16.39139175415039,
        "activation_cosine_similarity": 77.45496368408203,
        "activation_magnitude_ratio": -56.10853576660156,
        "activation_dot_product": -49.722068786621094,
        "encoder_gradient_cosine_similarity": 33.8871955871582,
        "encoder_gradient_l2_distance": -97.4527587890625,
        "encoder_gradient_dot_product": 8.327323913574219,
        "input_gradient_cosine_similarity": 19.240535736083984,
        "input_gradient_l2_distance": -41.1217155456543,
        "input_gradient_dot_product": -24.680152893066406
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.35919680251261393,
      "val_r": 0.5894442101791246,
      "n_iterations": 303,
      "coefficients": {
        "right_subspace_overlap_top_k": -16.410951614379883,
        "right_subspace_overlap_bottom_k": 81.03678894042969,
        "interaction_matrix_overlap_top_k": 42.27745056152344,
        "interaction_matrix_overlap_bottom_k": 17.62109375,
        "effective_rank": 114.89959716796875,
        "effective_rank_mergeability_score": 57.00475311279297,
        "stable_rank": -32.58989334106445,
        "spectral_gap": -31.696826934814453,
        "singular_value_ratio": -84.35101318359375,
        "layerwise_effective_rank": -27.775333404541016,
        "layerwise_effective_rank_mergeability_score": -6.897517681121826,
        "singular_value_overlap": -58.33610534667969,
        "subspace_overlap": -13.934611320495605,
        "right_subspace_overlap": 78.520263671875,
        "activation_l2_distance": -52.31865310668945,
        "activation_cosine_similarity": -24.300621032714844,
        "activation_magnitude_ratio": -14.803442001342773,
        "activation_dot_product": -10.841208457946777,
        "encoder_gradient_cosine_similarity": -2.254340887069702,
        "encoder_gradient_l2_distance": -71.46804809570312,
        "encoder_gradient_dot_product": 25.194156646728516,
        "input_gradient_cosine_similarity": 26.20003890991211,
        "input_gradient_l2_distance": 2.2926950454711914,
        "input_gradient_dot_product": 3.9269959926605225
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.2673664886066269,
      "val_r": 0.3808156455637258,
      "n_iterations": 606,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.143454551696777,
        "right_subspace_overlap_bottom_k": 82.4398193359375,
        "interaction_matrix_overlap_top_k": 29.96533203125,
        "interaction_matrix_overlap_bottom_k": 2.3256497383117676,
        "effective_rank": -64.46756744384766,
        "effective_rank_mergeability_score": -8.196802139282227,
        "stable_rank": -65.5322036743164,
        "spectral_gap": -34.33961868286133,
        "singular_value_ratio": -23.733867645263672,
        "layerwise_effective_rank": 18.925174713134766,
        "layerwise_effective_rank_mergeability_score": 23.63319969177246,
        "singular_value_overlap": -22.140737533569336,
        "subspace_overlap": 53.08012771606445,
        "right_subspace_overlap": 99.69469451904297,
        "activation_l2_distance": -37.061614990234375,
        "activation_cosine_similarity": -19.45453453063965,
        "activation_magnitude_ratio": -13.738645553588867,
        "activation_dot_product": 15.18479061126709,
        "encoder_gradient_cosine_similarity": 21.5302677154541,
        "encoder_gradient_l2_distance": 7.403499603271484,
        "encoder_gradient_dot_product": -39.81175231933594,
        "input_gradient_cosine_similarity": 31.922622680664062,
        "input_gradient_l2_distance": -19.873441696166992,
        "input_gradient_dot_product": -42.9005241394043
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.3951693172952636,
      "val_r": 0.3846924410985273,
      "n_iterations": 576,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.337300300598145,
        "right_subspace_overlap_bottom_k": 27.165311813354492,
        "interaction_matrix_overlap_top_k": 21.39183235168457,
        "interaction_matrix_overlap_bottom_k": 31.298091888427734,
        "effective_rank": -28.13469886779785,
        "effective_rank_mergeability_score": 11.144755363464355,
        "stable_rank": 2.716564655303955,
        "spectral_gap": 40.0201416015625,
        "singular_value_ratio": 34.665740966796875,
        "layerwise_effective_rank": 6.074166774749756,
        "layerwise_effective_rank_mergeability_score": 5.992241859436035,
        "singular_value_overlap": -48.275970458984375,
        "subspace_overlap": -14.583415031433105,
        "right_subspace_overlap": 49.43265914916992,
        "activation_l2_distance": 5.978150844573975,
        "activation_cosine_similarity": 24.906951904296875,
        "activation_magnitude_ratio": -5.613810062408447,
        "activation_dot_product": -7.502982139587402,
        "encoder_gradient_cosine_similarity": -5.451595306396484,
        "encoder_gradient_l2_distance": -28.208993911743164,
        "encoder_gradient_dot_product": -43.13862228393555,
        "input_gradient_cosine_similarity": 23.822080612182617,
        "input_gradient_l2_distance": -58.74522399902344,
        "input_gradient_dot_product": -53.29322052001953
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.38576117830802437,
      "val_r": 0.3738107323155557,
      "n_iterations": 405,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.10191822052002,
        "right_subspace_overlap_bottom_k": 56.86296844482422,
        "interaction_matrix_overlap_top_k": 51.88310241699219,
        "interaction_matrix_overlap_bottom_k": 32.76401901245117,
        "effective_rank": -4.260359287261963,
        "effective_rank_mergeability_score": 3.063633441925049,
        "stable_rank": 11.038808822631836,
        "spectral_gap": 15.563023567199707,
        "singular_value_ratio": -15.716529846191406,
        "layerwise_effective_rank": -24.115097045898438,
        "layerwise_effective_rank_mergeability_score": -4.898578643798828,
        "singular_value_overlap": -38.755802154541016,
        "subspace_overlap": 9.587625503540039,
        "right_subspace_overlap": -0.18561439216136932,
        "activation_l2_distance": -15.460369110107422,
        "activation_cosine_similarity": -26.01104164123535,
        "activation_magnitude_ratio": 2.908951997756958,
        "activation_dot_product": 18.5849609375,
        "encoder_gradient_cosine_similarity": 9.681266784667969,
        "encoder_gradient_l2_distance": -30.832170486450195,
        "encoder_gradient_dot_product": 14.634305000305176,
        "input_gradient_cosine_similarity": 14.958735466003418,
        "input_gradient_l2_distance": -32.92957305908203,
        "input_gradient_dot_product": -57.471778869628906
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.45635313943387434,
      "val_r": 0.13872280707832646,
      "n_iterations": 643,
      "coefficients": {
        "right_subspace_overlap_top_k": 30.319732666015625,
        "right_subspace_overlap_bottom_k": 40.77039337158203,
        "interaction_matrix_overlap_top_k": 28.44640350341797,
        "interaction_matrix_overlap_bottom_k": 6.9890241622924805,
        "effective_rank": 6.501036643981934,
        "effective_rank_mergeability_score": 14.372530937194824,
        "stable_rank": -26.00762367248535,
        "spectral_gap": 18.121007919311523,
        "singular_value_ratio": -2.32293438911438,
        "layerwise_effective_rank": 14.17103385925293,
        "layerwise_effective_rank_mergeability_score": 1.967625379562378,
        "singular_value_overlap": -51.66890335083008,
        "subspace_overlap": 35.096431732177734,
        "right_subspace_overlap": -7.414251804351807,
        "activation_l2_distance": -27.333160400390625,
        "activation_cosine_similarity": 0.38295748829841614,
        "activation_magnitude_ratio": 7.129226207733154,
        "activation_dot_product": -5.118483066558838,
        "encoder_gradient_cosine_similarity": 6.703526973724365,
        "encoder_gradient_l2_distance": -40.34563064575195,
        "encoder_gradient_dot_product": 3.0843594074249268,
        "input_gradient_cosine_similarity": 27.30048942565918,
        "input_gradient_l2_distance": -53.88762664794922,
        "input_gradient_dot_product": -26.25958251953125
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7075522216576059,
      "val_r": 0.4976647660198655,
      "n_iterations": 856,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.010971069335938,
        "right_subspace_overlap_bottom_k": 7.632535457611084,
        "interaction_matrix_overlap_top_k": 19.31400489807129,
        "interaction_matrix_overlap_bottom_k": -7.665547847747803,
        "effective_rank": -1.883679747581482,
        "effective_rank_mergeability_score": 11.876880645751953,
        "stable_rank": -4.3805718421936035,
        "spectral_gap": -0.6980230808258057,
        "singular_value_ratio": 0.3923068642616272,
        "layerwise_effective_rank": 4.131041526794434,
        "layerwise_effective_rank_mergeability_score": 2.466278076171875,
        "singular_value_overlap": -14.192687034606934,
        "subspace_overlap": -6.545577049255371,
        "right_subspace_overlap": 7.701757431030273,
        "activation_l2_distance": 8.830185890197754,
        "activation_cosine_similarity": 21.284833908081055,
        "activation_magnitude_ratio": -9.440481185913086,
        "activation_dot_product": 3.4666202068328857,
        "encoder_gradient_cosine_similarity": 8.918931007385254,
        "encoder_gradient_l2_distance": -36.4274787902832,
        "encoder_gradient_dot_product": -1.9242652654647827,
        "input_gradient_cosine_similarity": 5.118567943572998,
        "input_gradient_l2_distance": -23.149394989013672,
        "input_gradient_dot_product": -15.838983535766602
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4170839687451148,
      "val_r": 0.008042791849064812,
      "n_iterations": 432,
      "coefficients": {
        "right_subspace_overlap_top_k": -48.22069549560547,
        "right_subspace_overlap_bottom_k": 38.73475646972656,
        "interaction_matrix_overlap_top_k": 22.67664909362793,
        "interaction_matrix_overlap_bottom_k": 48.699039459228516,
        "effective_rank": -25.078266143798828,
        "effective_rank_mergeability_score": 9.330804824829102,
        "stable_rank": 20.579208374023438,
        "spectral_gap": 40.694374084472656,
        "singular_value_ratio": -13.552813529968262,
        "layerwise_effective_rank": 3.1499087810516357,
        "layerwise_effective_rank_mergeability_score": -12.302857398986816,
        "singular_value_overlap": -44.142147064208984,
        "subspace_overlap": 12.766984939575195,
        "right_subspace_overlap": 39.50187683105469,
        "activation_l2_distance": -35.654632568359375,
        "activation_cosine_similarity": -40.60790252685547,
        "activation_magnitude_ratio": 37.1812858581543,
        "activation_dot_product": 21.08609390258789,
        "encoder_gradient_cosine_similarity": 6.365538120269775,
        "encoder_gradient_l2_distance": -52.041622161865234,
        "encoder_gradient_dot_product": 42.08221435546875,
        "input_gradient_cosine_similarity": 31.6368408203125,
        "input_gradient_l2_distance": -51.37989807128906,
        "input_gradient_dot_product": -50.508155822753906
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}