{
  "aggregate_metrics": {
    "train_r": 0.28567495517533215,
    "train_p": 1.4593879409336424e-61,
    "val_r": 0.14568159931877056,
    "val_p": 0.005753077140043521
  },
  "per_fold_stats": {
    "train_r_mean": 0.7441484014528033,
    "train_r_std": 0.09382002159424227,
    "val_r_mean": 0.5915126984908212,
    "val_r_std": 0.16260935649852143
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 3.3161540031433105,
    "right_subspace_overlap_bottom_k": -27.092483520507812,
    "interaction_matrix_overlap_top_k": 41.90476989746094,
    "interaction_matrix_overlap_bottom_k": -4.802565574645996,
    "effective_rank": -5.052855014801025,
    "effective_rank_mergeability_score": 14.695791244506836,
    "stable_rank": -7.6664838790893555,
    "spectral_gap": -15.222320556640625,
    "singular_value_ratio": 7.169997215270996,
    "layerwise_effective_rank": -8.384817123413086,
    "layerwise_effective_rank_mergeability_score": -10.571024894714355,
    "singular_value_overlap": 20.35552978515625,
    "subspace_overlap": 9.691378593444824,
    "right_subspace_overlap": 9.217711448669434,
    "activation_l2_distance": -24.106435775756836,
    "activation_cosine_similarity": 5.551836967468262,
    "activation_magnitude_ratio": -4.51003360748291,
    "activation_dot_product": 29.411157608032227,
    "encoder_gradient_cosine_similarity": 9.732672691345215,
    "encoder_gradient_l2_distance": -28.891748428344727,
    "encoder_gradient_dot_product": -1.629195213317871,
    "input_gradient_cosine_similarity": 15.343626022338867,
    "input_gradient_l2_distance": -19.00566291809082,
    "input_gradient_dot_product": -8.456148147583008
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 45.141624450683594,
    "right_subspace_overlap_bottom_k": 47.7766227722168,
    "interaction_matrix_overlap_top_k": 104.62875366210938,
    "interaction_matrix_overlap_bottom_k": 20.835735321044922,
    "effective_rank": 29.36737632751465,
    "effective_rank_mergeability_score": 75.30974578857422,
    "stable_rank": 38.110862731933594,
    "spectral_gap": 44.092041015625,
    "singular_value_ratio": 35.189849853515625,
    "layerwise_effective_rank": 26.099443435668945,
    "layerwise_effective_rank_mergeability_score": 90.06269836425781,
    "singular_value_overlap": 30.289445877075195,
    "subspace_overlap": 19.819482803344727,
    "right_subspace_overlap": 47.5316047668457,
    "activation_l2_distance": 48.272247314453125,
    "activation_cosine_similarity": 24.80201530456543,
    "activation_magnitude_ratio": 40.826541900634766,
    "activation_dot_product": 45.41999053955078,
    "encoder_gradient_cosine_similarity": 27.47447395324707,
    "encoder_gradient_l2_distance": 37.78289794921875,
    "encoder_gradient_dot_product": 17.118532180786133,
    "input_gradient_cosine_similarity": 26.607271194458008,
    "input_gradient_l2_distance": 29.676898956298828,
    "input_gradient_dot_product": 14.37448787689209
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7374980889456173,
      "val_r": 0.41600436632638527,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 40.41664505004883,
        "right_subspace_overlap_bottom_k": -15.073270797729492,
        "interaction_matrix_overlap_top_k": 5.760771751403809,
        "interaction_matrix_overlap_bottom_k": -4.398040294647217,
        "effective_rank": 28.3582820892334,
        "effective_rank_mergeability_score": -18.779197692871094,
        "stable_rank": -31.44269561767578,
        "spectral_gap": 27.0040283203125,
        "singular_value_ratio": 32.85797119140625,
        "layerwise_effective_rank": -19.623628616333008,
        "layerwise_effective_rank_mergeability_score": 6.474867343902588,
        "singular_value_overlap": 15.187405586242676,
        "subspace_overlap": -26.320110321044922,
        "right_subspace_overlap": -0.25081759691238403,
        "activation_l2_distance": 4.064082145690918,
        "activation_cosine_similarity": 14.512115478515625,
        "activation_magnitude_ratio": -4.761567115783691,
        "activation_dot_product": 24.373695373535156,
        "encoder_gradient_cosine_similarity": 3.0195415019989014,
        "encoder_gradient_l2_distance": -37.235591888427734,
        "encoder_gradient_dot_product": -7.38693380355835,
        "input_gradient_cosine_similarity": -1.8948602676391602,
        "input_gradient_l2_distance": -20.35753631591797,
        "input_gradient_dot_product": -13.506656646728516
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8383059942097896,
      "val_r": 0.72809583251584,
      "n_iterations": 972,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04446364566683769,
        "right_subspace_overlap_bottom_k": -1.323655366897583,
        "interaction_matrix_overlap_top_k": -0.5420386791229248,
        "interaction_matrix_overlap_bottom_k": 1.2514384984970093,
        "effective_rank": 0.3202945291996002,
        "effective_rank_mergeability_score": -0.4731675386428833,
        "stable_rank": -0.6406416893005371,
        "spectral_gap": 0.25184473395347595,
        "singular_value_ratio": 0.37967437505722046,
        "layerwise_effective_rank": 0.3027866780757904,
        "layerwise_effective_rank_mergeability_score": 0.5622750520706177,
        "singular_value_overlap": 0.006170673295855522,
        "subspace_overlap": 0.06039559468626976,
        "right_subspace_overlap": 0.4646780490875244,
        "activation_l2_distance": 0.2859630584716797,
        "activation_cosine_similarity": 0.43322300910949707,
        "activation_magnitude_ratio": 0.004515196196734905,
        "activation_dot_product": -0.06492716819047928,
        "encoder_gradient_cosine_similarity": 0.02419627085328102,
        "encoder_gradient_l2_distance": -0.2044024020433426,
        "encoder_gradient_dot_product": 0.027923068031668663,
        "input_gradient_cosine_similarity": 0.013690070249140263,
        "input_gradient_l2_distance": -0.17120708525180817,
        "input_gradient_dot_product": -0.01390120480209589
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7802591583635948,
      "val_r": 0.7476138311504754,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.2125580310821533,
        "right_subspace_overlap_bottom_k": -9.853775024414062,
        "interaction_matrix_overlap_top_k": 2.078845739364624,
        "interaction_matrix_overlap_bottom_k": 0.7608920931816101,
        "effective_rank": 4.428793907165527,
        "effective_rank_mergeability_score": -2.115644693374634,
        "stable_rank": -2.968055248260498,
        "spectral_gap": 5.0213165283203125,
        "singular_value_ratio": 7.3710551261901855,
        "layerwise_effective_rank": -0.9665985703468323,
        "layerwise_effective_rank_mergeability_score": 6.6432061195373535,
        "singular_value_overlap": 1.880854845046997,
        "subspace_overlap": 0.02649400196969509,
        "right_subspace_overlap": 6.161594390869141,
        "activation_l2_distance": -4.966587066650391,
        "activation_cosine_similarity": 2.5561773777008057,
        "activation_magnitude_ratio": -2.125331401824951,
        "activation_dot_product": 2.267437219619751,
        "encoder_gradient_cosine_similarity": 0.9286357760429382,
        "encoder_gradient_l2_distance": -9.315266609191895,
        "encoder_gradient_dot_product": -0.10228590667247772,
        "input_gradient_cosine_similarity": 2.1145665645599365,
        "input_gradient_l2_distance": -9.071244239807129,
        "input_gradient_dot_product": -2.9684343338012695
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8299122491481804,
      "val_r": 0.8141604210978313,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.8312404155731201,
        "right_subspace_overlap_bottom_k": -4.800971984863281,
        "interaction_matrix_overlap_top_k": -3.2685413360595703,
        "interaction_matrix_overlap_bottom_k": 4.212291717529297,
        "effective_rank": 1.6230412721633911,
        "effective_rank_mergeability_score": -2.6565966606140137,
        "stable_rank": -3.598100185394287,
        "spectral_gap": -0.401001513004303,
        "singular_value_ratio": 0.358318030834198,
        "layerwise_effective_rank": 1.128957986831665,
        "layerwise_effective_rank_mergeability_score": 2.4536187648773193,
        "singular_value_overlap": 0.0428723581135273,
        "subspace_overlap": 0.40113532543182373,
        "right_subspace_overlap": 2.4038429260253906,
        "activation_l2_distance": 1.8159470558166504,
        "activation_cosine_similarity": 2.6011745929718018,
        "activation_magnitude_ratio": -0.03288964554667473,
        "activation_dot_product": -0.4656289219856262,
        "encoder_gradient_cosine_similarity": 0.1801685243844986,
        "encoder_gradient_l2_distance": -0.8974834084510803,
        "encoder_gradient_dot_product": 0.06134781986474991,
        "input_gradient_cosine_similarity": 0.03124108538031578,
        "input_gradient_l2_distance": -0.8467810750007629,
        "input_gradient_dot_product": -0.17857396602630615
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7446381261287824,
      "val_r": 0.7006762908022628,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 16.21272850036621,
        "right_subspace_overlap_bottom_k": -9.579460144042969,
        "interaction_matrix_overlap_top_k": 3.017984628677368,
        "interaction_matrix_overlap_bottom_k": -5.483421325683594,
        "effective_rank": -7.645815372467041,
        "effective_rank_mergeability_score": 5.600058555603027,
        "stable_rank": 8.311503410339355,
        "spectral_gap": -1.451088786125183,
        "singular_value_ratio": -1.5232964754104614,
        "layerwise_effective_rank": -0.10458706319332123,
        "layerwise_effective_rank_mergeability_score": -3.206059455871582,
        "singular_value_overlap": 7.886322975158691,
        "subspace_overlap": 5.529664516448975,
        "right_subspace_overlap": -6.844853401184082,
        "activation_l2_distance": 0.4266088008880615,
        "activation_cosine_similarity": 8.665726661682129,
        "activation_magnitude_ratio": -0.9669709205627441,
        "activation_dot_product": 7.49919319152832,
        "encoder_gradient_cosine_similarity": 3.5541179180145264,
        "encoder_gradient_l2_distance": -18.52302360534668,
        "encoder_gradient_dot_product": -0.043505601584911346,
        "input_gradient_cosine_similarity": 3.6460607051849365,
        "input_gradient_l2_distance": -9.190518379211426,
        "input_gradient_dot_product": -4.78877067565918
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7690415021697049,
      "val_r": 0.7274810331144873,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.133244514465332,
        "right_subspace_overlap_bottom_k": -9.658954620361328,
        "interaction_matrix_overlap_top_k": 2.5783019065856934,
        "interaction_matrix_overlap_bottom_k": -6.093449115753174,
        "effective_rank": 3.510601282119751,
        "effective_rank_mergeability_score": 0.8061385750770569,
        "stable_rank": 1.492677927017212,
        "spectral_gap": 2.8382856845855713,
        "singular_value_ratio": 3.8996872901916504,
        "layerwise_effective_rank": -6.35392951965332,
        "layerwise_effective_rank_mergeability_score": 1.9603509902954102,
        "singular_value_overlap": 4.638339519500732,
        "subspace_overlap": -2.286855459213257,
        "right_subspace_overlap": 8.978087425231934,
        "activation_l2_distance": -4.63250207901001,
        "activation_cosine_similarity": 6.664045810699463,
        "activation_magnitude_ratio": -2.0336835384368896,
        "activation_dot_product": 4.741621494293213,
        "encoder_gradient_cosine_similarity": 4.851641654968262,
        "encoder_gradient_l2_distance": -12.664204597473145,
        "encoder_gradient_dot_product": 1.466078519821167,
        "input_gradient_cosine_similarity": 3.2171428203582764,
        "input_gradient_l2_distance": -8.422534942626953,
        "input_gradient_dot_product": -5.631503105163574
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7639768017862987,
      "val_r": 0.6894112803061293,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.288342237472534,
        "right_subspace_overlap_bottom_k": -8.280232429504395,
        "interaction_matrix_overlap_top_k": 1.9487673044204712,
        "interaction_matrix_overlap_bottom_k": -2.8243775367736816,
        "effective_rank": 3.048292398452759,
        "effective_rank_mergeability_score": -6.5289225578308105,
        "stable_rank": -5.274056911468506,
        "spectral_gap": 0.6570937633514404,
        "singular_value_ratio": 2.1134212017059326,
        "layerwise_effective_rank": -0.4945640563964844,
        "layerwise_effective_rank_mergeability_score": 6.700590133666992,
        "singular_value_overlap": 3.936520576477051,
        "subspace_overlap": -3.2283313274383545,
        "right_subspace_overlap": 6.881446361541748,
        "activation_l2_distance": 2.3743040561676025,
        "activation_cosine_similarity": 7.237292289733887,
        "activation_magnitude_ratio": -0.12999314069747925,
        "activation_dot_product": 3.6554160118103027,
        "encoder_gradient_cosine_similarity": 2.278597593307495,
        "encoder_gradient_l2_distance": -8.353442192077637,
        "encoder_gradient_dot_product": 2.576129198074341,
        "input_gradient_cosine_similarity": 0.9364966154098511,
        "input_gradient_l2_distance": -7.816174030303955,
        "input_gradient_dot_product": -3.7040581703186035
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.800553918128157,
      "val_r": 0.4409971441556559,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9347283840179443,
        "right_subspace_overlap_bottom_k": -0.9470694065093994,
        "interaction_matrix_overlap_top_k": -0.5516523718833923,
        "interaction_matrix_overlap_bottom_k": 0.4022236466407776,
        "effective_rank": 0.04642748460173607,
        "effective_rank_mergeability_score": -0.551649272441864,
        "stable_rank": -0.36694034934043884,
        "spectral_gap": 0.5238763689994812,
        "singular_value_ratio": 0.5883870124816895,
        "layerwise_effective_rank": 0.24738557636737823,
        "layerwise_effective_rank_mergeability_score": 0.5526418685913086,
        "singular_value_overlap": 0.06617379188537598,
        "subspace_overlap": -0.4169482886791229,
        "right_subspace_overlap": 0.43005648255348206,
        "activation_l2_distance": 0.2115102857351303,
        "activation_cosine_similarity": 0.7218717336654663,
        "activation_magnitude_ratio": -0.05652294680476189,
        "activation_dot_product": -0.2238234579563141,
        "encoder_gradient_cosine_similarity": 0.1173773854970932,
        "encoder_gradient_l2_distance": -0.6121653318405151,
        "encoder_gradient_dot_product": 0.013588456436991692,
        "input_gradient_cosine_similarity": 0.08903530240058899,
        "input_gradient_l2_distance": -0.23049917817115784,
        "input_gradient_dot_product": 0.016740325838327408
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.8636284103264029,
      "val_r": 0.39119638408691,
      "n_iterations": 421,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.11404532194137573,
        "right_subspace_overlap_bottom_k": -0.8294604420661926,
        "interaction_matrix_overlap_top_k": -0.3121929466724396,
        "interaction_matrix_overlap_bottom_k": 0.8096815347671509,
        "effective_rank": 0.16513997316360474,
        "effective_rank_mergeability_score": 0.14475463330745697,
        "stable_rank": 0.060751721262931824,
        "spectral_gap": 0.25848710536956787,
        "singular_value_ratio": 0.2982265055179596,
        "layerwise_effective_rank": -0.1171981543302536,
        "layerwise_effective_rank_mergeability_score": 0.04227873310446739,
        "singular_value_overlap": -0.00351183139719069,
        "subspace_overlap": 0.06719641387462616,
        "right_subspace_overlap": 0.3965240716934204,
        "activation_l2_distance": 0.14638009667396545,
        "activation_cosine_similarity": 0.2537095844745636,
        "activation_magnitude_ratio": 0.0055742813274264336,
        "activation_dot_product": -0.06309990584850311,
        "encoder_gradient_cosine_similarity": 0.022072969004511833,
        "encoder_gradient_l2_distance": -0.09548326581716537,
        "encoder_gradient_dot_product": -0.00737382285296917,
        "input_gradient_cosine_similarity": 0.017131740227341652,
        "input_gradient_l2_distance": -0.11875122785568237,
        "input_gradient_dot_product": -0.02711227908730507
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7287347152875535,
      "val_r": 0.3276800641204435,
      "n_iterations": 833,
      "coefficients": {
        "right_subspace_overlap_top_k": 38.138519287109375,
        "right_subspace_overlap_bottom_k": -44.631107330322266,
        "interaction_matrix_overlap_top_k": 20.93419647216797,
        "interaction_matrix_overlap_bottom_k": -2.8537817001342773,
        "effective_rank": -20.620960235595703,
        "effective_rank_mergeability_score": -5.920535564422607,
        "stable_rank": 2.7238917350769043,
        "spectral_gap": -15.060051918029785,
        "singular_value_ratio": -3.2428507804870605,
        "layerwise_effective_rank": 4.166965007781982,
        "layerwise_effective_rank_mergeability_score": 14.677207946777344,
        "singular_value_overlap": 14.566093444824219,
        "subspace_overlap": 5.924966335296631,
        "right_subspace_overlap": 1.0184274911880493,
        "activation_l2_distance": 9.143299102783203,
        "activation_cosine_similarity": -4.536867618560791,
        "activation_magnitude_ratio": 5.44098424911499,
        "activation_dot_product": 0.008327553980052471,
        "encoder_gradient_cosine_similarity": 15.420088768005371,
        "encoder_gradient_l2_distance": -16.34712791442871,
        "encoder_gradient_dot_product": 5.081700801849365,
        "input_gradient_cosine_similarity": 8.965580940246582,
        "input_gradient_l2_distance": -20.516521453857422,
        "input_gradient_dot_product": -11.482324600219727
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8344215616949631,
      "val_r": 0.36288035457435835,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.4408797025680542,
        "right_subspace_overlap_bottom_k": -1.5537883043289185,
        "interaction_matrix_overlap_top_k": -0.6196475028991699,
        "interaction_matrix_overlap_bottom_k": 1.3515328168869019,
        "effective_rank": 0.3957357108592987,
        "effective_rank_mergeability_score": -0.1555272936820984,
        "stable_rank": -0.5792864561080933,
        "spectral_gap": -0.16348783671855927,
        "singular_value_ratio": -0.032125502824783325,
        "layerwise_effective_rank": 0.7186047434806824,
        "layerwise_effective_rank_mergeability_score": 0.8045985102653503,
        "singular_value_overlap": 0.08842268586158752,
        "subspace_overlap": -0.18033336102962494,
        "right_subspace_overlap": 0.39315855503082275,
        "activation_l2_distance": 0.14219343662261963,
        "activation_cosine_similarity": 0.4416012465953827,
        "activation_magnitude_ratio": -0.025892535224556923,
        "activation_dot_product": 0.004402498248964548,
        "encoder_gradient_cosine_similarity": 0.023142969235777855,
        "encoder_gradient_l2_distance": -0.32454514503479004,
        "encoder_gradient_dot_product": -0.01529600564390421,
        "input_gradient_cosine_similarity": 0.03833598271012306,
        "input_gradient_l2_distance": -0.17925657331943512,
        "input_gradient_dot_product": -0.0146969398483634
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6298606639633286,
      "val_r": 0.6637772735650551,
      "n_iterations": 630,
      "coefficients": {
        "right_subspace_overlap_top_k": 72.85150146484375,
        "right_subspace_overlap_bottom_k": -88.92841339111328,
        "interaction_matrix_overlap_top_k": 44.38877868652344,
        "interaction_matrix_overlap_bottom_k": -27.983449935913086,
        "effective_rank": -16.448562622070312,
        "effective_rank_mergeability_score": 7.417191028594971,
        "stable_rank": 25.51403045654297,
        "spectral_gap": -60.60149002075195,
        "singular_value_ratio": -88.2607192993164,
        "layerwise_effective_rank": 24.990421295166016,
        "layerwise_effective_rank_mergeability_score": 9.43873405456543,
        "singular_value_overlap": 93.72869110107422,
        "subspace_overlap": 53.79498291015625,
        "right_subspace_overlap": 103.78233337402344,
        "activation_l2_distance": -110.6910171508789,
        "activation_cosine_similarity": -25.460372924804688,
        "activation_magnitude_ratio": -72.17383575439453,
        "activation_dot_product": 59.15968322753906,
        "encoder_gradient_cosine_similarity": 89.03006744384766,
        "encoder_gradient_l2_distance": -111.34906768798828,
        "encoder_gradient_dot_product": 40.40751266479492,
        "input_gradient_cosine_similarity": 42.406070709228516,
        "input_gradient_l2_distance": -12.856526374816895,
        "input_gradient_dot_product": -51.15900802612305
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5085185585137801,
      "val_r": 0.34638313268128906,
      "n_iterations": 498,
      "coefficients": {
        "right_subspace_overlap_top_k": -171.44093322753906,
        "right_subspace_overlap_bottom_k": -204.38497924804688,
        "interaction_matrix_overlap_top_k": 481.8224182128906,
        "interaction_matrix_overlap_bottom_k": -52.84648895263672,
        "effective_rank": -28.7302188873291,
        "effective_rank_mergeability_score": 339.37213134765625,
        "stable_rank": -162.6066131591797,
        "spectral_gap": -192.4249267578125,
        "singular_value_ratio": 87.62493133544922,
        "layerwise_effective_rank": -71.11528778076172,
        "layerwise_effective_rank_mergeability_score": -393.4107971191406,
        "singular_value_overlap": 45.78190612792969,
        "subspace_overlap": 45.772945404052734,
        "right_subspace_overlap": 172.59219360351562,
        "activation_l2_distance": -178.35488891601562,
        "activation_cosine_similarity": 100.29986572265625,
        "activation_magnitude_ratio": 138.09471130371094,
        "activation_dot_product": 168.52503967285156,
        "encoder_gradient_cosine_similarity": 34.00831604003906,
        "encoder_gradient_l2_distance": -70.12694549560547,
        "encoder_gradient_dot_product": -50.263671875,
        "input_gradient_cosine_similarity": 84.9127197265625,
        "input_gradient_l2_distance": -128.7242889404297,
        "input_gradient_dot_product": 6.619918346405029
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8096551077674361,
      "val_r": 0.8026984586879916,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.3803812265396118,
        "right_subspace_overlap_bottom_k": -1.3359135389328003,
        "interaction_matrix_overlap_top_k": -0.6971014142036438,
        "interaction_matrix_overlap_bottom_k": 0.6739107966423035,
        "effective_rank": 0.502382218837738,
        "effective_rank_mergeability_score": 0.17593912780284882,
        "stable_rank": 0.20385505259037018,
        "spectral_gap": 0.15584228932857513,
        "singular_value_ratio": 0.09402189403772354,
        "layerwise_effective_rank": -0.12591306865215302,
        "layerwise_effective_rank_mergeability_score": 0.47500067949295044,
        "singular_value_overlap": 0.07009761035442352,
        "subspace_overlap": -0.991852879524231,
        "right_subspace_overlap": 0.8128015398979187,
        "activation_l2_distance": 0.32034438848495483,
        "activation_cosine_similarity": 0.9543534517288208,
        "activation_magnitude_ratio": -0.06712817400693893,
        "activation_dot_product": -0.08808905631303787,
        "encoder_gradient_cosine_similarity": 0.1298855096101761,
        "encoder_gradient_l2_distance": -1.0352933406829834,
        "encoder_gradient_dot_product": 0.05844561755657196,
        "input_gradient_cosine_similarity": 0.14015832543373108,
        "input_gradient_l2_distance": -0.5205288529396057,
        "input_gradient_dot_product": -0.28572142124176025
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6462677926420337,
      "val_r": 0.6644283710120356,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 18.9144344329834,
        "right_subspace_overlap_bottom_k": 6.461788177490234,
        "interaction_matrix_overlap_top_k": 71.96820068359375,
        "interaction_matrix_overlap_bottom_k": 2.4048352241516113,
        "effective_rank": 49.8218994140625,
        "effective_rank_mergeability_score": 1.4989858865737915,
        "stable_rank": -17.028331756591797,
        "spectral_gap": -32.11189270019531,
        "singular_value_ratio": -7.4616899490356445,
        "layerwise_effective_rank": -36.909549713134766,
        "layerwise_effective_rank_mergeability_score": 41.54302215576172,
        "singular_value_overlap": 29.743173599243164,
        "subspace_overlap": 15.14294719696045,
        "right_subspace_overlap": -66.50062561035156,
        "activation_l2_distance": -11.594281196594238,
        "activation_cosine_similarity": 17.48607063293457,
        "activation_magnitude_ratio": -31.355714797973633,
        "activation_dot_product": 64.25263977050781,
        "encoder_gradient_cosine_similarity": 20.132619857788086,
        "encoder_gradient_l2_distance": -46.674808502197266,
        "encoder_gradient_dot_product": -18.189743041992188,
        "input_gradient_cosine_similarity": 8.265043258666992,
        "input_gradient_l2_distance": -62.628074645996094,
        "input_gradient_dot_product": -16.182388305664062
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6666756438037058,
      "val_r": 0.4200877925657561,
      "n_iterations": 709,
      "coefficients": {
        "right_subspace_overlap_top_k": -16.48417091369629,
        "right_subspace_overlap_bottom_k": -5.182394504547119,
        "interaction_matrix_overlap_top_k": 69.00476837158203,
        "interaction_matrix_overlap_bottom_k": -61.3601188659668,
        "effective_rank": 20.454896926879883,
        "effective_rank_mergeability_score": 28.054227828979492,
        "stable_rank": 31.76280975341797,
        "spectral_gap": -2.156209707260132,
        "singular_value_ratio": 77.3218765258789,
        "layerwise_effective_rank": -61.87644577026367,
        "layerwise_effective_rank_mergeability_score": 67.87799072265625,
        "singular_value_overlap": 75.51193237304688,
        "subspace_overlap": 36.487152099609375,
        "right_subspace_overlap": -2.380192279815674,
        "activation_l2_distance": -85.78472137451172,
        "activation_cosine_similarity": -29.78803825378418,
        "activation_magnitude_ratio": -3.166142702102661,
        "activation_dot_product": 69.02513122558594,
        "encoder_gradient_cosine_similarity": -59.05473327636719,
        "encoder_gradient_l2_distance": -130.15673828125,
        "encoder_gradient_dot_product": 5.767667770385742,
        "input_gradient_cosine_similarity": 15.713849067687988,
        "input_gradient_l2_distance": -45.1771354675293,
        "input_gradient_dot_product": 6.582747459411621
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7694198762172766,
      "val_r": 0.7208386029045378,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 12.070721626281738,
        "right_subspace_overlap_bottom_k": -16.965320587158203,
        "interaction_matrix_overlap_top_k": 5.423648834228516,
        "interaction_matrix_overlap_bottom_k": -1.2820093631744385,
        "effective_rank": 1.2441725730895996,
        "effective_rank_mergeability_score": -3.196380138397217,
        "stable_rank": -4.461429119110107,
        "spectral_gap": -2.2416696548461914,
        "singular_value_ratio": 4.319924354553223,
        "layerwise_effective_rank": -4.668702125549316,
        "layerwise_effective_rank_mergeability_score": 3.1652607917785645,
        "singular_value_overlap": 5.062388896942139,
        "subspace_overlap": -4.562244892120361,
        "right_subspace_overlap": 7.475691318511963,
        "activation_l2_distance": 3.24541974067688,
        "activation_cosine_similarity": 12.587871551513672,
        "activation_magnitude_ratio": -1.7853903770446777,
        "activation_dot_product": 2.9890050888061523,
        "encoder_gradient_cosine_similarity": 5.041551113128662,
        "encoder_gradient_l2_distance": -9.839753150939941,
        "encoder_gradient_dot_product": 3.1399199962615967,
        "input_gradient_cosine_similarity": 3.140817403793335,
        "input_gradient_l2_distance": -11.843501091003418,
        "input_gradient_dot_product": -7.061460018157959
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5637147988506106,
      "val_r": 0.5631597005728042,
      "n_iterations": 510,
      "coefficients": {
        "right_subspace_overlap_top_k": 45.08248519897461,
        "right_subspace_overlap_bottom_k": -57.912044525146484,
        "interaction_matrix_overlap_top_k": 79.36224365234375,
        "interaction_matrix_overlap_bottom_k": 21.149381637573242,
        "effective_rank": -105.19337463378906,
        "effective_rank_mergeability_score": -30.343460083007812,
        "stable_rank": -15.16292667388916,
        "spectral_gap": -26.930904388427734,
        "singular_value_ratio": 50.3669548034668,
        "layerwise_effective_rank": -41.60940933227539,
        "layerwise_effective_rank_mergeability_score": -25.945220947265625,
        "singular_value_overlap": 90.9689712524414,
        "subspace_overlap": 30.078872680664062,
        "right_subspace_overlap": -14.556699752807617,
        "activation_l2_distance": -71.81240844726562,
        "activation_cosine_similarity": 12.166325569152832,
        "activation_magnitude_ratio": -87.40615844726562,
        "activation_dot_product": 77.47400665283203,
        "encoder_gradient_cosine_similarity": 58.610958099365234,
        "encoder_gradient_l2_distance": -29.589693069458008,
        "encoder_gradient_dot_product": 16.660470962524414,
        "input_gradient_cosine_similarity": 79.6991958618164,
        "input_gradient_l2_distance": -18.148202896118164,
        "input_gradient_dot_product": -36.01232147216797
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8434457231260044,
      "val_r": 0.7271269105603172,
      "n_iterations": 706,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.13304565846920013,
        "right_subspace_overlap_bottom_k": -1.2029260396957397,
        "interaction_matrix_overlap_top_k": -0.45061200857162476,
        "interaction_matrix_overlap_bottom_k": 1.1096901893615723,
        "effective_rank": 0.5815706253051758,
        "effective_rank_mergeability_score": -0.34386831521987915,
        "stable_rank": -0.8374372720718384,
        "spectral_gap": 0.006933585740625858,
        "singular_value_ratio": 0.19082386791706085,
        "layerwise_effective_rank": 0.4711660146713257,
        "layerwise_effective_rank_mergeability_score": 0.7101552486419678,
        "singular_value_overlap": 0.013651767745614052,
        "subspace_overlap": 0.004583925008773804,
        "right_subspace_overlap": 0.6246241331100464,
        "activation_l2_distance": 0.23236966133117676,
        "activation_cosine_similarity": 0.3585260808467865,
        "activation_magnitude_ratio": 0.01025149691849947,
        "activation_dot_product": -0.030817853286862373,
        "encoder_gradient_cosine_similarity": 0.029342228546738625,
        "encoder_gradient_l2_distance": -0.18432177603244781,
        "encoder_gradient_dot_product": 0.007556144148111343,
        "input_gradient_cosine_similarity": 0.02197553589940071,
        "input_gradient_l2_distance": -0.15786153078079224,
        "input_gradient_dot_product": -0.032805152237415314
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7544393379828417,
      "val_r": 0.5755567250158616,
      "n_iterations": 840,
      "coefficients": {
        "right_subspace_overlap_top_k": -6.45759916305542,
        "right_subspace_overlap_bottom_k": -65.86769104003906,
        "interaction_matrix_overlap_top_k": 56.24829864501953,
        "interaction_matrix_overlap_bottom_k": 34.947933197021484,
        "effective_rank": -36.91969680786133,
        "effective_rank_mergeability_score": -18.08863639831543,
        "stable_rank": 21.567323684692383,
        "spectral_gap": -7.6213765144348145,
        "singular_value_ratio": -23.864633560180664,
        "layerwise_effective_rank": 44.24318313598633,
        "layerwise_effective_rank_mergeability_score": 47.059783935546875,
        "singular_value_overlap": 17.93414878845215,
        "subspace_overlap": 38.522926330566406,
        "right_subspace_overlap": -37.52804946899414,
        "activation_l2_distance": -36.700748443603516,
        "activation_cosine_similarity": -17.117942810058594,
        "activation_magnitude_ratio": -27.669479370117188,
        "activation_dot_product": 105.18399047851562,
        "encoder_gradient_cosine_similarity": 16.305883407592773,
        "encoder_gradient_l2_distance": -74.30558013916016,
        "encoder_gradient_dot_product": -31.84343147277832,
        "input_gradient_cosine_similarity": 55.39829635620117,
        "input_gradient_l2_distance": -23.136110305786133,
        "input_gradient_dot_product": -29.292633056640625
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}