{
  "aggregate_metrics": {
    "train_r": 0.17891359136337182,
    "train_p": 1.3912318155259876e-24,
    "val_r": 0.18409811720354996,
    "val_p": 0.00046336208345082577
  },
  "per_fold_stats": {
    "train_r_mean": 0.705871397622871,
    "train_r_std": 0.08947805308757759,
    "val_r_mean": 0.5545710942052537,
    "val_r_std": 0.1648076852524083
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 16.217172622680664,
    "right_subspace_overlap_bottom_k": -12.269826889038086,
    "interaction_matrix_overlap_top_k": 10.097150802612305,
    "interaction_matrix_overlap_bottom_k": -14.775733947753906,
    "effective_rank": 4.421771049499512,
    "effective_rank_mergeability_score": 2.0172879695892334,
    "stable_rank": -5.468749046325684,
    "spectral_gap": -1.8826297521591187,
    "singular_value_ratio": -1.393678903579712,
    "layerwise_effective_rank": -1.6530590057373047,
    "layerwise_effective_rank_mergeability_score": -7.542841911315918,
    "task_vector_cosine_similarity": 5.33427619934082,
    "task_vector_l2_distance": 1.5981534719467163,
    "task_vector_dot_product": 1.9995132684707642,
    "weight_space_angle": 1.9936158657073975,
    "task_vector_magnitude_ratio": -2.3999812602996826,
    "singular_value_overlap": 12.514625549316406,
    "subspace_overlap": 11.776375770568848,
    "activation_l2_distance": -5.260807037353516,
    "activation_cosine_similarity": 3.5630733966827393,
    "activation_magnitude_ratio": -13.262484550476074,
    "activation_dot_product": 7.796156883239746,
    "encoder_gradient_cosine_similarity": 12.075560569763184,
    "encoder_gradient_l2_distance": -19.644845962524414,
    "encoder_gradient_dot_product": -2.0560097694396973,
    "input_gradient_cosine_similarity": -3.8531081676483154,
    "input_gradient_l2_distance": -8.708963394165039,
    "input_gradient_dot_product": -10.31798267364502
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 45.824378967285156,
    "right_subspace_overlap_bottom_k": 24.812183380126953,
    "interaction_matrix_overlap_top_k": 20.77006721496582,
    "interaction_matrix_overlap_bottom_k": 41.538604736328125,
    "effective_rank": 16.657848358154297,
    "effective_rank_mergeability_score": 9.126858711242676,
    "stable_rank": 18.39784049987793,
    "spectral_gap": 10.025642395019531,
    "singular_value_ratio": 7.452380657196045,
    "layerwise_effective_rank": 13.823369026184082,
    "layerwise_effective_rank_mergeability_score": 41.89503479003906,
    "task_vector_cosine_similarity": 23.63102149963379,
    "task_vector_l2_distance": 19.68213653564453,
    "task_vector_dot_product": 8.334638595581055,
    "weight_space_angle": 12.850915908813477,
    "task_vector_magnitude_ratio": 20.67136001586914,
    "singular_value_overlap": 50.12227249145508,
    "subspace_overlap": 37.52310562133789,
    "activation_l2_distance": 23.35011100769043,
    "activation_cosine_similarity": 16.790674209594727,
    "activation_magnitude_ratio": 43.3186149597168,
    "activation_dot_product": 12.998655319213867,
    "encoder_gradient_cosine_similarity": 28.824628829956055,
    "encoder_gradient_l2_distance": 33.50678634643555,
    "encoder_gradient_dot_product": 33.791439056396484,
    "input_gradient_cosine_similarity": 43.086788177490234,
    "input_gradient_l2_distance": 19.81756019592285,
    "input_gradient_dot_product": 21.910812377929688
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.676932970159759,
      "val_r": 0.541924076448876,
      "n_iterations": 632,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.815317153930664,
        "right_subspace_overlap_bottom_k": 4.629868984222412,
        "interaction_matrix_overlap_top_k": 9.687125205993652,
        "interaction_matrix_overlap_bottom_k": -9.287591934204102,
        "effective_rank": -1.7448968887329102,
        "effective_rank_mergeability_score": 9.445255279541016,
        "stable_rank": 4.907670021057129,
        "spectral_gap": -3.726963758468628,
        "singular_value_ratio": -4.972543239593506,
        "layerwise_effective_rank": 3.057689905166626,
        "layerwise_effective_rank_mergeability_score": -2.4242970943450928,
        "task_vector_cosine_similarity": -8.233859062194824,
        "task_vector_l2_distance": -9.642667770385742,
        "task_vector_dot_product": 1.2729228734970093,
        "weight_space_angle": 3.3705897331237793,
        "task_vector_magnitude_ratio": -1.5204594135284424,
        "singular_value_overlap": -4.05494499206543,
        "subspace_overlap": -11.412577629089355,
        "activation_l2_distance": 2.531320810317993,
        "activation_cosine_similarity": 5.692016124725342,
        "activation_magnitude_ratio": -9.601290702819824,
        "activation_dot_product": 16.1361083984375,
        "encoder_gradient_cosine_similarity": 4.235287189483643,
        "encoder_gradient_l2_distance": -8.621488571166992,
        "encoder_gradient_dot_product": 4.2583489418029785,
        "input_gradient_cosine_similarity": 7.108040809631348,
        "input_gradient_l2_distance": -11.200943946838379,
        "input_gradient_dot_product": -17.480745315551758
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3606218996203189,
      "val_r": 0.2646163468022115,
      "n_iterations": 750,
      "coefficients": {
        "right_subspace_overlap_top_k": 209.7996826171875,
        "right_subspace_overlap_bottom_k": -108.91521453857422,
        "interaction_matrix_overlap_top_k": 88.01747131347656,
        "interaction_matrix_overlap_bottom_k": -189.22323608398438,
        "effective_rank": 71.94137573242188,
        "effective_rank_mergeability_score": -18.537752151489258,
        "stable_rank": -84.40901947021484,
        "spectral_gap": -0.3506886661052704,
        "singular_value_ratio": -26.851970672607422,
        "layerwise_effective_rank": 33.32416915893555,
        "layerwise_effective_rank_mergeability_score": -188.26788330078125,
        "task_vector_cosine_similarity": 104.91497802734375,
        "task_vector_l2_distance": 80.69624328613281,
        "task_vector_dot_product": 5.304648399353027,
        "weight_space_angle": 41.95238494873047,
        "task_vector_magnitude_ratio": -90.10459899902344,
        "singular_value_overlap": 230.52420043945312,
        "subspace_overlap": 167.56875610351562,
        "activation_l2_distance": -99.61461639404297,
        "activation_cosine_similarity": -49.047306060791016,
        "activation_magnitude_ratio": -200.71177673339844,
        "activation_dot_product": -9.951485633850098,
        "encoder_gradient_cosine_similarity": 132.50836181640625,
        "encoder_gradient_l2_distance": -148.66036987304688,
        "encoder_gradient_dot_product": -143.86575317382812,
        "input_gradient_cosine_similarity": -188.05648803710938,
        "input_gradient_l2_distance": 52.456512451171875,
        "input_gradient_dot_product": 44.223541259765625
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.722833698070565,
      "val_r": 0.65503142090392,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 18.970111846923828,
        "right_subspace_overlap_bottom_k": -15.439996719360352,
        "interaction_matrix_overlap_top_k": 10.28979206085205,
        "interaction_matrix_overlap_bottom_k": -6.431593894958496,
        "effective_rank": -6.006157875061035,
        "effective_rank_mergeability_score": 0.17464172840118408,
        "stable_rank": -7.137606620788574,
        "spectral_gap": 9.360986709594727,
        "singular_value_ratio": 6.2300238609313965,
        "layerwise_effective_rank": -2.4711170196533203,
        "layerwise_effective_rank_mergeability_score": 2.36083984375,
        "task_vector_cosine_similarity": -8.754404067993164,
        "task_vector_l2_distance": -7.626856327056885,
        "task_vector_dot_product": 1.1018520593643188,
        "weight_space_angle": 2.7626261711120605,
        "task_vector_magnitude_ratio": 13.282713890075684,
        "singular_value_overlap": 0.7720403075218201,
        "subspace_overlap": 5.214878559112549,
        "activation_l2_distance": -6.028151512145996,
        "activation_cosine_similarity": 3.1079392433166504,
        "activation_magnitude_ratio": -4.043381690979004,
        "activation_dot_product": 24.897727966308594,
        "encoder_gradient_cosine_similarity": 9.246057510375977,
        "encoder_gradient_l2_distance": -20.30702018737793,
        "encoder_gradient_dot_product": 10.136849403381348,
        "input_gradient_cosine_similarity": 11.324827194213867,
        "input_gradient_l2_distance": -27.676773071289062,
        "input_gradient_dot_product": -24.347549438476562
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7490761822170471,
      "val_r": 0.6305319663582833,
      "n_iterations": 108,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.8016818761825562,
        "right_subspace_overlap_bottom_k": -0.46532008051872253,
        "interaction_matrix_overlap_top_k": -0.33926764130592346,
        "interaction_matrix_overlap_bottom_k": -0.026932407170534134,
        "effective_rank": 0.5473513603210449,
        "effective_rank_mergeability_score": 0.38051509857177734,
        "stable_rank": 0.08988827466964722,
        "spectral_gap": 0.14336232841014862,
        "singular_value_ratio": 0.1917315274477005,
        "layerwise_effective_rank": -0.10231217741966248,
        "layerwise_effective_rank_mergeability_score": 0.27999675273895264,
        "task_vector_cosine_similarity": 0.013821781612932682,
        "task_vector_l2_distance": -0.02062283642590046,
        "task_vector_dot_product": -0.2630227208137512,
        "weight_space_angle": 0.26179319620132446,
        "task_vector_magnitude_ratio": -0.03761863335967064,
        "singular_value_overlap": -0.026707064360380173,
        "subspace_overlap": 0.2772010862827301,
        "activation_l2_distance": -0.06828649342060089,
        "activation_cosine_similarity": 0.42715024948120117,
        "activation_magnitude_ratio": -0.1475706547498703,
        "activation_dot_product": 0.011079120449721813,
        "encoder_gradient_cosine_similarity": 0.18472294509410858,
        "encoder_gradient_l2_distance": -0.6286116242408752,
        "encoder_gradient_dot_product": 0.19694723188877106,
        "input_gradient_cosine_similarity": 0.036935433745384216,
        "input_gradient_l2_distance": -0.6930220723152161,
        "input_gradient_dot_product": -0.2575126588344574
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7297412074540837,
      "val_r": 0.7000760600016983,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.053845405578613,
        "right_subspace_overlap_bottom_k": -16.34423828125,
        "interaction_matrix_overlap_top_k": 9.892040252685547,
        "interaction_matrix_overlap_bottom_k": 2.6113314628601074,
        "effective_rank": 4.194843292236328,
        "effective_rank_mergeability_score": 9.101902961730957,
        "stable_rank": -4.8049211502075195,
        "spectral_gap": -0.08812663704156876,
        "singular_value_ratio": 3.0195648670196533,
        "layerwise_effective_rank": -3.791459321975708,
        "layerwise_effective_rank_mergeability_score": -5.368062496185303,
        "task_vector_cosine_similarity": -7.3670477867126465,
        "task_vector_l2_distance": -5.824749946594238,
        "task_vector_dot_product": 3.364595651626587,
        "weight_space_angle": 7.7787184715271,
        "task_vector_magnitude_ratio": 1.506390929222107,
        "singular_value_overlap": 0.8383315205574036,
        "subspace_overlap": 8.738720893859863,
        "activation_l2_distance": -0.8141508102416992,
        "activation_cosine_similarity": 8.2622652053833,
        "activation_magnitude_ratio": -1.3874008655548096,
        "activation_dot_product": 8.839762687683105,
        "encoder_gradient_cosine_similarity": 7.139543533325195,
        "encoder_gradient_l2_distance": -19.181638717651367,
        "encoder_gradient_dot_product": 3.616562843322754,
        "input_gradient_cosine_similarity": 4.47452974319458,
        "input_gradient_l2_distance": -15.693343162536621,
        "input_gradient_dot_product": -13.056943893432617
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5914487825874487,
      "val_r": 0.604844894179446,
      "n_iterations": 448,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.2860307693481445,
        "right_subspace_overlap_bottom_k": -30.95191192626953,
        "interaction_matrix_overlap_top_k": 6.469112873077393,
        "interaction_matrix_overlap_bottom_k": -14.460234642028809,
        "effective_rank": -10.462809562683105,
        "effective_rank_mergeability_score": 17.941495895385742,
        "stable_rank": -3.3724663257598877,
        "spectral_gap": -37.39173889160156,
        "singular_value_ratio": -5.055760383605957,
        "layerwise_effective_rank": 1.7656939029693604,
        "layerwise_effective_rank_mergeability_score": 24.489295959472656,
        "task_vector_cosine_similarity": 20.12004852294922,
        "task_vector_l2_distance": 18.528284072875977,
        "task_vector_dot_product": 34.82016372680664,
        "weight_space_angle": -34.18006896972656,
        "task_vector_magnitude_ratio": -0.9449184536933899,
        "singular_value_overlap": 0.6629822254180908,
        "subspace_overlap": 6.154346942901611,
        "activation_l2_distance": -23.900711059570312,
        "activation_cosine_similarity": 23.913555145263672,
        "activation_magnitude_ratio": -17.03206443786621,
        "activation_dot_product": 18.639814376831055,
        "encoder_gradient_cosine_similarity": 4.5263543128967285,
        "encoder_gradient_l2_distance": -16.4912166595459,
        "encoder_gradient_dot_product": 20.862592697143555,
        "input_gradient_cosine_similarity": 27.641725540161133,
        "input_gradient_l2_distance": -22.591867446899414,
        "input_gradient_dot_product": -63.45818328857422
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.6781156970958873,
      "val_r": 0.4419635347946478,
      "n_iterations": 63,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.31633874773979187,
        "right_subspace_overlap_bottom_k": -0.4742818772792816,
        "interaction_matrix_overlap_top_k": 0.2973743975162506,
        "interaction_matrix_overlap_bottom_k": -0.5336677432060242,
        "effective_rank": 0.03916396573185921,
        "effective_rank_mergeability_score": 0.16545253992080688,
        "stable_rank": -0.1929600089788437,
        "spectral_gap": -0.21910229325294495,
        "singular_value_ratio": -0.012248249724507332,
        "layerwise_effective_rank": 0.07468129694461823,
        "layerwise_effective_rank_mergeability_score": 0.10259929299354553,
        "task_vector_cosine_similarity": -0.032503627240657806,
        "task_vector_l2_distance": -0.13011956214904785,
        "task_vector_dot_product": 0.16391851007938385,
        "weight_space_angle": 0.27308720350265503,
        "task_vector_magnitude_ratio": -0.05416969209909439,
        "singular_value_overlap": 0.160114124417305,
        "subspace_overlap": 0.031269967555999756,
        "activation_l2_distance": 0.223025381565094,
        "activation_cosine_similarity": 0.44003182649612427,
        "activation_magnitude_ratio": 0.05608619377017021,
        "activation_dot_product": 0.4239165186882019,
        "encoder_gradient_cosine_similarity": 0.3394419252872467,
        "encoder_gradient_l2_distance": -0.1896318942308426,
        "encoder_gradient_dot_product": 0.4763224422931671,
        "input_gradient_cosine_similarity": 0.10404834151268005,
        "input_gradient_l2_distance": -0.6326910853385925,
        "input_gradient_dot_product": -0.7073999047279358
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7213643498814806,
      "val_r": 0.3614211052586382,
      "n_iterations": 807,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.889920711517334,
        "right_subspace_overlap_bottom_k": -3.7319159507751465,
        "interaction_matrix_overlap_top_k": 0.36062416434288025,
        "interaction_matrix_overlap_bottom_k": -2.1237573623657227,
        "effective_rank": 1.1828153133392334,
        "effective_rank_mergeability_score": -2.183972120285034,
        "stable_rank": 0.06732881814241409,
        "spectral_gap": -2.2785768508911133,
        "singular_value_ratio": 2.4805095195770264,
        "layerwise_effective_rank": -1.7104568481445312,
        "layerwise_effective_rank_mergeability_score": 4.461458206176758,
        "task_vector_cosine_similarity": -1.6804898977279663,
        "task_vector_l2_distance": -2.137495517730713,
        "task_vector_dot_product": -3.9693715572357178,
        "weight_space_angle": 3.546438217163086,
        "task_vector_magnitude_ratio": -3.9728012084960938,
        "singular_value_overlap": -0.05120572820305824,
        "subspace_overlap": 0.1524745523929596,
        "activation_l2_distance": 1.3926353454589844,
        "activation_cosine_similarity": 6.422201156616211,
        "activation_magnitude_ratio": -1.3081556558609009,
        "activation_dot_product": 2.198533535003662,
        "encoder_gradient_cosine_similarity": 2.676455497741699,
        "encoder_gradient_l2_distance": -9.952215194702148,
        "encoder_gradient_dot_product": 0.9363927245140076,
        "input_gradient_cosine_similarity": 1.8966128826141357,
        "input_gradient_l2_distance": -5.12717866897583,
        "input_gradient_dot_product": -0.22394254803657532
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7175558651694084,
      "val_r": 0.33976592998457045,
      "n_iterations": 68,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.21996255218982697,
        "right_subspace_overlap_bottom_k": -0.5454623699188232,
        "interaction_matrix_overlap_top_k": 0.39658838510513306,
        "interaction_matrix_overlap_bottom_k": -0.3710300028324127,
        "effective_rank": -0.17206071317195892,
        "effective_rank_mergeability_score": 0.059691715985536575,
        "stable_rank": -0.2291603535413742,
        "spectral_gap": -0.019543062895536423,
        "singular_value_ratio": 0.08417581766843796,
        "layerwise_effective_rank": -0.03212916851043701,
        "layerwise_effective_rank_mergeability_score": 0.24600829184055328,
        "task_vector_cosine_similarity": 0.30097100138664246,
        "task_vector_l2_distance": -0.11517414450645447,
        "task_vector_dot_product": -0.006742686033248901,
        "weight_space_angle": 0.09855491667985916,
        "task_vector_magnitude_ratio": 0.2656111419200897,
        "singular_value_overlap": 0.059233587235212326,
        "subspace_overlap": 0.11026331782341003,
        "activation_l2_distance": -0.003208861453458667,
        "activation_cosine_similarity": 0.4522183835506439,
        "activation_magnitude_ratio": -0.19970308244228363,
        "activation_dot_product": 0.5451598167419434,
        "encoder_gradient_cosine_similarity": 0.4769684672355652,
        "encoder_gradient_l2_distance": -0.606772243976593,
        "encoder_gradient_dot_product": 0.2019534409046173,
        "input_gradient_cosine_similarity": 0.36468127369880676,
        "input_gradient_l2_distance": -0.6169788837432861,
        "input_gradient_dot_product": -0.5995616316795349
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6974007591651423,
      "val_r": 0.3358086545634455,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 14.53312873840332,
        "right_subspace_overlap_bottom_k": 9.527280807495117,
        "interaction_matrix_overlap_top_k": 33.93510437011719,
        "interaction_matrix_overlap_bottom_k": -33.918190002441406,
        "effective_rank": 20.30340003967285,
        "effective_rank_mergeability_score": 3.0546083450317383,
        "stable_rank": -1.244361400604248,
        "spectral_gap": 7.838093280792236,
        "singular_value_ratio": 4.759158134460449,
        "layerwise_effective_rank": -40.58120346069336,
        "layerwise_effective_rank_mergeability_score": 5.787209987640381,
        "task_vector_cosine_similarity": 1.1980005502700806,
        "task_vector_l2_distance": -22.82044219970703,
        "task_vector_dot_product": 1.884382963180542,
        "weight_space_angle": 11.858755111694336,
        "task_vector_magnitude_ratio": 14.331391334533691,
        "singular_value_overlap": 7.462627410888672,
        "subspace_overlap": 46.09190368652344,
        "activation_l2_distance": 13.61451530456543,
        "activation_cosine_similarity": -8.730682373046875,
        "activation_magnitude_ratio": 0.3296162486076355,
        "activation_dot_product": -0.8203742504119873,
        "encoder_gradient_cosine_similarity": 25.498985290527344,
        "encoder_gradient_l2_distance": -38.22882080078125,
        "encoder_gradient_dot_product": 12.770146369934082,
        "input_gradient_cosine_similarity": 11.27940845489502,
        "input_gradient_l2_distance": -44.37928009033203,
        "input_gradient_dot_product": -27.98634147644043
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7572814346831539,
      "val_r": 0.3686590946915813,
      "n_iterations": 97,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5320411324501038,
        "right_subspace_overlap_bottom_k": -0.715450644493103,
        "interaction_matrix_overlap_top_k": 0.7240767478942871,
        "interaction_matrix_overlap_bottom_k": -0.16314077377319336,
        "effective_rank": -0.0832231268286705,
        "effective_rank_mergeability_score": 0.3025127351284027,
        "stable_rank": -0.2116202414035797,
        "spectral_gap": -0.046085961163043976,
        "singular_value_ratio": -0.1579410582780838,
        "layerwise_effective_rank": 0.302743524312973,
        "layerwise_effective_rank_mergeability_score": -0.06157970800995827,
        "task_vector_cosine_similarity": 0.0032044367399066687,
        "task_vector_l2_distance": 0.15639358758926392,
        "task_vector_dot_product": -0.3497677743434906,
        "weight_space_angle": 0.6905907988548279,
        "task_vector_magnitude_ratio": 0.22244474291801453,
        "singular_value_overlap": 0.33516424894332886,
        "subspace_overlap": -0.13971047103405,
        "activation_l2_distance": -0.27607017755508423,
        "activation_cosine_similarity": 0.6668900847434998,
        "activation_magnitude_ratio": -0.10573003441095352,
        "activation_dot_product": 0.6134838461875916,
        "encoder_gradient_cosine_similarity": 0.19062578678131104,
        "encoder_gradient_l2_distance": -0.9975411891937256,
        "encoder_gradient_dot_product": 0.12054763734340668,
        "input_gradient_cosine_similarity": 0.2802627384662628,
        "input_gradient_l2_distance": -0.7254942655563354,
        "input_gradient_dot_product": -0.3957917094230652
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7450351799215662,
      "val_r": 0.7978431897156826,
      "n_iterations": 293,
      "coefficients": {
        "right_subspace_overlap_top_k": -1.0713176727294922,
        "right_subspace_overlap_bottom_k": -3.819715738296509,
        "interaction_matrix_overlap_top_k": 3.606071710586548,
        "interaction_matrix_overlap_bottom_k": -0.32081520557403564,
        "effective_rank": -1.3201253414154053,
        "effective_rank_mergeability_score": 0.3157537877559662,
        "stable_rank": 0.06818065047264099,
        "spectral_gap": 1.4910119771957397,
        "singular_value_ratio": 0.49796685576438904,
        "layerwise_effective_rank": 0.6839932799339294,
        "layerwise_effective_rank_mergeability_score": -1.3372467756271362,
        "task_vector_cosine_similarity": 1.7603923082351685,
        "task_vector_l2_distance": 1.242098093032837,
        "task_vector_dot_product": -1.625746250152588,
        "weight_space_angle": 2.4344100952148438,
        "task_vector_magnitude_ratio": 0.9070224165916443,
        "singular_value_overlap": 0.2877458333969116,
        "subspace_overlap": 2.2699267864227295,
        "activation_l2_distance": -0.9969121813774109,
        "activation_cosine_similarity": 2.903012990951538,
        "activation_magnitude_ratio": -0.5587271451950073,
        "activation_dot_product": -1.1261757612228394,
        "encoder_gradient_cosine_similarity": 1.0335348844528198,
        "encoder_gradient_l2_distance": -4.41804313659668,
        "encoder_gradient_dot_product": 0.7095075249671936,
        "input_gradient_cosine_similarity": 0.5514401197433472,
        "input_gradient_l2_distance": -2.4981939792633057,
        "input_gradient_dot_product": -2.1054980754852295
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7688676559301484,
      "val_r": 0.7563361986748638,
      "n_iterations": 325,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.8433433771133423,
        "right_subspace_overlap_bottom_k": -1.1306838989257812,
        "interaction_matrix_overlap_top_k": -0.6230878829956055,
        "interaction_matrix_overlap_bottom_k": 0.5359100103378296,
        "effective_rank": 1.0861247777938843,
        "effective_rank_mergeability_score": 0.19836612045764923,
        "stable_rank": 0.14102144539356232,
        "spectral_gap": 0.45349568128585815,
        "singular_value_ratio": 1.3444000482559204,
        "layerwise_effective_rank": -0.7321234345436096,
        "layerwise_effective_rank_mergeability_score": 0.2618792653083801,
        "task_vector_cosine_similarity": 0.179424449801445,
        "task_vector_l2_distance": -0.046065494418144226,
        "task_vector_dot_product": -0.06658843159675598,
        "weight_space_angle": -0.7403674125671387,
        "task_vector_magnitude_ratio": -1.0316598415374756,
        "singular_value_overlap": -0.08917377144098282,
        "subspace_overlap": -0.7872757315635681,
        "activation_l2_distance": 0.8761737942695618,
        "activation_cosine_similarity": 1.5770047903060913,
        "activation_magnitude_ratio": -0.043277308344841,
        "activation_dot_product": -0.10110093653202057,
        "encoder_gradient_cosine_similarity": 0.30054619908332825,
        "encoder_gradient_l2_distance": -0.9722083806991577,
        "encoder_gradient_dot_product": 0.3251776397228241,
        "input_gradient_cosine_similarity": 0.1832534819841385,
        "input_gradient_l2_distance": -1.2033429145812988,
        "input_gradient_dot_product": -0.6067425012588501
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7181464681990217,
      "val_r": 0.7454119076206862,
      "n_iterations": 70,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.7250922918319702,
        "right_subspace_overlap_bottom_k": 0.1896282583475113,
        "interaction_matrix_overlap_top_k": 0.8904145359992981,
        "interaction_matrix_overlap_bottom_k": -0.7642300128936768,
        "effective_rank": 0.45879244804382324,
        "effective_rank_mergeability_score": 0.4242492616176605,
        "stable_rank": 0.048749666661024094,
        "spectral_gap": -0.3035438358783722,
        "singular_value_ratio": 0.698379635810852,
        "layerwise_effective_rank": -0.4351002275943756,
        "layerwise_effective_rank_mergeability_score": 0.12218160927295685,
        "task_vector_cosine_similarity": -0.11576194316148758,
        "task_vector_l2_distance": -0.23259896039962769,
        "task_vector_dot_product": -0.29378876090049744,
        "weight_space_angle": 0.4476773738861084,
        "task_vector_magnitude_ratio": -0.8350369334220886,
        "singular_value_overlap": -0.06707438081502914,
        "subspace_overlap": -0.5281137228012085,
        "activation_l2_distance": 0.3589142858982086,
        "activation_cosine_similarity": 0.8528138995170593,
        "activation_magnitude_ratio": -0.20124340057373047,
        "activation_dot_product": 0.335062175989151,
        "encoder_gradient_cosine_similarity": 0.2645570635795593,
        "encoder_gradient_l2_distance": -0.22746555507183075,
        "encoder_gradient_dot_product": 0.4270620048046112,
        "input_gradient_cosine_similarity": 0.1854049563407898,
        "input_gradient_l2_distance": -1.5793066024780273,
        "input_gradient_dot_product": -0.6001600027084351
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7541648001656969,
      "val_r": 0.7541533796865081,
      "n_iterations": 866,
      "coefficients": {
        "right_subspace_overlap_top_k": 13.62271785736084,
        "right_subspace_overlap_bottom_k": -10.57902717590332,
        "interaction_matrix_overlap_top_k": -15.763096809387207,
        "interaction_matrix_overlap_bottom_k": -0.09486667066812515,
        "effective_rank": 5.766915798187256,
        "effective_rank_mergeability_score": 2.82585072517395,
        "stable_rank": -0.06560245156288147,
        "spectral_gap": 4.334436416625977,
        "singular_value_ratio": -1.3411279916763306,
        "layerwise_effective_rank": -4.630183219909668,
        "layerwise_effective_rank_mergeability_score": 1.882986307144165,
        "task_vector_cosine_similarity": -3.2278923988342285,
        "task_vector_l2_distance": -1.1760627031326294,
        "task_vector_dot_product": -3.9846274852752686,
        "weight_space_angle": 9.0840425491333,
        "task_vector_magnitude_ratio": 6.735730171203613,
        "singular_value_overlap": 0.7447359561920166,
        "subspace_overlap": 7.073623180389404,
        "activation_l2_distance": -6.424607276916504,
        "activation_cosine_similarity": 1.247839093208313,
        "activation_magnitude_ratio": -2.5842738151550293,
        "activation_dot_product": 6.841739177703857,
        "encoder_gradient_cosine_similarity": 3.205951452255249,
        "encoder_gradient_l2_distance": -14.029099464416504,
        "encoder_gradient_dot_product": 2.411710500717163,
        "input_gradient_cosine_similarity": 1.6459964513778687,
        "input_gradient_l2_distance": -11.112086296081543,
        "input_gradient_dot_product": -5.389786243438721
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.755700701293802,
      "val_r": 0.5855240256990969,
      "n_iterations": 90,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.23786698281764984,
        "right_subspace_overlap_bottom_k": -0.039035290479660034,
        "interaction_matrix_overlap_top_k": 0.8960493206977844,
        "interaction_matrix_overlap_bottom_k": -1.5365550518035889,
        "effective_rank": -1.087588906288147,
        "effective_rank_mergeability_score": 1.1710397005081177,
        "stable_rank": 0.734836220741272,
        "spectral_gap": -0.19183777272701263,
        "singular_value_ratio": 0.5465719699859619,
        "layerwise_effective_rank": 1.8736424446105957,
        "layerwise_effective_rank_mergeability_score": 0.9136219620704651,
        "task_vector_cosine_similarity": -0.1607847660779953,
        "task_vector_l2_distance": -0.44977399706840515,
        "task_vector_dot_product": -0.03332000970840454,
        "weight_space_angle": -0.013159776106476784,
        "task_vector_magnitude_ratio": -0.37140852212905884,
        "singular_value_overlap": 0.5809482336044312,
        "subspace_overlap": -0.6551255583763123,
        "activation_l2_distance": -0.5070301294326782,
        "activation_cosine_similarity": 0.44688451290130615,
        "activation_magnitude_ratio": -0.36530107259750366,
        "activation_dot_product": -0.10903163254261017,
        "encoder_gradient_cosine_similarity": 0.3893975615501404,
        "encoder_gradient_l2_distance": -1.2832438945770264,
        "encoder_gradient_dot_product": 0.4651903212070465,
        "input_gradient_cosine_similarity": 0.12071596086025238,
        "input_gradient_l2_distance": -1.4192270040512085,
        "input_gradient_dot_product": -0.6559588313102722
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.770315667293121,
      "val_r": 0.6914143282686217,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.4458434581756592,
        "right_subspace_overlap_bottom_k": -2.199974298477173,
        "interaction_matrix_overlap_top_k": -0.06459463387727737,
        "interaction_matrix_overlap_bottom_k": 0.7128434181213379,
        "effective_rank": 0.9092509746551514,
        "effective_rank_mergeability_score": -0.7859585881233215,
        "stable_rank": -0.05640888959169388,
        "spectral_gap": -0.16699905693531036,
        "singular_value_ratio": -0.3309541940689087,
        "layerwise_effective_rank": 0.06337163597345352,
        "layerwise_effective_rank_mergeability_score": 2.1672143936157227,
        "task_vector_cosine_similarity": -0.15603652596473694,
        "task_vector_l2_distance": -0.6576847434043884,
        "task_vector_dot_product": 0.20422795414924622,
        "weight_space_angle": 1.7141278982162476,
        "task_vector_magnitude_ratio": 0.10509372502565384,
        "singular_value_overlap": -0.11376918852329254,
        "subspace_overlap": -1.127976894378662,
        "activation_l2_distance": 0.09830201417207718,
        "activation_cosine_similarity": 1.5503146648406982,
        "activation_magnitude_ratio": -0.49828752875328064,
        "activation_dot_product": 0.4348021149635315,
        "encoder_gradient_cosine_similarity": 0.6141040921211243,
        "encoder_gradient_l2_distance": -3.137753963470459,
        "encoder_gradient_dot_product": 0.4283727705478668,
        "input_gradient_cosine_similarity": 0.3809482455253601,
        "input_gradient_l2_distance": -1.9681750535964966,
        "input_gradient_dot_product": -1.0944602489471436
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6944845155234693,
      "val_r": 0.5051484656097774,
      "n_iterations": 828,
      "coefficients": {
        "right_subspace_overlap_top_k": 39.14086151123047,
        "right_subspace_overlap_bottom_k": -33.97603988647461,
        "interaction_matrix_overlap_top_k": 8.726351737976074,
        "interaction_matrix_overlap_bottom_k": -39.46354675292969,
        "effective_rank": 0.9633752107620239,
        "effective_rank_mergeability_score": 24.692424774169922,
        "stable_rank": -11.009618759155273,
        "spectral_gap": -21.631471633911133,
        "singular_value_ratio": -15.768760681152344,
        "layerwise_effective_rank": 4.617624282836914,
        "layerwise_effective_rank_mergeability_score": -5.206801414489746,
        "task_vector_cosine_similarity": 9.3599214553833,
        "task_vector_l2_distance": -7.272907733917236,
        "task_vector_dot_product": 11.602835655212402,
        "weight_space_angle": -4.5597758293151855,
        "task_vector_magnitude_ratio": 0.22418048977851868,
        "singular_value_overlap": 9.74125862121582,
        "subspace_overlap": 6.562191009521484,
        "activation_l2_distance": -3.909294366836548,
        "activation_cosine_similarity": 30.637453079223633,
        "activation_magnitude_ratio": -9.287038803100586,
        "activation_dot_product": 48.209896087646484,
        "encoder_gradient_cosine_similarity": 31.279603958129883,
        "encoder_gradient_l2_distance": -64.69853210449219,
        "encoder_gradient_dot_product": 38.24519729614258,
        "input_gradient_cosine_similarity": 28.8342227935791,
        "input_gradient_l2_distance": -44.81773376464844,
        "input_gradient_dot_product": -56.52177429199219
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7764968174391276,
      "val_r": 0.3680041657422846,
      "n_iterations": 960,
      "coefficients": {
        "right_subspace_overlap_top_k": 13.220345497131348,
        "right_subspace_overlap_bottom_k": -22.980403900146484,
        "interaction_matrix_overlap_top_k": 15.339821815490723,
        "interaction_matrix_overlap_bottom_k": 1.878669261932373,
        "effective_rank": -7.521065711975098,
        "effective_rank_mergeability_score": 6.7562785148620605,
        "stable_rank": 0.41960060596466064,
        "spectral_gap": 0.10466578602790833,
        "singular_value_ratio": -0.16706210374832153,
        "layerwise_effective_rank": 7.058103561401367,
        "layerwise_effective_rank_mergeability_score": 0.6766413450241089,
        "task_vector_cosine_similarity": 2.4684183597564697,
        "task_vector_l2_distance": 2.5392093658447266,
        "task_vector_dot_product": -4.623972415924072,
        "weight_space_angle": 3.026949882507324,
        "task_vector_magnitude_ratio": 5.470572471618652,
        "singular_value_overlap": 6.859819412231445,
        "subspace_overlap": -13.392448425292969,
        "activation_l2_distance": -6.821552276611328,
        "activation_cosine_similarity": -1.1574329137802124,
        "activation_magnitude_ratio": -1.2832685708999634,
        "activation_dot_product": 17.223928451538086,
        "encoder_gradient_cosine_similarity": 8.153797149658203,
        "encoder_gradient_l2_distance": -29.030370712280273,
        "encoder_gradient_dot_product": 2.012813091278076,
        "input_gradient_cosine_similarity": 3.66825532913208,
        "input_gradient_l2_distance": -4.27972412109375,
        "input_gradient_dot_product": -12.61678695678711
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7318433005871742,
      "val_r": 0.6429431391002373,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -22.039384841918945,
        "right_subspace_overlap_bottom_k": -7.4346160888671875,
        "interaction_matrix_overlap_top_k": 29.20502281188965,
        "interaction_matrix_overlap_bottom_k": -2.533996343612671,
        "effective_rank": 9.439937591552734,
        "effective_rank_mergeability_score": -15.156596183776855,
        "stable_rank": -3.118504047393799,
        "spectral_gap": 5.036024570465088,
        "singular_value_ratio": 6.932306289672852,
        "layerwise_effective_rank": -31.396808624267578,
        "layerwise_effective_rank_mergeability_score": 8.057121276855469,
        "task_vector_cosine_similarity": -3.9048988819122314,
        "task_vector_l2_distance": -13.045931816101074,
        "task_vector_dot_product": -4.512324333190918,
        "weight_space_angle": -9.935051918029785,
        "task_vector_magnitude_ratio": 7.821897983551025,
        "singular_value_overlap": -4.33380651473999,
        "subspace_overlap": 13.325182914733887,
        "activation_l2_distance": 25.053546905517578,
        "activation_cosine_similarity": 41.597293853759766,
        "activation_magnitude_ratio": -16.276927947998047,
        "activation_dot_product": 22.680309295654297,
        "encoder_gradient_cosine_similarity": 9.24690055847168,
        "encoder_gradient_l2_distance": -11.234892845153809,
        "encoder_gradient_dot_product": 4.143852233886719,
        "input_gradient_cosine_similarity": 10.913002967834473,
        "input_gradient_l2_distance": -28.420408248901367,
        "input_gradient_dot_product": -22.478050231933594
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}