{
  "aggregate_metrics": {
    "train_r": 0.19028974930235687,
    "train_p": 1.1928867713173494e-27,
    "val_r": 0.06199008854312295,
    "val_p": 0.24202871968255427
  },
  "per_fold_stats": {
    "train_r_mean": 0.4341764130828191,
    "train_r_std": 0.08860438510898413,
    "val_r_mean": 0.3280096782406471,
    "val_r_std": 0.2267723613913172
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 17.938350677490234,
    "right_subspace_overlap_bottom_k": 35.01589584350586,
    "interaction_matrix_overlap_top_k": 7.740365505218506,
    "interaction_matrix_overlap_bottom_k": 30.283626556396484,
    "effective_rank": -5.151604652404785,
    "effective_rank_mergeability_score": 2.6388018131256104,
    "stable_rank": 5.079964637756348,
    "spectral_gap": 9.177169799804688,
    "singular_value_ratio": -1.8075571060180664,
    "layerwise_effective_rank": -2.965121030807495,
    "layerwise_effective_rank_mergeability_score": 7.969317436218262,
    "task_vector_cosine_similarity": -3.917130947113037,
    "task_vector_l2_distance": -21.649877548217773,
    "task_vector_dot_product": -4.729440689086914,
    "weight_space_angle": 6.985878944396973,
    "task_vector_magnitude_ratio": -13.369237899780273,
    "singular_value_overlap": -27.103748321533203,
    "subspace_overlap": 15.006375312805176,
    "activation_l2_distance": -9.562759399414062,
    "activation_cosine_similarity": -0.4627331793308258,
    "activation_magnitude_ratio": -10.791788101196289,
    "activation_dot_product": -5.468896389007568,
    "encoder_gradient_cosine_similarity": 6.039186000823975,
    "encoder_gradient_l2_distance": -33.3134880065918,
    "encoder_gradient_dot_product": 11.208719253540039,
    "input_gradient_cosine_similarity": 14.00854778289795,
    "input_gradient_l2_distance": -36.2991943359375,
    "input_gradient_dot_product": -24.029207229614258
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 39.590003967285156,
    "right_subspace_overlap_bottom_k": 37.4339485168457,
    "interaction_matrix_overlap_top_k": 21.259687423706055,
    "interaction_matrix_overlap_bottom_k": 32.478336334228516,
    "effective_rank": 22.158580780029297,
    "effective_rank_mergeability_score": 29.13016700744629,
    "stable_rank": 24.197223663330078,
    "spectral_gap": 22.79207420349121,
    "singular_value_ratio": 27.51042938232422,
    "layerwise_effective_rank": 28.058137893676758,
    "layerwise_effective_rank_mergeability_score": 31.069971084594727,
    "task_vector_cosine_similarity": 21.3523006439209,
    "task_vector_l2_distance": 25.826208114624023,
    "task_vector_dot_product": 35.2996826171875,
    "weight_space_angle": 35.91207504272461,
    "task_vector_magnitude_ratio": 31.203750610351562,
    "singular_value_overlap": 33.935516357421875,
    "subspace_overlap": 19.117233276367188,
    "activation_l2_distance": 22.16206932067871,
    "activation_cosine_similarity": 23.19867706298828,
    "activation_magnitude_ratio": 26.73688316345215,
    "activation_dot_product": 34.65753936767578,
    "encoder_gradient_cosine_similarity": 19.836931228637695,
    "encoder_gradient_l2_distance": 36.45439147949219,
    "encoder_gradient_dot_product": 14.959484100341797,
    "input_gradient_cosine_similarity": 27.54352569580078,
    "input_gradient_l2_distance": 39.10694885253906,
    "input_gradient_dot_product": 41.709495544433594
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.43637115177059077,
      "val_r": 0.4362766681114702,
      "n_iterations": 118,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.472589492797852,
        "right_subspace_overlap_bottom_k": 6.7315239906311035,
        "interaction_matrix_overlap_top_k": 5.97247314453125,
        "interaction_matrix_overlap_bottom_k": -0.9390110969543457,
        "effective_rank": 5.8185834884643555,
        "effective_rank_mergeability_score": 0.854306697845459,
        "stable_rank": -7.244290351867676,
        "spectral_gap": 6.661945819854736,
        "singular_value_ratio": 4.557575225830078,
        "layerwise_effective_rank": 8.978670120239258,
        "layerwise_effective_rank_mergeability_score": 5.227047920227051,
        "task_vector_cosine_similarity": 6.999259948730469,
        "task_vector_l2_distance": -1.0392751693725586,
        "task_vector_dot_product": 2.3031349182128906,
        "weight_space_angle": -2.6073217391967773,
        "task_vector_magnitude_ratio": -5.422670841217041,
        "singular_value_overlap": -19.41145896911621,
        "subspace_overlap": 8.451225280761719,
        "activation_l2_distance": -12.81315803527832,
        "activation_cosine_similarity": 4.351417064666748,
        "activation_magnitude_ratio": -1.4981119632720947,
        "activation_dot_product": -15.870010375976562,
        "encoder_gradient_cosine_similarity": -1.367856740951538,
        "encoder_gradient_l2_distance": -10.963923454284668,
        "encoder_gradient_dot_product": 0.9812805652618408,
        "input_gradient_cosine_similarity": 10.691497802734375,
        "input_gradient_l2_distance": -5.869184494018555,
        "input_gradient_dot_product": -11.684700965881348
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.43320599370155677,
      "val_r": 0.35000357329746334,
      "n_iterations": 363,
      "coefficients": {
        "right_subspace_overlap_top_k": 38.40121078491211,
        "right_subspace_overlap_bottom_k": 30.975542068481445,
        "interaction_matrix_overlap_top_k": 46.75655746459961,
        "interaction_matrix_overlap_bottom_k": 43.194740295410156,
        "effective_rank": -5.852539539337158,
        "effective_rank_mergeability_score": 33.11430740356445,
        "stable_rank": 36.16534423828125,
        "spectral_gap": 15.958614349365234,
        "singular_value_ratio": -16.046218872070312,
        "layerwise_effective_rank": 43.18035125732422,
        "layerwise_effective_rank_mergeability_score": 39.64760208129883,
        "task_vector_cosine_similarity": -37.17354965209961,
        "task_vector_l2_distance": -43.1589469909668,
        "task_vector_dot_product": -28.141672134399414,
        "weight_space_angle": -37.15380096435547,
        "task_vector_magnitude_ratio": -14.584891319274902,
        "singular_value_overlap": -1.2236307859420776,
        "subspace_overlap": 23.741323471069336,
        "activation_l2_distance": -42.58610916137695,
        "activation_cosine_similarity": -38.95135498046875,
        "activation_magnitude_ratio": -24.29658317565918,
        "activation_dot_product": 10.08937931060791,
        "encoder_gradient_cosine_similarity": 10.15212631225586,
        "encoder_gradient_l2_distance": -69.36176300048828,
        "encoder_gradient_dot_product": 44.50920867919922,
        "input_gradient_cosine_similarity": 52.893089294433594,
        "input_gradient_l2_distance": -63.65631866455078,
        "input_gradient_dot_product": -42.73362350463867
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4127423321110317,
      "val_r": 0.3236707143942362,
      "n_iterations": 447,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.951173782348633,
        "right_subspace_overlap_bottom_k": 45.777278900146484,
        "interaction_matrix_overlap_top_k": 15.97770881652832,
        "interaction_matrix_overlap_bottom_k": 44.78507995605469,
        "effective_rank": -6.196205139160156,
        "effective_rank_mergeability_score": -16.771053314208984,
        "stable_rank": -12.141021728515625,
        "spectral_gap": 33.08909606933594,
        "singular_value_ratio": -1.052532434463501,
        "layerwise_effective_rank": 0.8811860084533691,
        "layerwise_effective_rank_mergeability_score": 11.876771926879883,
        "task_vector_cosine_similarity": -25.22520637512207,
        "task_vector_l2_distance": -30.594314575195312,
        "task_vector_dot_product": 30.84422492980957,
        "weight_space_angle": 1.4257915019989014,
        "task_vector_magnitude_ratio": 3.579155445098877,
        "singular_value_overlap": 1.9921365976333618,
        "subspace_overlap": 33.13579177856445,
        "activation_l2_distance": -25.214168548583984,
        "activation_cosine_similarity": 23.4373836517334,
        "activation_magnitude_ratio": -40.42463302612305,
        "activation_dot_product": -56.70796203613281,
        "encoder_gradient_cosine_similarity": -3.714423179626465,
        "encoder_gradient_l2_distance": -36.870906829833984,
        "encoder_gradient_dot_product": 39.42613983154297,
        "input_gradient_cosine_similarity": 16.49706268310547,
        "input_gradient_l2_distance": -51.933128356933594,
        "input_gradient_dot_product": -11.716316223144531
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.49533059403271407,
      "val_r": 0.47905657137239144,
      "n_iterations": 968,
      "coefficients": {
        "right_subspace_overlap_top_k": 19.1173152923584,
        "right_subspace_overlap_bottom_k": 10.346872329711914,
        "interaction_matrix_overlap_top_k": -15.575028419494629,
        "interaction_matrix_overlap_bottom_k": 38.917877197265625,
        "effective_rank": 3.8361024856567383,
        "effective_rank_mergeability_score": -29.352767944335938,
        "stable_rank": 23.606311798095703,
        "spectral_gap": 16.928258895874023,
        "singular_value_ratio": 27.164297103881836,
        "layerwise_effective_rank": -6.211184978485107,
        "layerwise_effective_rank_mergeability_score": 42.76747512817383,
        "task_vector_cosine_similarity": 4.081961631774902,
        "task_vector_l2_distance": -20.53386116027832,
        "task_vector_dot_product": -11.007296562194824,
        "weight_space_angle": 38.97189712524414,
        "task_vector_magnitude_ratio": -41.74916076660156,
        "singular_value_overlap": -18.12070083618164,
        "subspace_overlap": 29.178464889526367,
        "activation_l2_distance": -8.253798484802246,
        "activation_cosine_similarity": 8.01998519897461,
        "activation_magnitude_ratio": -19.035837173461914,
        "activation_dot_product": -19.960264205932617,
        "encoder_gradient_cosine_similarity": -2.2246532440185547,
        "encoder_gradient_l2_distance": -13.481712341308594,
        "encoder_gradient_dot_product": 32.2896728515625,
        "input_gradient_cosine_similarity": -18.999996185302734,
        "input_gradient_l2_distance": -51.6826171875,
        "input_gradient_dot_product": -33.69929122924805
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4519700897707759,
      "val_r": 0.3382519315023582,
      "n_iterations": 899,
      "coefficients": {
        "right_subspace_overlap_top_k": -101.88894653320312,
        "right_subspace_overlap_bottom_k": 90.68684387207031,
        "interaction_matrix_overlap_top_k": -1.143739938735962,
        "interaction_matrix_overlap_bottom_k": 91.78868103027344,
        "effective_rank": -10.568662643432617,
        "effective_rank_mergeability_score": 77.47010040283203,
        "stable_rank": 10.215014457702637,
        "spectral_gap": 31.749107360839844,
        "singular_value_ratio": 7.084072113037109,
        "layerwise_effective_rank": 37.784915924072266,
        "layerwise_effective_rank_mergeability_score": -64.52510070800781,
        "task_vector_cosine_similarity": 1.0176177024841309,
        "task_vector_l2_distance": -90.34898376464844,
        "task_vector_dot_product": 34.772972106933594,
        "weight_space_angle": 141.03372192382812,
        "task_vector_magnitude_ratio": -61.783485412597656,
        "singular_value_overlap": 12.165574073791504,
        "subspace_overlap": 52.69221115112305,
        "activation_l2_distance": -34.97544479370117,
        "activation_cosine_similarity": -37.04852294921875,
        "activation_magnitude_ratio": -30.550222396850586,
        "activation_dot_product": 27.181385040283203,
        "encoder_gradient_cosine_similarity": 3.1655783653259277,
        "encoder_gradient_l2_distance": -97.08927917480469,
        "encoder_gradient_dot_product": 22.373109817504883,
        "input_gradient_cosine_similarity": 22.185083389282227,
        "input_gradient_l2_distance": -116.67314147949219,
        "input_gradient_dot_product": -150.16184997558594
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.446914634201417,
      "val_r": 0.7353392792222355,
      "n_iterations": 199,
      "coefficients": {
        "right_subspace_overlap_top_k": 27.169836044311523,
        "right_subspace_overlap_bottom_k": 21.991947174072266,
        "interaction_matrix_overlap_top_k": 10.790069580078125,
        "interaction_matrix_overlap_bottom_k": -2.2745347023010254,
        "effective_rank": 1.4490000009536743,
        "effective_rank_mergeability_score": -10.7056245803833,
        "stable_rank": 5.732394695281982,
        "spectral_gap": -5.5135345458984375,
        "singular_value_ratio": -25.305850982666016,
        "layerwise_effective_rank": 9.90080451965332,
        "layerwise_effective_rank_mergeability_score": 16.162059783935547,
        "task_vector_cosine_similarity": -14.223163604736328,
        "task_vector_l2_distance": -4.227090358734131,
        "task_vector_dot_product": -12.812206268310547,
        "weight_space_angle": 9.943382263183594,
        "task_vector_magnitude_ratio": -2.9693093299865723,
        "singular_value_overlap": -19.27069854736328,
        "subspace_overlap": 2.599567174911499,
        "activation_l2_distance": 4.222245216369629,
        "activation_cosine_similarity": 25.268373489379883,
        "activation_magnitude_ratio": -11.210371017456055,
        "activation_dot_product": -23.37200164794922,
        "encoder_gradient_cosine_similarity": -5.159829139709473,
        "encoder_gradient_l2_distance": -10.912201881408691,
        "encoder_gradient_dot_product": 7.408976078033447,
        "input_gradient_cosine_similarity": 8.93945598602295,
        "input_gradient_l2_distance": -17.662076950073242,
        "input_gradient_dot_product": 4.206780433654785
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.475337964609168,
      "val_r": -0.31664217523768745,
      "n_iterations": 63,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.670620083808899,
        "right_subspace_overlap_bottom_k": 2.0326013565063477,
        "interaction_matrix_overlap_top_k": 2.35461163520813,
        "interaction_matrix_overlap_bottom_k": 3.7096052169799805,
        "effective_rank": -1.6597907543182373,
        "effective_rank_mergeability_score": -0.587523341178894,
        "stable_rank": 0.19903528690338135,
        "spectral_gap": 1.5238769054412842,
        "singular_value_ratio": 0.16223081946372986,
        "layerwise_effective_rank": 0.30434730648994446,
        "layerwise_effective_rank_mergeability_score": 0.5232563614845276,
        "task_vector_cosine_similarity": -3.070352554321289,
        "task_vector_l2_distance": -1.4000353813171387,
        "task_vector_dot_product": -1.012270450592041,
        "weight_space_angle": 3.044018507003784,
        "task_vector_magnitude_ratio": -1.2232239246368408,
        "singular_value_overlap": -1.4703885316848755,
        "subspace_overlap": 0.8150912523269653,
        "activation_l2_distance": -0.6364809274673462,
        "activation_cosine_similarity": -0.1146124079823494,
        "activation_magnitude_ratio": 2.9734442234039307,
        "activation_dot_product": -1.640404462814331,
        "encoder_gradient_cosine_similarity": 1.780344009399414,
        "encoder_gradient_l2_distance": -4.497560501098633,
        "encoder_gradient_dot_product": 2.312180280685425,
        "input_gradient_cosine_similarity": -0.803293764591217,
        "input_gradient_l2_distance": -2.788841962814331,
        "input_gradient_dot_product": -2.7580199241638184
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.41862438292870385,
      "val_r": 0.3086077428331194,
      "n_iterations": 389,
      "coefficients": {
        "right_subspace_overlap_top_k": 32.34846496582031,
        "right_subspace_overlap_bottom_k": 28.220216751098633,
        "interaction_matrix_overlap_top_k": 39.80397033691406,
        "interaction_matrix_overlap_bottom_k": 32.54408645629883,
        "effective_rank": -37.2114372253418,
        "effective_rank_mergeability_score": -7.635678768157959,
        "stable_rank": 0.14234879612922668,
        "spectral_gap": 28.48039436340332,
        "singular_value_ratio": -12.061440467834473,
        "layerwise_effective_rank": 16.938316345214844,
        "layerwise_effective_rank_mergeability_score": 10.016899108886719,
        "task_vector_cosine_similarity": -20.681459426879883,
        "task_vector_l2_distance": -16.33747673034668,
        "task_vector_dot_product": -26.18390655517578,
        "weight_space_angle": 3.7797088623046875,
        "task_vector_magnitude_ratio": 21.90699005126953,
        "singular_value_overlap": -54.91872787475586,
        "subspace_overlap": 11.789475440979004,
        "activation_l2_distance": -16.820344924926758,
        "activation_cosine_similarity": -2.33248233795166,
        "activation_magnitude_ratio": -12.416810989379883,
        "activation_dot_product": -6.687127113342285,
        "encoder_gradient_cosine_similarity": 15.3282470703125,
        "encoder_gradient_l2_distance": -36.703125,
        "encoder_gradient_dot_product": -10.852928161621094,
        "input_gradient_cosine_similarity": 22.01072883605957,
        "input_gradient_l2_distance": -18.27933120727539,
        "input_gradient_dot_product": -10.442605972290039
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.31511428167930516,
      "val_r": 0.02623710291078407,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5367440581321716,
        "right_subspace_overlap_bottom_k": 1.0357601642608643,
        "interaction_matrix_overlap_top_k": 0.7288005352020264,
        "interaction_matrix_overlap_bottom_k": 0.16768646240234375,
        "effective_rank": -0.29072099924087524,
        "effective_rank_mergeability_score": 0.007074750028550625,
        "stable_rank": 0.153513565659523,
        "spectral_gap": 0.17059558629989624,
        "singular_value_ratio": -0.2248592972755432,
        "layerwise_effective_rank": -0.8655107021331787,
        "layerwise_effective_rank_mergeability_score": 0.44904786348342896,
        "task_vector_cosine_similarity": -0.03888753056526184,
        "task_vector_l2_distance": 0.23216284811496735,
        "task_vector_dot_product": -0.07583287358283997,
        "weight_space_angle": 0.04383578896522522,
        "task_vector_magnitude_ratio": 0.5008578896522522,
        "singular_value_overlap": -0.25459203124046326,
        "subspace_overlap": -0.11547360569238663,
        "activation_l2_distance": 0.028682347387075424,
        "activation_cosine_similarity": 0.583884596824646,
        "activation_magnitude_ratio": -0.33840975165367126,
        "activation_dot_product": -0.29839468002319336,
        "encoder_gradient_cosine_similarity": 0.052652306854724884,
        "encoder_gradient_l2_distance": -0.5729197263717651,
        "encoder_gradient_dot_product": -0.15226410329341888,
        "input_gradient_cosine_similarity": -0.06170515716075897,
        "input_gradient_l2_distance": 0.00947361346334219,
        "input_gradient_dot_product": -0.6672291159629822
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.47066351618701197,
      "val_r": 0.47679456350310073,
      "n_iterations": 91,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.3573169708251953,
        "right_subspace_overlap_bottom_k": 3.6444413661956787,
        "interaction_matrix_overlap_top_k": -0.04639289900660515,
        "interaction_matrix_overlap_bottom_k": 4.375239372253418,
        "effective_rank": 3.250248432159424,
        "effective_rank_mergeability_score": 2.6612799167633057,
        "stable_rank": -1.6548572778701782,
        "spectral_gap": 5.455957889556885,
        "singular_value_ratio": 4.487673282623291,
        "layerwise_effective_rank": -4.046914100646973,
        "layerwise_effective_rank_mergeability_score": -2.8947935104370117,
        "task_vector_cosine_similarity": 0.33289000391960144,
        "task_vector_l2_distance": -3.375398874282837,
        "task_vector_dot_product": -0.48413434624671936,
        "weight_space_angle": 1.3629794120788574,
        "task_vector_magnitude_ratio": -0.08214461803436279,
        "singular_value_overlap": -3.7904279232025146,
        "subspace_overlap": 3.1815412044525146,
        "activation_l2_distance": -4.182855129241943,
        "activation_cosine_similarity": 0.5930210947990417,
        "activation_magnitude_ratio": -3.4351868629455566,
        "activation_dot_product": -1.9546266794204712,
        "encoder_gradient_cosine_similarity": 0.37489044666290283,
        "encoder_gradient_l2_distance": -5.495361804962158,
        "encoder_gradient_dot_product": 3.0465688705444336,
        "input_gradient_cosine_similarity": 1.5263596773147583,
        "input_gradient_l2_distance": -4.60111665725708,
        "input_gradient_dot_product": -3.1897871494293213
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3680574684246627,
      "val_r": 0.3738029494297487,
      "n_iterations": 89,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.2444266974925995,
        "right_subspace_overlap_bottom_k": 8.999061584472656,
        "interaction_matrix_overlap_top_k": 5.971652984619141,
        "interaction_matrix_overlap_bottom_k": 13.360957145690918,
        "effective_rank": -4.880593299865723,
        "effective_rank_mergeability_score": 6.1640424728393555,
        "stable_rank": 3.4511139392852783,
        "spectral_gap": 5.835081100463867,
        "singular_value_ratio": -5.207688808441162,
        "layerwise_effective_rank": 1.7149475812911987,
        "layerwise_effective_rank_mergeability_score": -10.14582347869873,
        "task_vector_cosine_similarity": -2.1395397186279297,
        "task_vector_l2_distance": -4.379062652587891,
        "task_vector_dot_product": -9.96481990814209,
        "weight_space_angle": -6.550201892852783,
        "task_vector_magnitude_ratio": 1.07368803024292,
        "singular_value_overlap": -4.638617515563965,
        "subspace_overlap": 12.708918571472168,
        "activation_l2_distance": -6.224551200866699,
        "activation_cosine_similarity": -8.016310691833496,
        "activation_magnitude_ratio": 0.523012101650238,
        "activation_dot_product": 8.129748344421387,
        "encoder_gradient_cosine_similarity": -1.0050994157791138,
        "encoder_gradient_l2_distance": -7.3434014320373535,
        "encoder_gradient_dot_product": 6.434018135070801,
        "input_gradient_cosine_similarity": 3.1606357097625732,
        "input_gradient_l2_distance": 3.5085761547088623,
        "input_gradient_dot_product": -10.765765190124512
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.31078428006221126,
      "val_r": 0.28150699658736267,
      "n_iterations": 490,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.7065436840057373,
        "right_subspace_overlap_bottom_k": 111.15362548828125,
        "interaction_matrix_overlap_top_k": 6.174343585968018,
        "interaction_matrix_overlap_bottom_k": -7.112748146057129,
        "effective_rank": -66.2901382446289,
        "effective_rank_mergeability_score": 63.101871490478516,
        "stable_rank": -17.8309383392334,
        "spectral_gap": -5.940397262573242,
        "singular_value_ratio": -26.489065170288086,
        "layerwise_effective_rank": -68.21138000488281,
        "layerwise_effective_rank_mergeability_score": -28.413705825805664,
        "task_vector_cosine_similarity": 22.02308464050293,
        "task_vector_l2_distance": -42.59650421142578,
        "task_vector_dot_product": 83.72634887695312,
        "weight_space_angle": -31.34853744506836,
        "task_vector_magnitude_ratio": 69.50273895263672,
        "singular_value_overlap": -65.94632720947266,
        "subspace_overlap": 51.32252883911133,
        "activation_l2_distance": -67.06599426269531,
        "activation_cosine_similarity": -10.254756927490234,
        "activation_magnitude_ratio": 67.73368072509766,
        "activation_dot_product": -81.1796875,
        "encoder_gradient_cosine_similarity": 59.67745590209961,
        "encoder_gradient_l2_distance": -135.22366333007812,
        "encoder_gradient_dot_product": 15.941650390625,
        "input_gradient_cosine_similarity": 19.50103759765625,
        "input_gradient_l2_distance": -36.05988693237305,
        "input_gradient_dot_product": -29.054658889770508
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4133873273826443,
      "val_r": 0.32843154313606315,
      "n_iterations": 366,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.98601531982422,
        "right_subspace_overlap_bottom_k": 20.264677047729492,
        "interaction_matrix_overlap_top_k": -9.624666213989258,
        "interaction_matrix_overlap_bottom_k": 37.28425598144531,
        "effective_rank": -21.445640563964844,
        "effective_rank_mergeability_score": 1.87884521484375,
        "stable_rank": 13.30679988861084,
        "spectral_gap": 16.89051628112793,
        "singular_value_ratio": -2.4020748138427734,
        "layerwise_effective_rank": -18.70415687561035,
        "layerwise_effective_rank_mergeability_score": -26.80235481262207,
        "task_vector_cosine_similarity": 29.90149688720703,
        "task_vector_l2_distance": -15.867291450500488,
        "task_vector_dot_product": 12.577642440795898,
        "weight_space_angle": -16.641334533691406,
        "task_vector_magnitude_ratio": -16.814746856689453,
        "singular_value_overlap": -65.38208770751953,
        "subspace_overlap": 17.1201229095459,
        "activation_l2_distance": -12.580268859863281,
        "activation_cosine_similarity": 6.320003032684326,
        "activation_magnitude_ratio": -9.507762908935547,
        "activation_dot_product": -15.389847755432129,
        "encoder_gradient_cosine_similarity": 27.519166946411133,
        "encoder_gradient_l2_distance": -56.23189926147461,
        "encoder_gradient_dot_product": 30.96053695678711,
        "input_gradient_cosine_similarity": 45.305870056152344,
        "input_gradient_l2_distance": -24.637487411499023,
        "input_gradient_dot_product": -10.843921661376953
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3741063606209149,
      "val_r": 0.49846228305144724,
      "n_iterations": 463,
      "coefficients": {
        "right_subspace_overlap_top_k": 59.574771881103516,
        "right_subspace_overlap_bottom_k": 83.05310821533203,
        "interaction_matrix_overlap_top_k": 24.570032119750977,
        "interaction_matrix_overlap_bottom_k": 64.54927825927734,
        "effective_rank": -37.49557113647461,
        "effective_rank_mergeability_score": 18.102514266967773,
        "stable_rank": 67.14202117919922,
        "spectral_gap": -11.948724746704102,
        "singular_value_ratio": 11.07020092010498,
        "layerwise_effective_rank": 17.685630798339844,
        "layerwise_effective_rank_mergeability_score": 67.72022247314453,
        "task_vector_cosine_similarity": 1.9424546957015991,
        "task_vector_l2_distance": -7.756789684295654,
        "task_vector_dot_product": -22.212902069091797,
        "weight_space_angle": -3.686506748199463,
        "task_vector_magnitude_ratio": -55.58607482910156,
        "singular_value_overlap": -29.026737213134766,
        "subspace_overlap": 8.775182723999023,
        "activation_l2_distance": -22.779142379760742,
        "activation_cosine_similarity": 52.45461654663086,
        "activation_magnitude_ratio": -69.3916244506836,
        "activation_dot_product": -72.88904571533203,
        "encoder_gradient_cosine_similarity": 7.198190212249756,
        "encoder_gradient_l2_distance": -83.98847961425781,
        "encoder_gradient_dot_product": 15.2311372756958,
        "input_gradient_cosine_similarity": 8.133423805236816,
        "input_gradient_l2_distance": -14.8727445602417,
        "input_gradient_dot_product": -90.13723754882812
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.44484662177117207,
      "val_r": 0.5172987645701549,
      "n_iterations": 793,
      "coefficients": {
        "right_subspace_overlap_top_k": 80.07698059082031,
        "right_subspace_overlap_bottom_k": 57.445884704589844,
        "interaction_matrix_overlap_top_k": 43.04856491088867,
        "interaction_matrix_overlap_bottom_k": 55.102901458740234,
        "effective_rank": 27.271175384521484,
        "effective_rank_mergeability_score": 5.854565620422363,
        "stable_rank": 16.76607894897461,
        "spectral_gap": 57.128353118896484,
        "singular_value_ratio": 63.32685089111328,
        "layerwise_effective_rank": -62.06245422363281,
        "layerwise_effective_rank_mergeability_score": 4.479236602783203,
        "task_vector_cosine_similarity": 43.48715591430664,
        "task_vector_l2_distance": -77.41590881347656,
        "task_vector_dot_product": -90.38200378417969,
        "weight_space_angle": 46.63685607910156,
        "task_vector_magnitude_ratio": -47.14866256713867,
        "singular_value_overlap": -104.90254211425781,
        "subspace_overlap": -26.716930389404297,
        "activation_l2_distance": 13.734524726867676,
        "activation_cosine_similarity": -2.104670763015747,
        "activation_magnitude_ratio": -42.90939712524414,
        "activation_dot_product": 49.683998107910156,
        "encoder_gradient_cosine_similarity": -45.47803497314453,
        "encoder_gradient_l2_distance": -26.53992462158203,
        "encoder_gradient_dot_product": -2.498744010925293,
        "input_gradient_cosine_similarity": 50.24728775024414,
        "input_gradient_l2_distance": -100.55408477783203,
        "input_gradient_dot_product": -70.80619049072266
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.3581921293431115,
      "val_r": 0.4305359185023685,
      "n_iterations": 255,
      "coefficients": {
        "right_subspace_overlap_top_k": 110.54637908935547,
        "right_subspace_overlap_bottom_k": 74.82742309570312,
        "interaction_matrix_overlap_top_k": -50.46525192260742,
        "interaction_matrix_overlap_bottom_k": 111.02033996582031,
        "effective_rank": 40.21890640258789,
        "effective_rank_mergeability_score": -58.9904670715332,
        "stable_rank": -63.202484130859375,
        "spectral_gap": 38.800323486328125,
        "singular_value_ratio": 19.18412208557129,
        "layerwise_effective_rank": -50.04880142211914,
        "layerwise_effective_rank_mergeability_score": 9.930131912231445,
        "task_vector_cosine_similarity": -50.473575592041016,
        "task_vector_l2_distance": -46.77613067626953,
        "task_vector_dot_product": 21.000089645385742,
        "weight_space_angle": -16.70090103149414,
        "task_vector_magnitude_ratio": -65.93567657470703,
        "singular_value_overlap": -79.13397979736328,
        "subspace_overlap": 39.3466796875,
        "activation_l2_distance": -0.3394326865673065,
        "activation_cosine_similarity": -57.032527923583984,
        "activation_magnitude_ratio": -36.24209213256836,
        "activation_dot_product": 47.382843017578125,
        "encoder_gradient_cosine_similarity": 41.0145263671875,
        "encoder_gradient_l2_distance": -18.11486053466797,
        "encoder_gradient_dot_product": -4.54426908493042,
        "input_gradient_cosine_similarity": -49.0396614074707,
        "input_gradient_l2_distance": -85.26300811767578,
        "input_gradient_dot_product": 58.62223815917969
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.43204919670713854,
      "val_r": 0.3294415332046711,
      "n_iterations": 78,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.241830348968506,
        "right_subspace_overlap_bottom_k": 2.2649483680725098,
        "interaction_matrix_overlap_top_k": 1.8407766819000244,
        "interaction_matrix_overlap_bottom_k": 4.909120559692383,
        "effective_rank": -2.193099021911621,
        "effective_rank_mergeability_score": 3.3769540786743164,
        "stable_rank": -0.19718648493289948,
        "spectral_gap": -0.6809945106506348,
        "singular_value_ratio": -1.1283044815063477,
        "layerwise_effective_rank": 1.876295804977417,
        "layerwise_effective_rank_mergeability_score": -1.597355604171753,
        "task_vector_cosine_similarity": 0.7057971954345703,
        "task_vector_l2_distance": -1.3772356510162354,
        "task_vector_dot_product": -3.4260785579681396,
        "weight_space_angle": -1.4223227500915527,
        "task_vector_magnitude_ratio": -0.559799313545227,
        "singular_value_overlap": -5.463666915893555,
        "subspace_overlap": 2.55788516998291,
        "activation_l2_distance": -0.5033103227615356,
        "activation_cosine_similarity": 0.8382166624069214,
        "activation_magnitude_ratio": 0.7286978363990784,
        "activation_dot_product": -2.4386703968048096,
        "encoder_gradient_cosine_similarity": 2.2391555309295654,
        "encoder_gradient_l2_distance": -4.1449785232543945,
        "encoder_gradient_dot_product": 3.243882894515991,
        "input_gradient_cosine_similarity": 3.471055269241333,
        "input_gradient_l2_distance": -2.805438995361328,
        "input_gradient_dot_product": -6.020548343658447
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.39433002309902476,
      "val_r": 0.0012089420707072918,
      "n_iterations": 79,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.991716384887695,
        "right_subspace_overlap_bottom_k": 1.9651457071304321,
        "interaction_matrix_overlap_top_k": 0.6528354287147522,
        "interaction_matrix_overlap_bottom_k": 5.0040998458862305,
        "effective_rank": -1.6833391189575195,
        "effective_rank_mergeability_score": -6.484701156616211,
        "stable_rank": -1.4181314706802368,
        "spectral_gap": 1.3909636735916138,
        "singular_value_ratio": -1.0672553777694702,
        "layerwise_effective_rank": -0.8608725666999817,
        "layerwise_effective_rank_mergeability_score": 0.8453317880630493,
        "task_vector_cosine_similarity": 0.5243594646453857,
        "task_vector_l2_distance": 0.6667750477790833,
        "task_vector_dot_product": 0.9488909244537354,
        "weight_space_angle": 2.4844870567321777,
        "task_vector_magnitude_ratio": -4.5957350730896,
        "singular_value_overlap": 1.5600160360336304,
        "subspace_overlap": 0.010057645849883556,
        "activation_l2_distance": -2.175403594970703,
        "activation_cosine_similarity": 1.0765893459320068,
        "activation_magnitude_ratio": 2.778810739517212,
        "activation_dot_product": -4.484579086303711,
        "encoder_gradient_cosine_similarity": 1.183383584022522,
        "encoder_gradient_l2_distance": -0.2818759083747864,
        "encoder_gradient_dot_product": 4.703922748565674,
        "input_gradient_cosine_similarity": 0.5188119411468506,
        "input_gradient_l2_distance": -6.798567771911621,
        "input_gradient_dot_product": -2.6597464084625244
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7532855053393703,
      "val_r": 0.5573228185912737,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.482881546020508,
        "right_subspace_overlap_bottom_k": -6.561868190765381,
        "interaction_matrix_overlap_top_k": 1.8697409629821777,
        "interaction_matrix_overlap_bottom_k": 8.131450653076172,
        "effective_rank": 3.7944977283477783,
        "effective_rank_mergeability_score": -1.5814956426620483,
        "stable_rank": 1.4578105211257935,
        "spectral_gap": 4.344490051269531,
        "singular_value_ratio": 7.436164379119873,
        "layerwise_effective_rank": -6.992055892944336,
        "layerwise_effective_rank_mergeability_score": 6.01114559173584,
        "task_vector_cosine_similarity": -7.82566499710083,
        "task_vector_l2_distance": -0.20825593173503876,
        "task_vector_dot_product": -4.076115131378174,
        "weight_space_angle": -1.1002306938171387,
        "task_vector_magnitude_ratio": -1.3975752592086792,
        "singular_value_overlap": -3.1989753246307373,
        "subspace_overlap": 0.1809847354888916,
        "activation_l2_distance": 3.0582075119018555,
        "activation_cosine_similarity": 4.71613073348999,
        "activation_magnitude_ratio": -1.3559396266937256,
        "activation_dot_product": 2.390690565109253,
        "encoder_gradient_cosine_similarity": 1.7033785581588745,
        "encoder_gradient_l2_distance": -7.2049031257629395,
        "encoder_gradient_dot_product": 0.09984379261732101,
        "input_gradient_cosine_similarity": 0.0778050571680069,
        "input_gradient_l2_distance": -9.001416206359863,
        "input_gradient_dot_product": -4.111715316772461
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4782144079138561,
      "val_r": 0.08458584375967448,
      "n_iterations": 404,
      "coefficients": {
        "right_subspace_overlap_top_k": 15.77916431427002,
        "right_subspace_overlap_bottom_k": 105.46296691894531,
        "interaction_matrix_overlap_top_k": 25.15024757385254,
        "interaction_matrix_overlap_bottom_k": 57.15338897705078,
        "effective_rank": 7.097146034240723,
        "effective_rank_mergeability_score": -27.700519561767578,
        "stable_rank": 26.950403213500977,
        "spectral_gap": -56.780521392822266,
        "singular_value_ratio": -89.6390380859375,
        "layerwise_effective_rank": 19.455446243286133,
        "layerwise_effective_rank_mergeability_score": 78.10926818847656,
        "task_vector_cosine_similarity": -28.50730323791504,
        "task_vector_l2_distance": -26.503978729248047,
        "task_vector_dot_product": -70.98287963867188,
        "weight_space_angle": 8.20205020904541,
        "task_vector_magnitude_ratio": -44.09503173828125,
        "singular_value_overlap": -81.63914489746094,
        "subspace_overlap": 29.352853775024414,
        "activation_l2_distance": 44.85163116455078,
        "activation_cosine_similarity": 18.940959930419922,
        "activation_magnitude_ratio": 12.039588928222656,
        "activation_dot_product": 48.63665771484375,
        "encoder_gradient_cosine_similarity": 8.344532012939453,
        "encoder_gradient_l2_distance": -41.2470817565918,
        "encoder_gradient_dot_product": 13.26048469543457,
        "input_gradient_cosine_similarity": 83.91641235351562,
        "input_gradient_l2_distance": -116.36357879638672,
        "input_gradient_dot_product": -51.95990753173828
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}