{
  "aggregate_metrics": {
    "train_r": 0.09183687909939028,
    "train_p": 1.7707644466284906e-07,
    "val_r": 0.08687895988437096,
    "val_p": 0.10075950327351509
  },
  "per_fold_stats": {
    "train_r_mean": 0.6559518826312077,
    "train_r_std": 0.09486562821975214,
    "val_r_mean": 0.5549913283389103,
    "val_r_std": 0.20292178956865428
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 51.5689811706543,
    "right_subspace_overlap_bottom_k": -25.292430877685547,
    "interaction_matrix_overlap_top_k": 28.448654174804688,
    "interaction_matrix_overlap_bottom_k": 1.526309609413147,
    "effective_rank": 3.617974042892456,
    "effective_rank_mergeability_score": 14.779199600219727,
    "stable_rank": 11.42481803894043,
    "spectral_gap": 8.259401321411133,
    "singular_value_ratio": 4.448522090911865,
    "layerwise_effective_rank": -1.7128515243530273,
    "layerwise_effective_rank_mergeability_score": 0.9680374264717102,
    "task_vector_cosine_similarity": 15.453977584838867,
    "task_vector_l2_distance": -13.318827629089355,
    "task_vector_dot_product": -12.888193130493164,
    "weight_space_angle": -10.974605560302734,
    "task_vector_magnitude_ratio": -1.4384143352508545,
    "singular_value_overlap": 15.125033378601074,
    "subspace_overlap": -1.983797311782837,
    "right_subspace_overlap": -22.004032135009766,
    "encoder_gradient_cosine_similarity": 19.64982032775879,
    "encoder_gradient_l2_distance": -48.181304931640625,
    "encoder_gradient_dot_product": 23.760602951049805,
    "input_gradient_cosine_similarity": -9.984248161315918,
    "input_gradient_l2_distance": -21.130084991455078,
    "input_gradient_dot_product": -29.124820709228516
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 149.35882568359375,
    "right_subspace_overlap_bottom_k": 48.58954620361328,
    "interaction_matrix_overlap_top_k": 51.27946853637695,
    "interaction_matrix_overlap_bottom_k": 56.646053314208984,
    "effective_rank": 41.28589630126953,
    "effective_rank_mergeability_score": 65.41566467285156,
    "stable_rank": 106.93952941894531,
    "spectral_gap": 35.45848083496094,
    "singular_value_ratio": 13.960068702697754,
    "layerwise_effective_rank": 14.932609558105469,
    "layerwise_effective_rank_mergeability_score": 20.2020320892334,
    "task_vector_cosine_similarity": 27.948463439941406,
    "task_vector_l2_distance": 28.282773971557617,
    "task_vector_dot_product": 83.67048645019531,
    "weight_space_angle": 31.82280158996582,
    "task_vector_magnitude_ratio": 63.98155975341797,
    "singular_value_overlap": 41.52299880981445,
    "subspace_overlap": 22.75664710998535,
    "right_subspace_overlap": 132.89434814453125,
    "encoder_gradient_cosine_similarity": 30.638072967529297,
    "encoder_gradient_l2_distance": 87.0252456665039,
    "encoder_gradient_dot_product": 70.86094665527344,
    "input_gradient_cosine_similarity": 70.91796112060547,
    "input_gradient_l2_distance": 37.16252899169922,
    "input_gradient_dot_product": 65.93130493164062
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6713895295890558,
      "val_r": 0.6411714169399075,
      "n_iterations": 898,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.987531661987305,
        "right_subspace_overlap_bottom_k": -10.768632888793945,
        "interaction_matrix_overlap_top_k": -4.137286186218262,
        "interaction_matrix_overlap_bottom_k": -15.254526138305664,
        "effective_rank": 8.828700065612793,
        "effective_rank_mergeability_score": -0.7753280401229858,
        "stable_rank": 2.7487311363220215,
        "spectral_gap": 5.471801280975342,
        "singular_value_ratio": 9.319009780883789,
        "layerwise_effective_rank": -15.011987686157227,
        "layerwise_effective_rank_mergeability_score": 0.4198601543903351,
        "task_vector_cosine_similarity": -8.01361083984375,
        "task_vector_l2_distance": -10.792259216308594,
        "task_vector_dot_product": 5.449970245361328,
        "weight_space_angle": 11.540079116821289,
        "task_vector_magnitude_ratio": -4.324131965637207,
        "singular_value_overlap": 4.004635810852051,
        "subspace_overlap": -6.34647798538208,
        "right_subspace_overlap": 27.868314743041992,
        "encoder_gradient_cosine_similarity": 8.436690330505371,
        "encoder_gradient_l2_distance": -22.036836624145508,
        "encoder_gradient_dot_product": 4.841688632965088,
        "input_gradient_cosine_similarity": 1.7643086910247803,
        "input_gradient_l2_distance": -21.894670486450195,
        "input_gradient_dot_product": 3.672814130783081
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.40840195954447384,
      "val_r": 0.3112053358877407,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.2157631367444992,
        "right_subspace_overlap_bottom_k": -0.26164913177490234,
        "interaction_matrix_overlap_top_k": 0.5257810354232788,
        "interaction_matrix_overlap_bottom_k": -0.3869801461696625,
        "effective_rank": -0.08332329988479614,
        "effective_rank_mergeability_score": 0.05449063330888748,
        "stable_rank": 0.2452387511730194,
        "spectral_gap": -0.12522803246974945,
        "singular_value_ratio": 0.4041294753551483,
        "layerwise_effective_rank": 0.18241079151630402,
        "layerwise_effective_rank_mergeability_score": -0.09107858687639236,
        "task_vector_cosine_similarity": 0.23678362369537354,
        "task_vector_l2_distance": -0.495013564825058,
        "task_vector_dot_product": -0.031042352318763733,
        "weight_space_angle": -0.2893947660923004,
        "task_vector_magnitude_ratio": -0.10632747411727905,
        "singular_value_overlap": 0.5669344067573547,
        "subspace_overlap": 0.8257344365119934,
        "right_subspace_overlap": -0.25742340087890625,
        "encoder_gradient_cosine_similarity": 0.691683828830719,
        "encoder_gradient_l2_distance": -0.6961145401000977,
        "encoder_gradient_dot_product": 0.6441774368286133,
        "input_gradient_cosine_similarity": -0.615055501461029,
        "input_gradient_l2_distance": -0.007442818954586983,
        "input_gradient_dot_product": -0.1672428995370865
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4917220117875425,
      "val_r": 0.06885550615486268,
      "n_iterations": 640,
      "coefficients": {
        "right_subspace_overlap_top_k": 91.47201538085938,
        "right_subspace_overlap_bottom_k": -9.005743026733398,
        "interaction_matrix_overlap_top_k": 85.50789642333984,
        "interaction_matrix_overlap_bottom_k": 31.047595977783203,
        "effective_rank": -76.40718841552734,
        "effective_rank_mergeability_score": 18.86224937438965,
        "stable_rank": -135.6186981201172,
        "spectral_gap": 12.425161361694336,
        "singular_value_ratio": 49.886962890625,
        "layerwise_effective_rank": 8.770288467407227,
        "layerwise_effective_rank_mergeability_score": 11.708568572998047,
        "task_vector_cosine_similarity": 103.55833435058594,
        "task_vector_l2_distance": -120.5285415649414,
        "task_vector_dot_product": 69.55159759521484,
        "weight_space_angle": -92.958251953125,
        "task_vector_magnitude_ratio": 136.23426818847656,
        "singular_value_overlap": -17.427114486694336,
        "subspace_overlap": -7.937014102935791,
        "right_subspace_overlap": 24.93612289428711,
        "encoder_gradient_cosine_similarity": 29.28325843811035,
        "encoder_gradient_l2_distance": -224.88682556152344,
        "encoder_gradient_dot_product": 19.926570892333984,
        "input_gradient_cosine_similarity": 75.43815612792969,
        "input_gradient_l2_distance": 38.19495391845703,
        "input_gradient_dot_product": -121.0369873046875
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6839838609547755,
      "val_r": 0.49691612364717724,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 15.316924095153809,
        "right_subspace_overlap_bottom_k": -18.363773345947266,
        "interaction_matrix_overlap_top_k": 6.584619998931885,
        "interaction_matrix_overlap_bottom_k": -10.445343971252441,
        "effective_rank": -4.156853675842285,
        "effective_rank_mergeability_score": 2.8757269382476807,
        "stable_rank": 1.3290164470672607,
        "spectral_gap": 0.1076880544424057,
        "singular_value_ratio": 10.164698600769043,
        "layerwise_effective_rank": 0.5778095722198486,
        "layerwise_effective_rank_mergeability_score": 5.378847122192383,
        "task_vector_cosine_similarity": 0.3277626633644104,
        "task_vector_l2_distance": -5.2163801193237305,
        "task_vector_dot_product": 1.7293503284454346,
        "weight_space_angle": -1.0814930200576782,
        "task_vector_magnitude_ratio": -3.432966947555542,
        "singular_value_overlap": 6.633322715759277,
        "subspace_overlap": 1.333268642425537,
        "right_subspace_overlap": 15.284071922302246,
        "encoder_gradient_cosine_similarity": 12.889690399169922,
        "encoder_gradient_l2_distance": -17.015094757080078,
        "encoder_gradient_dot_product": 9.267631530761719,
        "input_gradient_cosine_similarity": -0.38462403416633606,
        "input_gradient_l2_distance": -16.35335922241211,
        "input_gradient_dot_product": -12.352011680603027
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6730258501588,
      "val_r": 0.6204394954977722,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.203489780426025,
        "right_subspace_overlap_bottom_k": -6.679756164550781,
        "interaction_matrix_overlap_top_k": 14.289693832397461,
        "interaction_matrix_overlap_bottom_k": -8.781682968139648,
        "effective_rank": 0.5743672847747803,
        "effective_rank_mergeability_score": 3.477797746658325,
        "stable_rank": -4.16275691986084,
        "spectral_gap": 0.24898996949195862,
        "singular_value_ratio": -2.6147100925445557,
        "layerwise_effective_rank": 2.686128616333008,
        "layerwise_effective_rank_mergeability_score": -1.4691781997680664,
        "task_vector_cosine_similarity": 3.403850555419922,
        "task_vector_l2_distance": -8.205828666687012,
        "task_vector_dot_product": 5.267849922180176,
        "weight_space_angle": 2.983766794204712,
        "task_vector_magnitude_ratio": 4.494879245758057,
        "singular_value_overlap": 3.013500213623047,
        "subspace_overlap": -0.2238200604915619,
        "right_subspace_overlap": 5.409512996673584,
        "encoder_gradient_cosine_similarity": 7.952455520629883,
        "encoder_gradient_l2_distance": -13.055950164794922,
        "encoder_gradient_dot_product": 4.547661304473877,
        "input_gradient_cosine_similarity": 4.565752983093262,
        "input_gradient_l2_distance": -12.084242820739746,
        "input_gradient_dot_product": -8.842947959899902
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6205765310905934,
      "val_r": 0.6098770892003107,
      "n_iterations": 961,
      "coefficients": {
        "right_subspace_overlap_top_k": 29.817859649658203,
        "right_subspace_overlap_bottom_k": -76.00479888916016,
        "interaction_matrix_overlap_top_k": 73.14344787597656,
        "interaction_matrix_overlap_bottom_k": -57.798118591308594,
        "effective_rank": 11.836891174316406,
        "effective_rank_mergeability_score": 5.175981044769287,
        "stable_rank": -27.425554275512695,
        "spectral_gap": -66.69442749023438,
        "singular_value_ratio": -4.98028564453125,
        "layerwise_effective_rank": -9.00650691986084,
        "layerwise_effective_rank_mergeability_score": 15.944249153137207,
        "task_vector_cosine_similarity": 10.292780876159668,
        "task_vector_l2_distance": -20.076751708984375,
        "task_vector_dot_product": 22.796783447265625,
        "weight_space_angle": 1.9438261985778809,
        "task_vector_magnitude_ratio": -28.084514617919922,
        "singular_value_overlap": 16.032323837280273,
        "subspace_overlap": 23.110462188720703,
        "right_subspace_overlap": 61.59674072265625,
        "encoder_gradient_cosine_similarity": 47.044647216796875,
        "encoder_gradient_l2_distance": -41.06892395019531,
        "encoder_gradient_dot_product": 31.504566192626953,
        "input_gradient_cosine_similarity": 25.59151840209961,
        "input_gradient_l2_distance": -0.790868878364563,
        "input_gradient_dot_product": -42.90296936035156
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7083184250494758,
      "val_r": 0.6630981285218713,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.248870849609375,
        "right_subspace_overlap_bottom_k": -2.2991514205932617,
        "interaction_matrix_overlap_top_k": -1.1342581510543823,
        "interaction_matrix_overlap_bottom_k": -2.3656821250915527,
        "effective_rank": 1.485943078994751,
        "effective_rank_mergeability_score": 2.7504167556762695,
        "stable_rank": -1.2075531482696533,
        "spectral_gap": 0.46212413907051086,
        "singular_value_ratio": 1.5115944147109985,
        "layerwise_effective_rank": 1.1392478942871094,
        "layerwise_effective_rank_mergeability_score": -0.6845572590827942,
        "task_vector_cosine_similarity": 2.600172281265259,
        "task_vector_l2_distance": -2.4164278507232666,
        "task_vector_dot_product": 1.3913229703903198,
        "weight_space_angle": 2.471693754196167,
        "task_vector_magnitude_ratio": -1.115517020225525,
        "singular_value_overlap": 1.543838381767273,
        "subspace_overlap": -2.3552722930908203,
        "right_subspace_overlap": 3.5238757133483887,
        "encoder_gradient_cosine_similarity": 1.7897549867630005,
        "encoder_gradient_l2_distance": -5.608683109283447,
        "encoder_gradient_dot_product": 1.6288381814956665,
        "input_gradient_cosine_similarity": -0.4398190379142761,
        "input_gradient_l2_distance": -3.0475738048553467,
        "input_gradient_dot_product": -1.8741015195846558
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7028853215326419,
      "val_r": 0.2474128870111539,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 16.554393768310547,
        "right_subspace_overlap_bottom_k": -11.639678001403809,
        "interaction_matrix_overlap_top_k": 2.8885929584503174,
        "interaction_matrix_overlap_bottom_k": -4.381120681762695,
        "effective_rank": -7.289849281311035,
        "effective_rank_mergeability_score": -8.874456405639648,
        "stable_rank": 1.7440423965454102,
        "spectral_gap": 8.170393943786621,
        "singular_value_ratio": 7.691953182220459,
        "layerwise_effective_rank": -1.143625020980835,
        "layerwise_effective_rank_mergeability_score": 5.378459453582764,
        "task_vector_cosine_similarity": -6.128944396972656,
        "task_vector_l2_distance": -6.185261249542236,
        "task_vector_dot_product": -1.6460403203964233,
        "weight_space_angle": 2.9042391777038574,
        "task_vector_magnitude_ratio": 1.29140043258667,
        "singular_value_overlap": 3.5018324851989746,
        "subspace_overlap": -4.732745170593262,
        "right_subspace_overlap": 12.120718955993652,
        "encoder_gradient_cosine_similarity": 6.808775424957275,
        "encoder_gradient_l2_distance": -13.633010864257812,
        "encoder_gradient_dot_product": 4.100926399230957,
        "input_gradient_cosine_similarity": 1.842816710472107,
        "input_gradient_l2_distance": -7.873898506164551,
        "input_gradient_dot_product": -0.4712892472743988
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7286952915999447,
      "val_r": 0.11378227167799115,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 11.640851020812988,
        "right_subspace_overlap_bottom_k": -6.225329399108887,
        "interaction_matrix_overlap_top_k": 6.273797035217285,
        "interaction_matrix_overlap_bottom_k": -8.089875221252441,
        "effective_rank": 0.1704530566930771,
        "effective_rank_mergeability_score": 2.3843555450439453,
        "stable_rank": -4.972339630126953,
        "spectral_gap": -0.11800853163003922,
        "singular_value_ratio": 0.2893342673778534,
        "layerwise_effective_rank": 2.4228055477142334,
        "layerwise_effective_rank_mergeability_score": 2.143836498260498,
        "task_vector_cosine_similarity": 1.617051362991333,
        "task_vector_l2_distance": -3.2527880668640137,
        "task_vector_dot_product": -0.7871229648590088,
        "weight_space_angle": 3.8652262687683105,
        "task_vector_magnitude_ratio": 3.3777084350585938,
        "singular_value_overlap": 3.614614486694336,
        "subspace_overlap": -3.1981124877929688,
        "right_subspace_overlap": 5.854832649230957,
        "encoder_gradient_cosine_similarity": 5.635009288787842,
        "encoder_gradient_l2_distance": -9.903761863708496,
        "encoder_gradient_dot_product": 3.932363271713257,
        "input_gradient_cosine_similarity": 1.4484516382217407,
        "input_gradient_l2_distance": -11.312485694885254,
        "input_gradient_dot_product": -5.812064170837402
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7652517786066674,
      "val_r": 0.6212663758307135,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.1443259716033936,
        "right_subspace_overlap_bottom_k": -3.2831616401672363,
        "interaction_matrix_overlap_top_k": 2.172849416732788,
        "interaction_matrix_overlap_bottom_k": -2.9141287803649902,
        "effective_rank": 0.335595041513443,
        "effective_rank_mergeability_score": 1.4914823770523071,
        "stable_rank": 2.165891170501709,
        "spectral_gap": -0.6274007558822632,
        "singular_value_ratio": 0.7840216159820557,
        "layerwise_effective_rank": -1.248640537261963,
        "layerwise_effective_rank_mergeability_score": 1.9842818975448608,
        "task_vector_cosine_similarity": -1.514050841331482,
        "task_vector_l2_distance": -0.7337700128555298,
        "task_vector_dot_product": 0.1803540140390396,
        "weight_space_angle": 2.6315064430236816,
        "task_vector_magnitude_ratio": -0.8674633502960205,
        "singular_value_overlap": 1.5708211660385132,
        "subspace_overlap": -1.1962069272994995,
        "right_subspace_overlap": 4.973667144775391,
        "encoder_gradient_cosine_similarity": 1.8119951486587524,
        "encoder_gradient_l2_distance": -5.331720352172852,
        "encoder_gradient_dot_product": 0.5542052388191223,
        "input_gradient_cosine_similarity": 0.6404616236686707,
        "input_gradient_l2_distance": -3.9259800910949707,
        "input_gradient_dot_product": -1.7997509241104126
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6914540291212882,
      "val_r": 0.5220326020258137,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.066890716552734,
        "right_subspace_overlap_bottom_k": -17.84808921813965,
        "interaction_matrix_overlap_top_k": -0.2536482810974121,
        "interaction_matrix_overlap_bottom_k": -4.44429349899292,
        "effective_rank": 4.293068885803223,
        "effective_rank_mergeability_score": 0.5732207298278809,
        "stable_rank": -18.580720901489258,
        "spectral_gap": 2.2324798107147217,
        "singular_value_ratio": 13.525026321411133,
        "layerwise_effective_rank": 12.930670738220215,
        "layerwise_effective_rank_mergeability_score": 2.307906150817871,
        "task_vector_cosine_similarity": -2.9083497524261475,
        "task_vector_l2_distance": -3.297652244567871,
        "task_vector_dot_product": 0.2885938286781311,
        "weight_space_angle": -0.13104557991027832,
        "task_vector_magnitude_ratio": -6.259285926818848,
        "singular_value_overlap": 11.066344261169434,
        "subspace_overlap": -5.997982025146484,
        "right_subspace_overlap": 10.181987762451172,
        "encoder_gradient_cosine_similarity": 5.0114922523498535,
        "encoder_gradient_l2_distance": -10.736136436462402,
        "encoder_gradient_dot_product": 5.45650053024292,
        "input_gradient_cosine_similarity": -0.8989829421043396,
        "input_gradient_l2_distance": -14.42650032043457,
        "input_gradient_dot_product": -3.152975559234619
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6716802805724804,
      "val_r": 0.7322567644791279,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.125964164733887,
        "right_subspace_overlap_bottom_k": -14.381304740905762,
        "interaction_matrix_overlap_top_k": 29.169424057006836,
        "interaction_matrix_overlap_bottom_k": -14.648035049438477,
        "effective_rank": -10.59085750579834,
        "effective_rank_mergeability_score": 9.729841232299805,
        "stable_rank": 8.808917045593262,
        "spectral_gap": -8.399788856506348,
        "singular_value_ratio": -1.2188982963562012,
        "layerwise_effective_rank": 2.2115108966827393,
        "layerwise_effective_rank_mergeability_score": -6.257704257965088,
        "task_vector_cosine_similarity": 3.54317307472229,
        "task_vector_l2_distance": -3.7591516971588135,
        "task_vector_dot_product": -2.7322051525115967,
        "weight_space_angle": 5.94979190826416,
        "task_vector_magnitude_ratio": -4.2862868309021,
        "singular_value_overlap": 9.336313247680664,
        "subspace_overlap": 4.716660976409912,
        "right_subspace_overlap": 1.8311452865600586,
        "encoder_gradient_cosine_similarity": 9.482322692871094,
        "encoder_gradient_l2_distance": -8.748127937316895,
        "encoder_gradient_dot_product": 15.159830093383789,
        "input_gradient_cosine_similarity": 2.5328152179718018,
        "input_gradient_l2_distance": -23.470218658447266,
        "input_gradient_dot_product": -12.106602668762207
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.672193007730066,
      "val_r": 0.5198263269548453,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.659052848815918,
        "right_subspace_overlap_bottom_k": -5.9499993324279785,
        "interaction_matrix_overlap_top_k": 7.741866588592529,
        "interaction_matrix_overlap_bottom_k": -14.829258918762207,
        "effective_rank": 7.519309043884277,
        "effective_rank_mergeability_score": 3.2763209342956543,
        "stable_rank": -4.304373741149902,
        "spectral_gap": -6.095963478088379,
        "singular_value_ratio": 5.977419376373291,
        "layerwise_effective_rank": 9.211402893066406,
        "layerwise_effective_rank_mergeability_score": 7.870409965515137,
        "task_vector_cosine_similarity": 18.181852340698242,
        "task_vector_l2_distance": -4.83858060836792,
        "task_vector_dot_product": 14.558985710144043,
        "weight_space_angle": -6.675022602081299,
        "task_vector_magnitude_ratio": -12.362349510192871,
        "singular_value_overlap": 6.29454231262207,
        "subspace_overlap": -10.349059104919434,
        "right_subspace_overlap": 3.428696393966675,
        "encoder_gradient_cosine_similarity": 7.724040508270264,
        "encoder_gradient_l2_distance": -15.026634216308594,
        "encoder_gradient_dot_product": 7.856668472290039,
        "input_gradient_cosine_similarity": 1.5208473205566406,
        "input_gradient_l2_distance": -11.299993515014648,
        "input_gradient_dot_product": -13.091501235961914
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7469184745781702,
      "val_r": 0.7520826177404584,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.6005076169967651,
        "right_subspace_overlap_bottom_k": -2.2851033210754395,
        "interaction_matrix_overlap_top_k": -0.6523812413215637,
        "interaction_matrix_overlap_bottom_k": 1.3345853090286255,
        "effective_rank": 0.7807243466377258,
        "effective_rank_mergeability_score": 0.31188610196113586,
        "stable_rank": -0.07267917692661285,
        "spectral_gap": 0.5945030450820923,
        "singular_value_ratio": 0.8300018906593323,
        "layerwise_effective_rank": -0.06341345608234406,
        "layerwise_effective_rank_mergeability_score": 0.4374631345272064,
        "task_vector_cosine_similarity": 0.6661624312400818,
        "task_vector_l2_distance": -0.39486104249954224,
        "task_vector_dot_product": 0.31096604466438293,
        "weight_space_angle": 0.38616907596588135,
        "task_vector_magnitude_ratio": -0.3524128496646881,
        "singular_value_overlap": -0.0011264709755778313,
        "subspace_overlap": -2.6268365383148193,
        "right_subspace_overlap": 2.3135147094726562,
        "encoder_gradient_cosine_similarity": 0.3381931781768799,
        "encoder_gradient_l2_distance": -1.4045214653015137,
        "encoder_gradient_dot_product": 0.2952536642551422,
        "input_gradient_cosine_similarity": 0.145969957113266,
        "input_gradient_l2_distance": -0.8924943804740906,
        "input_gradient_dot_product": -0.5997004508972168
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.629258301481251,
      "val_r": 0.7364163630560443,
      "n_iterations": 618,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.959654808044434,
        "right_subspace_overlap_bottom_k": -24.414012908935547,
        "interaction_matrix_overlap_top_k": 62.35435485839844,
        "interaction_matrix_overlap_bottom_k": -19.994949340820312,
        "effective_rank": -6.128098964691162,
        "effective_rank_mergeability_score": 15.43166446685791,
        "stable_rank": -17.026485443115234,
        "spectral_gap": 4.79395055770874,
        "singular_value_ratio": -9.442439079284668,
        "layerwise_effective_rank": -5.772395610809326,
        "layerwise_effective_rank_mergeability_score": -11.50314712524414,
        "task_vector_cosine_similarity": 62.59025573730469,
        "task_vector_l2_distance": -1.1867481470108032,
        "task_vector_dot_product": -6.668182849884033,
        "weight_space_angle": -1.935566782951355,
        "task_vector_magnitude_ratio": 30.324426651000977,
        "singular_value_overlap": 23.692346572875977,
        "subspace_overlap": -3.6346404552459717,
        "right_subspace_overlap": 23.697519302368164,
        "encoder_gradient_cosine_similarity": 41.29556655883789,
        "encoder_gradient_l2_distance": -62.6771354675293,
        "encoder_gradient_dot_product": 11.581403732299805,
        "input_gradient_cosine_similarity": 5.238542079925537,
        "input_gradient_l2_distance": -74.91732025146484,
        "input_gradient_dot_product": -44.66096878051758
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7790270159799468,
      "val_r": 0.6999502506492411,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.441356182098389,
        "right_subspace_overlap_bottom_k": -3.8070268630981445,
        "interaction_matrix_overlap_top_k": 3.559030055999756,
        "interaction_matrix_overlap_bottom_k": -2.8010973930358887,
        "effective_rank": 0.7914722561836243,
        "effective_rank_mergeability_score": 1.4214928150177002,
        "stable_rank": -2.775038480758667,
        "spectral_gap": 6.940905570983887,
        "singular_value_ratio": 3.6927669048309326,
        "layerwise_effective_rank": 1.247322916984558,
        "layerwise_effective_rank_mergeability_score": -2.063248634338379,
        "task_vector_cosine_similarity": -2.397775411605835,
        "task_vector_l2_distance": -3.3664662837982178,
        "task_vector_dot_product": 2.379812240600586,
        "weight_space_angle": -0.48706644773483276,
        "task_vector_magnitude_ratio": 3.1371116638183594,
        "singular_value_overlap": 3.082728624343872,
        "subspace_overlap": -9.982644081115723,
        "right_subspace_overlap": 6.180954933166504,
        "encoder_gradient_cosine_similarity": 1.1135538816452026,
        "encoder_gradient_l2_distance": -6.981871128082275,
        "encoder_gradient_dot_product": 1.3775967359542847,
        "input_gradient_cosine_similarity": 0.5431467890739441,
        "input_gradient_l2_distance": -3.3368935585021973,
        "input_gradient_dot_product": -1.911065697669983
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5790384972891656,
      "val_r": 0.6768403096553164,
      "n_iterations": 816,
      "coefficients": {
        "right_subspace_overlap_top_k": 14.90977954864502,
        "right_subspace_overlap_bottom_k": -49.54831314086914,
        "interaction_matrix_overlap_top_k": 27.799217224121094,
        "interaction_matrix_overlap_bottom_k": -35.8800163269043,
        "effective_rank": -27.263368606567383,
        "effective_rank_mergeability_score": -33.489288330078125,
        "stable_rank": -41.55125045776367,
        "spectral_gap": 13.870603561401367,
        "singular_value_ratio": 28.011783599853516,
        "layerwise_effective_rank": 27.037277221679688,
        "layerwise_effective_rank_mergeability_score": 13.145715713500977,
        "task_vector_cosine_similarity": 50.83049774169922,
        "task_vector_l2_distance": 15.118517875671387,
        "task_vector_dot_product": 11.27409839630127,
        "weight_space_angle": -33.37371826171875,
        "task_vector_magnitude_ratio": 3.802959442138672,
        "singular_value_overlap": 30.570146560668945,
        "subspace_overlap": 68.5987319946289,
        "right_subspace_overlap": -32.21512985229492,
        "encoder_gradient_cosine_similarity": 30.147212982177734,
        "encoder_gradient_l2_distance": -49.23640441894531,
        "encoder_gradient_dot_product": 5.657569885253906,
        "input_gradient_cosine_similarity": 7.1517839431762695,
        "input_gradient_l2_distance": -61.344913482666016,
        "input_gradient_dot_product": 16.9746036529541
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7159204135891603,
      "val_r": 0.689844929971069,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.0224545001983643,
        "right_subspace_overlap_bottom_k": -3.3090426921844482,
        "interaction_matrix_overlap_top_k": 1.193803071975708,
        "interaction_matrix_overlap_bottom_k": 0.6667261719703674,
        "effective_rank": 1.9366470575332642,
        "effective_rank_mergeability_score": 0.7802411913871765,
        "stable_rank": -0.8420431017875671,
        "spectral_gap": 1.4304769039154053,
        "singular_value_ratio": 1.3639343976974487,
        "layerwise_effective_rank": -0.20991410315036774,
        "layerwise_effective_rank_mergeability_score": 0.29965469241142273,
        "task_vector_cosine_similarity": 1.4792081117630005,
        "task_vector_l2_distance": -1.2992231845855713,
        "task_vector_dot_product": 0.7268633246421814,
        "weight_space_angle": 1.1913421154022217,
        "task_vector_magnitude_ratio": -0.3073752820491791,
        "singular_value_overlap": 0.8218332529067993,
        "subspace_overlap": -3.0835883617401123,
        "right_subspace_overlap": 1.6335442066192627,
        "encoder_gradient_cosine_similarity": 1.0071847438812256,
        "encoder_gradient_l2_distance": -3.394143581390381,
        "encoder_gradient_dot_product": 0.9818428158760071,
        "input_gradient_cosine_similarity": 0.0301649272441864,
        "input_gradient_l2_distance": -2.8643686771392822,
        "input_gradient_dot_product": -1.2566584348678589
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4829327105055029,
      "val_r": 0.620234887882532,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 695.4249267578125,
        "right_subspace_overlap_bottom_k": -222.54833984375,
        "interaction_matrix_overlap_top_k": 222.08056640625,
        "interaction_matrix_overlap_bottom_k": 236.5356903076172,
        "effective_rank": 165.07479858398438,
        "effective_rank_mergeability_score": 295.53533935546875,
        "stable_rank": 457.72235107421875,
        "spectral_gap": 135.7885284423828,
        "singular_value_ratio": -7.342919826507568,
        "layerwise_effective_rank": -52.84562683105469,
        "layerwise_effective_rank_mergeability_score": -71.8589859008789,
        "task_vector_cosine_similarity": 28.959762573242188,
        "task_vector_l2_distance": -56.991294860839844,
        "task_vector_dot_product": -370.6653137207031,
        "weight_space_angle": -112.2515869140625,
        "task_vector_magnitude_ratio": -233.2469024658203,
        "singular_value_overlap": 191.39675903320312,
        "subspace_overlap": -68.48626708984375,
        "right_subspace_overlap": -595.7764892578125,
        "encoder_gradient_cosine_similarity": 137.3548126220703,
        "encoder_gradient_l2_distance": -358.9044189453125,
        "encoder_gradient_dot_product": 330.82305908203125,
        "input_gradient_cosine_similarity": -309.602294921875,
        "input_gradient_l2_distance": -147.7714385986328,
        "input_gradient_dot_product": -287.4062805175781
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6963643618631511,
      "val_r": 0.7563168839942555,
      "n_iterations": 883,
      "coefficients": {
        "right_subspace_overlap_top_k": 64.5670394897461,
        "right_subspace_overlap_bottom_k": -17.225711822509766,
        "interaction_matrix_overlap_top_k": 29.865644454956055,
        "interaction_matrix_overlap_bottom_k": -36.043296813964844,
        "effective_rank": 0.6510544419288635,
        "effective_rank_mergeability_score": -25.409440994262695,
        "stable_rank": 12.271642684936523,
        "spectral_gap": 54.711238861083984,
        "singular_value_ratio": -18.882946014404297,
        "layerwise_effective_rank": -17.371795654296875,
        "layerwise_effective_rank_mergeability_score": 46.26939010620117,
        "task_vector_cosine_similarity": 41.75468063354492,
        "task_vector_l2_distance": -28.458065032958984,
        "task_vector_dot_product": -11.140473365783691,
        "weight_space_angle": -6.176599502563477,
        "task_vector_magnitude_ratio": 83.31450653076172,
        "singular_value_overlap": 3.18609881401062,
        "subspace_overlap": -8.110136985778809,
        "right_subspace_overlap": -22.66680335998535,
        "encoder_gradient_cosine_similarity": 37.178035736083984,
        "encoder_gradient_l2_distance": -93.27980041503906,
        "encoder_gradient_dot_product": 15.073698043823242,
        "input_gradient_cosine_similarity": -16.198951721191406,
        "input_gradient_l2_distance": -43.182010650634766,
        "input_gradient_dot_product": -43.69871520996094
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}