{
  "aggregate_metrics": {
    "train_r": 0.23359234658597364,
    "train_p": 3.498877517451537e-41,
    "val_r": 0.11898863598701342,
    "val_p": 0.024353795486833807
  },
  "per_fold_stats": {
    "train_r_mean": 0.5270797362701849,
    "train_r_std": 0.07544790262355155,
    "val_r_mean": 0.4191882029622838,
    "val_r_std": 0.21070118641558142
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 28.822216033935547,
    "right_subspace_overlap_bottom_k": 4.52155065536499,
    "interaction_matrix_overlap_top_k": 19.766691207885742,
    "interaction_matrix_overlap_bottom_k": 11.455246925354004,
    "effective_rank": 0.11509702354669571,
    "effective_rank_mergeability_score": 5.937655448913574,
    "stable_rank": 0.6198938488960266,
    "spectral_gap": 11.27633285522461,
    "singular_value_ratio": 3.2245476245880127,
    "layerwise_effective_rank": 0.3268283009529114,
    "layerwise_effective_rank_mergeability_score": 8.269485473632812,
    "task_vector_cosine_similarity": 4.413418769836426,
    "task_vector_l2_distance": -27.284435272216797,
    "task_vector_dot_product": 9.811861991882324,
    "weight_space_angle": -8.904512405395508,
    "task_vector_magnitude_ratio": -9.00728988647461,
    "singular_value_overlap": -35.41975402832031,
    "subspace_overlap": 11.84252643585205,
    "right_subspace_overlap": 23.61832046508789,
    "encoder_gradient_cosine_similarity": 23.68423843383789,
    "encoder_gradient_l2_distance": -43.20964431762695,
    "encoder_gradient_dot_product": 24.743144989013672,
    "input_gradient_cosine_similarity": 11.849625587463379,
    "input_gradient_l2_distance": -43.05323028564453,
    "input_gradient_dot_product": -36.421791076660156
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 40.41632080078125,
    "right_subspace_overlap_bottom_k": 27.876697540283203,
    "interaction_matrix_overlap_top_k": 17.82134246826172,
    "interaction_matrix_overlap_bottom_k": 25.123579025268555,
    "effective_rank": 24.659578323364258,
    "effective_rank_mergeability_score": 29.381874084472656,
    "stable_rank": 29.792354583740234,
    "spectral_gap": 23.354808807373047,
    "singular_value_ratio": 20.56673240661621,
    "layerwise_effective_rank": 27.96288299560547,
    "layerwise_effective_rank_mergeability_score": 41.98396682739258,
    "task_vector_cosine_similarity": 44.980567932128906,
    "task_vector_l2_distance": 23.422279357910156,
    "task_vector_dot_product": 47.153079986572266,
    "weight_space_angle": 18.934520721435547,
    "task_vector_magnitude_ratio": 32.61367416381836,
    "singular_value_overlap": 23.4042911529541,
    "subspace_overlap": 33.957275390625,
    "right_subspace_overlap": 27.917984008789062,
    "encoder_gradient_cosine_similarity": 18.076263427734375,
    "encoder_gradient_l2_distance": 29.93277931213379,
    "encoder_gradient_dot_product": 16.545162200927734,
    "input_gradient_cosine_similarity": 17.707103729248047,
    "input_gradient_l2_distance": 43.75696563720703,
    "input_gradient_dot_product": 32.650054931640625
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5794349725726791,
      "val_r": 0.6906302304305941,
      "n_iterations": 877,
      "coefficients": {
        "right_subspace_overlap_top_k": 25.231170654296875,
        "right_subspace_overlap_bottom_k": 7.753875732421875,
        "interaction_matrix_overlap_top_k": 5.822181701660156,
        "interaction_matrix_overlap_bottom_k": 23.349027633666992,
        "effective_rank": -13.996007919311523,
        "effective_rank_mergeability_score": 25.17545509338379,
        "stable_rank": 3.2561628818511963,
        "spectral_gap": 12.557059288024902,
        "singular_value_ratio": -36.53904724121094,
        "layerwise_effective_rank": 38.66532516479492,
        "layerwise_effective_rank_mergeability_score": -23.802946090698242,
        "task_vector_cosine_similarity": 19.043535232543945,
        "task_vector_l2_distance": -48.9365119934082,
        "task_vector_dot_product": -4.846920013427734,
        "weight_space_angle": 30.862825393676758,
        "task_vector_magnitude_ratio": 16.201923370361328,
        "singular_value_overlap": -55.30916213989258,
        "subspace_overlap": 17.67266273498535,
        "right_subspace_overlap": 24.0223445892334,
        "encoder_gradient_cosine_similarity": 8.785720825195312,
        "encoder_gradient_l2_distance": -24.12119483947754,
        "encoder_gradient_dot_product": 36.07170867919922,
        "input_gradient_cosine_similarity": 0.5084198117256165,
        "input_gradient_l2_distance": -44.372032165527344,
        "input_gradient_dot_product": -42.05726623535156
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5434490982854907,
      "val_r": 0.553033231946783,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.12552528083324432,
        "right_subspace_overlap_bottom_k": -5.104091167449951,
        "interaction_matrix_overlap_top_k": 17.492555618286133,
        "interaction_matrix_overlap_bottom_k": 15.97929859161377,
        "effective_rank": 5.954941272735596,
        "effective_rank_mergeability_score": 2.0510504245758057,
        "stable_rank": -2.3330748081207275,
        "spectral_gap": 7.639285564422607,
        "singular_value_ratio": 2.866452932357788,
        "layerwise_effective_rank": 8.14999008178711,
        "layerwise_effective_rank_mergeability_score": 4.828269958496094,
        "task_vector_cosine_similarity": -0.5405360460281372,
        "task_vector_l2_distance": -27.38144302368164,
        "task_vector_dot_product": 8.05325984954834,
        "weight_space_angle": 9.176724433898926,
        "task_vector_magnitude_ratio": -11.924543380737305,
        "singular_value_overlap": -25.94948387145996,
        "subspace_overlap": 11.978182792663574,
        "right_subspace_overlap": 20.566850662231445,
        "encoder_gradient_cosine_similarity": 8.984541893005371,
        "encoder_gradient_l2_distance": -29.931184768676758,
        "encoder_gradient_dot_product": 18.89719581604004,
        "input_gradient_cosine_similarity": 7.966216087341309,
        "input_gradient_l2_distance": -20.126293182373047,
        "input_gradient_dot_product": -26.421207427978516
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5006553972701652,
      "val_r": 0.40764907887283097,
      "n_iterations": 560,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.31873893737793,
        "right_subspace_overlap_bottom_k": 4.812002658843994,
        "interaction_matrix_overlap_top_k": 11.620749473571777,
        "interaction_matrix_overlap_bottom_k": 20.791460037231445,
        "effective_rank": 2.6991777420043945,
        "effective_rank_mergeability_score": 5.504918575286865,
        "stable_rank": -27.4345703125,
        "spectral_gap": -30.288726806640625,
        "singular_value_ratio": 17.934066772460938,
        "layerwise_effective_rank": 21.716079711914062,
        "layerwise_effective_rank_mergeability_score": 39.20319366455078,
        "task_vector_cosine_similarity": 35.139137268066406,
        "task_vector_l2_distance": -19.099811553955078,
        "task_vector_dot_product": -9.778711318969727,
        "weight_space_angle": -20.5643367767334,
        "task_vector_magnitude_ratio": -46.80939865112305,
        "singular_value_overlap": -74.14717864990234,
        "subspace_overlap": 39.69877243041992,
        "right_subspace_overlap": 82.50672912597656,
        "encoder_gradient_cosine_similarity": 44.127777099609375,
        "encoder_gradient_l2_distance": -29.39409637451172,
        "encoder_gradient_dot_product": 33.43394088745117,
        "input_gradient_cosine_similarity": 26.029855728149414,
        "input_gradient_l2_distance": -81.52207946777344,
        "input_gradient_dot_product": -55.50041198730469
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.562363179129151,
      "val_r": 0.34372998636070073,
      "n_iterations": 672,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.627059936523438,
        "right_subspace_overlap_bottom_k": -35.52219009399414,
        "interaction_matrix_overlap_top_k": 8.53035831451416,
        "interaction_matrix_overlap_bottom_k": 59.382083892822266,
        "effective_rank": 25.416934967041016,
        "effective_rank_mergeability_score": 8.79483699798584,
        "stable_rank": -9.9962797164917,
        "spectral_gap": 26.30656623840332,
        "singular_value_ratio": 1.5121126174926758,
        "layerwise_effective_rank": 4.18583869934082,
        "layerwise_effective_rank_mergeability_score": 6.969919204711914,
        "task_vector_cosine_similarity": 30.633665084838867,
        "task_vector_l2_distance": -30.13035011291504,
        "task_vector_dot_product": -24.26004409790039,
        "weight_space_angle": -5.093570232391357,
        "task_vector_magnitude_ratio": 5.376677989959717,
        "singular_value_overlap": -28.130151748657227,
        "subspace_overlap": -5.475264072418213,
        "right_subspace_overlap": 27.538070678710938,
        "encoder_gradient_cosine_similarity": 13.587257385253906,
        "encoder_gradient_l2_distance": -60.46233367919922,
        "encoder_gradient_dot_product": 36.46807861328125,
        "input_gradient_cosine_similarity": 12.626341819763184,
        "input_gradient_l2_distance": -38.414466857910156,
        "input_gradient_dot_product": -38.47322463989258
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.42504437945440454,
      "val_r": 0.5981839324664783,
      "n_iterations": 851,
      "coefficients": {
        "right_subspace_overlap_top_k": 173.0087127685547,
        "right_subspace_overlap_bottom_k": 84.06490325927734,
        "interaction_matrix_overlap_top_k": 67.6689453125,
        "interaction_matrix_overlap_bottom_k": -33.59153747558594,
        "effective_rank": 77.12539672851562,
        "effective_rank_mergeability_score": -110.21184539794922,
        "stable_rank": 105.73715209960938,
        "spectral_gap": 74.83124542236328,
        "singular_value_ratio": 50.760009765625,
        "layerwise_effective_rank": -78.17135620117188,
        "layerwise_effective_rank_mergeability_score": 175.09779357910156,
        "task_vector_cosine_similarity": -145.56919860839844,
        "task_vector_l2_distance": -63.62986373901367,
        "task_vector_dot_product": 173.61900329589844,
        "weight_space_angle": -17.865007400512695,
        "task_vector_magnitude_ratio": -122.41901397705078,
        "singular_value_overlap": 1.701330304145813,
        "subspace_overlap": -113.51852416992188,
        "right_subspace_overlap": -13.586051940917969,
        "encoder_gradient_cosine_similarity": 29.393903732299805,
        "encoder_gradient_l2_distance": -137.97726440429688,
        "encoder_gradient_dot_product": 20.120121002197266,
        "input_gradient_cosine_similarity": -36.2176399230957,
        "input_gradient_l2_distance": -211.1871795654297,
        "input_gradient_dot_product": 51.81420135498047
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.53595228476217,
      "val_r": 0.6328196512848334,
      "n_iterations": 614,
      "coefficients": {
        "right_subspace_overlap_top_k": 16.688907623291016,
        "right_subspace_overlap_bottom_k": 36.649253845214844,
        "interaction_matrix_overlap_top_k": 20.868141174316406,
        "interaction_matrix_overlap_bottom_k": 2.3466362953186035,
        "effective_rank": -13.015671730041504,
        "effective_rank_mergeability_score": 24.252622604370117,
        "stable_rank": -13.956000328063965,
        "spectral_gap": 16.20841407775879,
        "singular_value_ratio": 40.006141662597656,
        "layerwise_effective_rank": 7.118646621704102,
        "layerwise_effective_rank_mergeability_score": -12.595270156860352,
        "task_vector_cosine_similarity": 22.96942901611328,
        "task_vector_l2_distance": -67.86071014404297,
        "task_vector_dot_product": 55.10540771484375,
        "weight_space_angle": -10.394895553588867,
        "task_vector_magnitude_ratio": -39.20844268798828,
        "singular_value_overlap": -57.1446418762207,
        "subspace_overlap": 0.017192581668496132,
        "right_subspace_overlap": 22.977062225341797,
        "encoder_gradient_cosine_similarity": 20.466764450073242,
        "encoder_gradient_l2_distance": -74.65922546386719,
        "encoder_gradient_dot_product": 47.83258819580078,
        "input_gradient_cosine_similarity": 43.29435729980469,
        "input_gradient_l2_distance": -27.78706169128418,
        "input_gradient_dot_product": -59.182132720947266
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.6060186479081547,
      "val_r": 0.28439156010624245,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.2872185707092285,
        "right_subspace_overlap_bottom_k": -6.589474201202393,
        "interaction_matrix_overlap_top_k": -1.6062812805175781,
        "interaction_matrix_overlap_bottom_k": 12.853020668029785,
        "effective_rank": -1.4016666412353516,
        "effective_rank_mergeability_score": 1.3390460014343262,
        "stable_rank": -2.75228214263916,
        "spectral_gap": 0.09275646507740021,
        "singular_value_ratio": -2.254556179046631,
        "layerwise_effective_rank": 7.697523593902588,
        "layerwise_effective_rank_mergeability_score": 2.72774076461792,
        "task_vector_cosine_similarity": 5.081521034240723,
        "task_vector_l2_distance": -5.527209281921387,
        "task_vector_dot_product": -0.2134624719619751,
        "weight_space_angle": 4.713334083557129,
        "task_vector_magnitude_ratio": 1.5785547494888306,
        "singular_value_overlap": -3.3248696327209473,
        "subspace_overlap": -0.8305551409721375,
        "right_subspace_overlap": -0.1567082703113556,
        "encoder_gradient_cosine_similarity": 0.8803425431251526,
        "encoder_gradient_l2_distance": -6.268242359161377,
        "encoder_gradient_dot_product": 1.3030306100845337,
        "input_gradient_cosine_similarity": -0.5203531384468079,
        "input_gradient_l2_distance": -5.559966564178467,
        "input_gradient_dot_product": -2.5496084690093994
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4809683761823443,
      "val_r": 0.1665176781006173,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 26.21795654296875,
        "right_subspace_overlap_bottom_k": 1.3665375709533691,
        "interaction_matrix_overlap_top_k": 0.6761277318000793,
        "interaction_matrix_overlap_bottom_k": 32.8702507019043,
        "effective_rank": 9.045370101928711,
        "effective_rank_mergeability_score": -3.999992847442627,
        "stable_rank": 6.606378078460693,
        "spectral_gap": 33.54920959472656,
        "singular_value_ratio": -10.664334297180176,
        "layerwise_effective_rank": 1.960310935974121,
        "layerwise_effective_rank_mergeability_score": 1.1856580972671509,
        "task_vector_cosine_similarity": 5.343392372131348,
        "task_vector_l2_distance": -30.835487365722656,
        "task_vector_dot_product": -22.655765533447266,
        "weight_space_angle": -15.638031959533691,
        "task_vector_magnitude_ratio": -4.919414520263672,
        "singular_value_overlap": -43.13711166381836,
        "subspace_overlap": 22.934179306030273,
        "right_subspace_overlap": 38.19602584838867,
        "encoder_gradient_cosine_similarity": 17.61578941345215,
        "encoder_gradient_l2_distance": -42.76189041137695,
        "encoder_gradient_dot_product": 21.96087646484375,
        "input_gradient_cosine_similarity": 12.388995170593262,
        "input_gradient_l2_distance": -50.41630172729492,
        "input_gradient_dot_product": -5.890328884124756
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.4230013605749151,
      "val_r": -0.237415405203857,
      "n_iterations": 681,
      "coefficients": {
        "right_subspace_overlap_top_k": 85.5077896118164,
        "right_subspace_overlap_bottom_k": 1.4866149425506592,
        "interaction_matrix_overlap_top_k": 13.741585731506348,
        "interaction_matrix_overlap_bottom_k": 65.14694213867188,
        "effective_rank": -38.2010612487793,
        "effective_rank_mergeability_score": 41.12621307373047,
        "stable_rank": -51.29773712158203,
        "spectral_gap": -38.229949951171875,
        "singular_value_ratio": 24.51155662536621,
        "layerwise_effective_rank": -72.26951599121094,
        "layerwise_effective_rank_mergeability_score": 17.70159912109375,
        "task_vector_cosine_similarity": 83.83560943603516,
        "task_vector_l2_distance": -8.497260093688965,
        "task_vector_dot_product": -28.04459571838379,
        "weight_space_angle": -46.56793975830078,
        "task_vector_magnitude_ratio": 32.643394470214844,
        "singular_value_overlap": -45.3306884765625,
        "subspace_overlap": 53.49593734741211,
        "right_subspace_overlap": 5.193942546844482,
        "encoder_gradient_cosine_similarity": 69.20577239990234,
        "encoder_gradient_l2_distance": -64.40409851074219,
        "encoder_gradient_dot_product": 7.2777509689331055,
        "input_gradient_cosine_similarity": 36.564208984375,
        "input_gradient_l2_distance": -62.59157943725586,
        "input_gradient_dot_product": -81.00684356689453
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5230467492873645,
      "val_r": 0.3561880341361159,
      "n_iterations": 644,
      "coefficients": {
        "right_subspace_overlap_top_k": 29.599769592285156,
        "right_subspace_overlap_bottom_k": -10.454663276672363,
        "interaction_matrix_overlap_top_k": 21.249134063720703,
        "interaction_matrix_overlap_bottom_k": 21.133718490600586,
        "effective_rank": 7.405068397521973,
        "effective_rank_mergeability_score": 10.277453422546387,
        "stable_rank": -4.312119007110596,
        "spectral_gap": 9.745377540588379,
        "singular_value_ratio": 2.652841329574585,
        "layerwise_effective_rank": -4.102776050567627,
        "layerwise_effective_rank_mergeability_score": 0.6950420141220093,
        "task_vector_cosine_similarity": 23.0035400390625,
        "task_vector_l2_distance": -56.64482498168945,
        "task_vector_dot_product": 24.670833587646484,
        "weight_space_angle": -10.778775215148926,
        "task_vector_magnitude_ratio": -10.302460670471191,
        "singular_value_overlap": -53.113243103027344,
        "subspace_overlap": 11.909585952758789,
        "right_subspace_overlap": 41.11540603637695,
        "encoder_gradient_cosine_similarity": 32.9273681640625,
        "encoder_gradient_l2_distance": -46.49068069458008,
        "encoder_gradient_dot_product": 54.25190353393555,
        "input_gradient_cosine_similarity": 11.219986915588379,
        "input_gradient_l2_distance": -54.72598648071289,
        "input_gradient_dot_product": -49.933841705322266
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5523263306471146,
      "val_r": 0.36245335038017407,
      "n_iterations": 842,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.8442604541778564,
        "right_subspace_overlap_bottom_k": 9.745476722717285,
        "interaction_matrix_overlap_top_k": 9.486305236816406,
        "interaction_matrix_overlap_bottom_k": -0.14455777406692505,
        "effective_rank": 2.3393611907958984,
        "effective_rank_mergeability_score": 6.304585933685303,
        "stable_rank": -0.3367931544780731,
        "spectral_gap": 4.522006988525391,
        "singular_value_ratio": -3.0293612480163574,
        "layerwise_effective_rank": 4.3857526779174805,
        "layerwise_effective_rank_mergeability_score": 0.916335940361023,
        "task_vector_cosine_similarity": -2.315532684326172,
        "task_vector_l2_distance": -12.271551132202148,
        "task_vector_dot_product": 3.150470495223999,
        "weight_space_angle": 0.9356421232223511,
        "task_vector_magnitude_ratio": 4.193097114562988,
        "singular_value_overlap": -7.550382137298584,
        "subspace_overlap": -6.91627311706543,
        "right_subspace_overlap": -1.96429443359375,
        "encoder_gradient_cosine_similarity": 1.5201343297958374,
        "encoder_gradient_l2_distance": -9.352548599243164,
        "encoder_gradient_dot_product": 2.2378687858581543,
        "input_gradient_cosine_similarity": 3.7689249515533447,
        "input_gradient_l2_distance": -9.075196266174316,
        "input_gradient_dot_product": -3.3951518535614014
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.559282004662562,
      "val_r": 0.5437663457773889,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 13.933403968811035,
        "right_subspace_overlap_bottom_k": -6.460270404815674,
        "interaction_matrix_overlap_top_k": 2.883068561553955,
        "interaction_matrix_overlap_bottom_k": 15.538896560668945,
        "effective_rank": -5.336411476135254,
        "effective_rank_mergeability_score": 20.490991592407227,
        "stable_rank": -0.4658891558647156,
        "spectral_gap": 6.183124542236328,
        "singular_value_ratio": -1.2136716842651367,
        "layerwise_effective_rank": 15.708108901977539,
        "layerwise_effective_rank_mergeability_score": -17.651119232177734,
        "task_vector_cosine_similarity": -0.7896155714988708,
        "task_vector_l2_distance": -19.178577423095703,
        "task_vector_dot_product": 8.42264175415039,
        "weight_space_angle": 17.098196029663086,
        "task_vector_magnitude_ratio": -3.9417266845703125,
        "singular_value_overlap": -19.47324562072754,
        "subspace_overlap": 10.731890678405762,
        "right_subspace_overlap": 7.708592414855957,
        "encoder_gradient_cosine_similarity": 8.322310447692871,
        "encoder_gradient_l2_distance": -22.459653854370117,
        "encoder_gradient_dot_product": 8.303557395935059,
        "input_gradient_cosine_similarity": 6.105866432189941,
        "input_gradient_l2_distance": -16.20345115661621,
        "input_gradient_dot_product": -27.258424758911133
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4682139909664061,
      "val_r": 0.29370294663379054,
      "n_iterations": 735,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.5955771207809448,
        "right_subspace_overlap_bottom_k": 9.733588218688965,
        "interaction_matrix_overlap_top_k": 31.763731002807617,
        "interaction_matrix_overlap_bottom_k": 7.494326114654541,
        "effective_rank": 2.0912094116210938,
        "effective_rank_mergeability_score": -5.602400779724121,
        "stable_rank": 19.60036849975586,
        "spectral_gap": 9.14667797088623,
        "singular_value_ratio": -24.106523513793945,
        "layerwise_effective_rank": -2.2951579093933105,
        "layerwise_effective_rank_mergeability_score": 10.927634239196777,
        "task_vector_cosine_similarity": 20.076671600341797,
        "task_vector_l2_distance": -32.01681900024414,
        "task_vector_dot_product": 49.48751449584961,
        "weight_space_angle": -41.91981887817383,
        "task_vector_magnitude_ratio": 2.7814252376556396,
        "singular_value_overlap": -52.19630432128906,
        "subspace_overlap": 19.380382537841797,
        "right_subspace_overlap": -5.665317535400391,
        "encoder_gradient_cosine_similarity": 33.0831413269043,
        "encoder_gradient_l2_distance": -32.70826721191406,
        "encoder_gradient_dot_product": 49.238162994384766,
        "input_gradient_cosine_similarity": 15.434008598327637,
        "input_gradient_l2_distance": -29.907487869262695,
        "input_gradient_dot_product": -54.418521881103516
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.43177015369252514,
      "val_r": 0.6259147767594183,
      "n_iterations": 593,
      "coefficients": {
        "right_subspace_overlap_top_k": 18.511707305908203,
        "right_subspace_overlap_bottom_k": 25.75614356994629,
        "interaction_matrix_overlap_top_k": 39.07170104980469,
        "interaction_matrix_overlap_bottom_k": -39.59376907348633,
        "effective_rank": -50.14693069458008,
        "effective_rank_mergeability_score": 21.66080093383789,
        "stable_rank": -6.098048686981201,
        "spectral_gap": 33.44068145751953,
        "singular_value_ratio": -11.31181812286377,
        "layerwise_effective_rank": 33.25820541381836,
        "layerwise_effective_rank_mergeability_score": -19.341053009033203,
        "task_vector_cosine_similarity": -71.87890625,
        "task_vector_l2_distance": -10.440939903259277,
        "task_vector_dot_product": 0.9222930073738098,
        "weight_space_angle": -1.521875023841858,
        "task_vector_magnitude_ratio": 40.69817352294922,
        "singular_value_overlap": -52.177066802978516,
        "subspace_overlap": 44.80474853515625,
        "right_subspace_overlap": 101.29399108886719,
        "encoder_gradient_cosine_similarity": 47.077518463134766,
        "encoder_gradient_l2_distance": -70.74433898925781,
        "encoder_gradient_dot_product": 11.206059455871582,
        "input_gradient_cosine_similarity": 2.6174027919769287,
        "input_gradient_l2_distance": -16.060901641845703,
        "input_gradient_dot_product": -70.00631713867188
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4267493105953266,
      "val_r": 0.5761630681990627,
      "n_iterations": 934,
      "coefficients": {
        "right_subspace_overlap_top_k": 75.25934600830078,
        "right_subspace_overlap_bottom_k": -46.73640060424805,
        "interaction_matrix_overlap_top_k": 34.34864044189453,
        "interaction_matrix_overlap_bottom_k": 15.61064338684082,
        "effective_rank": -25.873811721801758,
        "effective_rank_mergeability_score": 22.9234676361084,
        "stable_rank": -15.610968589782715,
        "spectral_gap": 16.771728515625,
        "singular_value_ratio": -3.8964145183563232,
        "layerwise_effective_rank": 3.37788462638855,
        "layerwise_effective_rank_mergeability_score": -36.409202575683594,
        "task_vector_cosine_similarity": 25.98237419128418,
        "task_vector_l2_distance": -46.71500778198242,
        "task_vector_dot_product": 26.040889739990234,
        "weight_space_angle": -7.79760217666626,
        "task_vector_magnitude_ratio": 7.204225540161133,
        "singular_value_overlap": -70.55900573730469,
        "subspace_overlap": 34.70768737792969,
        "right_subspace_overlap": 42.275535583496094,
        "encoder_gradient_cosine_similarity": 51.94562911987305,
        "encoder_gradient_l2_distance": -52.21907424926758,
        "encoder_gradient_dot_product": 38.22370147705078,
        "input_gradient_cosine_similarity": 10.884904861450195,
        "input_gradient_l2_distance": -18.930143356323242,
        "input_gradient_dot_product": -79.8107681274414
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5234482628950385,
      "val_r": 0.324962330281244,
      "n_iterations": 578,
      "coefficients": {
        "right_subspace_overlap_top_k": 23.093372344970703,
        "right_subspace_overlap_bottom_k": 8.336146354675293,
        "interaction_matrix_overlap_top_k": 39.1578483581543,
        "interaction_matrix_overlap_bottom_k": -11.3031005859375,
        "effective_rank": 8.395235061645508,
        "effective_rank_mergeability_score": 22.694334030151367,
        "stable_rank": -24.98686408996582,
        "spectral_gap": 16.827533721923828,
        "singular_value_ratio": 18.705846786499023,
        "layerwise_effective_rank": 16.69921112060547,
        "layerwise_effective_rank_mergeability_score": -14.714447975158691,
        "task_vector_cosine_similarity": 36.72145462036133,
        "task_vector_l2_distance": -48.15574264526367,
        "task_vector_dot_product": 10.358277320861816,
        "weight_space_angle": -18.935791015625,
        "task_vector_magnitude_ratio": -16.920522689819336,
        "singular_value_overlap": -35.771209716796875,
        "subspace_overlap": 16.20085906982422,
        "right_subspace_overlap": 38.11738967895508,
        "encoder_gradient_cosine_similarity": 21.38450813293457,
        "encoder_gradient_l2_distance": -47.4753303527832,
        "encoder_gradient_dot_product": 39.91044235229492,
        "input_gradient_cosine_similarity": 25.9606876373291,
        "input_gradient_l2_distance": -43.985286712646484,
        "input_gradient_dot_product": -79.31743621826172
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6339239253484723,
      "val_r": 0.6271747105043887,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.7030816674232483,
        "right_subspace_overlap_bottom_k": -1.3194390535354614,
        "interaction_matrix_overlap_top_k": -1.3045084476470947,
        "interaction_matrix_overlap_bottom_k": 1.6603361368179321,
        "effective_rank": 0.8246133327484131,
        "effective_rank_mergeability_score": 0.8438488841056824,
        "stable_rank": -0.43540260195732117,
        "spectral_gap": 0.7436414361000061,
        "singular_value_ratio": 1.3213874101638794,
        "layerwise_effective_rank": 0.05950816348195076,
        "layerwise_effective_rank_mergeability_score": -0.30908089876174927,
        "task_vector_cosine_similarity": -0.10105843096971512,
        "task_vector_l2_distance": -0.3238810896873474,
        "task_vector_dot_product": 0.26616933941841125,
        "weight_space_angle": -0.4470946490764618,
        "task_vector_magnitude_ratio": -0.5447966456413269,
        "singular_value_overlap": -0.2389024794101715,
        "subspace_overlap": 0.02082696370780468,
        "right_subspace_overlap": 0.1490701138973236,
        "encoder_gradient_cosine_similarity": 0.02915845811367035,
        "encoder_gradient_l2_distance": -0.24531660974025726,
        "encoder_gradient_dot_product": 0.08452872186899185,
        "input_gradient_cosine_similarity": 0.03306785598397255,
        "input_gradient_l2_distance": -0.34659719467163086,
        "input_gradient_dot_product": -0.1244048923254013
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.46415642713935423,
      "val_r": 0.27998057552809863,
      "n_iterations": 452,
      "coefficients": {
        "right_subspace_overlap_top_k": 50.51213073730469,
        "right_subspace_overlap_bottom_k": 47.291866302490234,
        "interaction_matrix_overlap_top_k": 8.86070442199707,
        "interaction_matrix_overlap_bottom_k": 0.410295307636261,
        "effective_rank": -9.540502548217773,
        "effective_rank_mergeability_score": -6.258843421936035,
        "stable_rank": 38.57206726074219,
        "spectral_gap": 9.550190925598145,
        "singular_value_ratio": -23.652217864990234,
        "layerwise_effective_rank": -9.4213285446167,
        "layerwise_effective_rank_mergeability_score": 16.242231369018555,
        "task_vector_cosine_similarity": 27.029829025268555,
        "task_vector_l2_distance": 19.34555435180664,
        "task_vector_dot_product": -83.88105773925781,
        "weight_space_angle": -39.743919372558594,
        "task_vector_magnitude_ratio": -20.537233352661133,
        "singular_value_overlap": -44.7902946472168,
        "subspace_overlap": 54.19511032104492,
        "right_subspace_overlap": 22.23213768005371,
        "encoder_gradient_cosine_similarity": 28.091524124145508,
        "encoder_gradient_l2_distance": -55.82686233520508,
        "encoder_gradient_dot_product": 29.862712860107422,
        "input_gradient_cosine_similarity": 45.27146530151367,
        "input_gradient_l2_distance": -59.692771911621094,
        "input_gradient_dot_product": -43.12609100341797
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7174574083805669,
      "val_r": 0.5653813813897329,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.390468597412109,
        "right_subspace_overlap_bottom_k": -21.386859893798828,
        "interaction_matrix_overlap_top_k": 47.008155822753906,
        "interaction_matrix_overlap_bottom_k": -12.72534465789795,
        "effective_rank": 10.950394630432129,
        "effective_rank_mergeability_score": 24.135658264160156,
        "stable_rank": -4.904451370239258,
        "spectral_gap": -14.820734977722168,
        "singular_value_ratio": -0.3407781720161438,
        "layerwise_effective_rank": -7.766732692718506,
        "layerwise_effective_rank_mergeability_score": -10.444629669189453,
        "task_vector_cosine_similarity": 0.2673704922199249,
        "task_vector_l2_distance": 6.8067522048950195,
        "task_vector_dot_product": -3.215407371520996,
        "weight_space_angle": 8.997876167297363,
        "task_vector_magnitude_ratio": -5.43796443939209,
        "singular_value_overlap": 1.3659943342208862,
        "subspace_overlap": 5.707612037658691,
        "right_subspace_overlap": 8.730350494384766,
        "encoder_gradient_cosine_similarity": 15.668286323547363,
        "encoder_gradient_l2_distance": -21.144027709960938,
        "encoder_gradient_dot_product": 10.666647911071777,
        "input_gradient_cosine_similarity": -2.1893627643585205,
        "input_gradient_l2_distance": -25.151046752929688,
        "input_gradient_dot_product": -15.169817924499512
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5843324656494935,
      "val_r": 0.38853659529103873,
      "n_iterations": 848,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.988145351409912,
        "right_subspace_overlap_bottom_k": -12.991991996765137,
        "interaction_matrix_overlap_top_k": 17.994678497314453,
        "interaction_matrix_overlap_bottom_k": 31.89631462097168,
        "effective_rank": 7.5663018226623535,
        "effective_rank_mergeability_score": 7.250909805297852,
        "stable_rank": 3.5462357997894287,
        "spectral_gap": 30.750585556030273,
        "singular_value_ratio": 21.229257583618164,
        "layerwise_effective_rank": 17.581045150756836,
        "layerwise_effective_rank_mergeability_score": 24.16205406188965,
        "task_vector_cosine_similarity": -25.664306640625,
        "task_vector_l2_distance": -44.19503402709961,
        "task_vector_dot_product": 13.0364351272583,
        "weight_space_angle": -12.606192588806152,
        "task_vector_magnitude_ratio": -7.857732772827148,
        "singular_value_overlap": -43.11944580078125,
        "subspace_overlap": 20.135494232177734,
        "right_subspace_overlap": 11.115256309509277,
        "encoder_gradient_cosine_similarity": 20.587339401245117,
        "encoder_gradient_l2_distance": -35.54729461669922,
        "encoder_gradient_dot_product": 27.51205062866211,
        "input_gradient_cosine_similarity": 15.245153427124023,
        "input_gradient_l2_distance": -45.00881576538086,
        "input_gradient_dot_product": -46.608253479003906
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}