{
  "aggregate_metrics": {
    "train_r": 0.16727052636986867,
    "train_p": 1.1953097159150748e-21,
    "val_r": 0.19602247759523134,
    "val_p": 0.0001897999447864549
  },
  "per_fold_stats": {
    "train_r_mean": 0.4806556586097314,
    "train_r_std": 0.09117042485445828,
    "val_r_mean": 0.37584147475286855,
    "val_r_std": 0.20419107919939009
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 48.140846252441406,
    "right_subspace_overlap_bottom_k": 36.38416290283203,
    "interaction_matrix_overlap_top_k": 5.945261478424072,
    "interaction_matrix_overlap_bottom_k": 39.328609466552734,
    "effective_rank": -4.18609619140625,
    "effective_rank_mergeability_score": 7.503643989562988,
    "stable_rank": -3.0267465114593506,
    "spectral_gap": 0.3822577893733978,
    "singular_value_ratio": -21.330726623535156,
    "layerwise_effective_rank": -5.568869590759277,
    "layerwise_effective_rank_mergeability_score": -11.3728609085083,
    "task_vector_cosine_similarity": -3.768975019454956,
    "task_vector_l2_distance": -35.93769454956055,
    "task_vector_dot_product": -8.367576599121094,
    "weight_space_angle": 29.854145050048828,
    "task_vector_magnitude_ratio": -7.449483394622803,
    "singular_value_overlap": -42.277854919433594,
    "subspace_overlap": 17.339656829833984,
    "right_subspace_overlap": 17.883533477783203,
    "encoder_gradient_cosine_similarity": 14.315057754516602,
    "encoder_gradient_l2_distance": -25.734664916992188,
    "encoder_gradient_dot_product": 22.976688385009766,
    "input_gradient_cosine_similarity": 18.087373733520508,
    "input_gradient_l2_distance": -46.508689880371094,
    "input_gradient_dot_product": -41.61314010620117
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 51.13064956665039,
    "right_subspace_overlap_bottom_k": 65.27442932128906,
    "interaction_matrix_overlap_top_k": 41.54039001464844,
    "interaction_matrix_overlap_bottom_k": 49.813236236572266,
    "effective_rank": 56.09489822387695,
    "effective_rank_mergeability_score": 47.82360076904297,
    "stable_rank": 31.38559913635254,
    "spectral_gap": 34.13792419433594,
    "singular_value_ratio": 37.796295166015625,
    "layerwise_effective_rank": 33.98410415649414,
    "layerwise_effective_rank_mergeability_score": 45.553863525390625,
    "task_vector_cosine_similarity": 40.3008918762207,
    "task_vector_l2_distance": 43.703895568847656,
    "task_vector_dot_product": 44.586219787597656,
    "weight_space_angle": 71.57379150390625,
    "task_vector_magnitude_ratio": 30.82371711730957,
    "singular_value_overlap": 32.79603958129883,
    "subspace_overlap": 32.509300231933594,
    "right_subspace_overlap": 28.939348220825195,
    "encoder_gradient_cosine_similarity": 26.119535446166992,
    "encoder_gradient_l2_distance": 43.2000732421875,
    "encoder_gradient_dot_product": 45.62858963012695,
    "input_gradient_cosine_similarity": 18.023555755615234,
    "input_gradient_l2_distance": 46.92709732055664,
    "input_gradient_dot_product": 63.99600601196289
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.49035500096240414,
      "val_r": 0.5897749418371877,
      "n_iterations": 683,
      "coefficients": {
        "right_subspace_overlap_top_k": 68.73896026611328,
        "right_subspace_overlap_bottom_k": 91.37103271484375,
        "interaction_matrix_overlap_top_k": 31.14832878112793,
        "interaction_matrix_overlap_bottom_k": 69.36382293701172,
        "effective_rank": -8.577086448669434,
        "effective_rank_mergeability_score": 44.32826232910156,
        "stable_rank": -14.363791465759277,
        "spectral_gap": 36.11246109008789,
        "singular_value_ratio": -18.207965850830078,
        "layerwise_effective_rank": -4.282628059387207,
        "layerwise_effective_rank_mergeability_score": -42.51250076293945,
        "task_vector_cosine_similarity": 73.19514465332031,
        "task_vector_l2_distance": -119.96896362304688,
        "task_vector_dot_product": 23.724576950073242,
        "weight_space_angle": 49.45371627807617,
        "task_vector_magnitude_ratio": -5.297768592834473,
        "singular_value_overlap": -95.88085174560547,
        "subspace_overlap": 38.84658432006836,
        "right_subspace_overlap": -9.54377269744873,
        "encoder_gradient_cosine_similarity": -3.9951119422912598,
        "encoder_gradient_l2_distance": -102.61593627929688,
        "encoder_gradient_dot_product": 51.451873779296875,
        "input_gradient_cosine_similarity": 50.68821716308594,
        "input_gradient_l2_distance": -97.03130340576172,
        "input_gradient_dot_product": -105.14765167236328
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5432245058818463,
      "val_r": 0.5197328463708625,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.1730304956436157,
        "right_subspace_overlap_bottom_k": 5.983649253845215,
        "interaction_matrix_overlap_top_k": 1.4287620782852173,
        "interaction_matrix_overlap_bottom_k": 0.8823767304420471,
        "effective_rank": -0.040070656687021255,
        "effective_rank_mergeability_score": 3.375462532043457,
        "stable_rank": 0.46151888370513916,
        "spectral_gap": 0.31819936633110046,
        "singular_value_ratio": 1.1532124280929565,
        "layerwise_effective_rank": 3.736110210418701,
        "layerwise_effective_rank_mergeability_score": 1.5772892236709595,
        "task_vector_cosine_similarity": 1.262204647064209,
        "task_vector_l2_distance": -4.911165237426758,
        "task_vector_dot_product": 1.1923397779464722,
        "weight_space_angle": 0.8390842080116272,
        "task_vector_magnitude_ratio": -2.2200582027435303,
        "singular_value_overlap": -3.9218456745147705,
        "subspace_overlap": -1.608397364616394,
        "right_subspace_overlap": -1.7169439792633057,
        "encoder_gradient_cosine_similarity": -0.04548614099621773,
        "encoder_gradient_l2_distance": -4.299805641174316,
        "encoder_gradient_dot_product": 0.5524417757987976,
        "input_gradient_cosine_similarity": 1.2432482242584229,
        "input_gradient_l2_distance": -4.03558874130249,
        "input_gradient_dot_product": -1.3803950548171997
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5193761053119121,
      "val_r": 0.413398495600589,
      "n_iterations": 424,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.439212799072266,
        "right_subspace_overlap_bottom_k": 28.560771942138672,
        "interaction_matrix_overlap_top_k": 32.49717712402344,
        "interaction_matrix_overlap_bottom_k": 37.39506912231445,
        "effective_rank": 15.862244606018066,
        "effective_rank_mergeability_score": -3.6840758323669434,
        "stable_rank": 1.5780128240585327,
        "spectral_gap": 6.154335021972656,
        "singular_value_ratio": -16.540281295776367,
        "layerwise_effective_rank": 5.565829277038574,
        "layerwise_effective_rank_mergeability_score": 16.927337646484375,
        "task_vector_cosine_similarity": -2.214674949645996,
        "task_vector_l2_distance": -40.83401870727539,
        "task_vector_dot_product": 2.5227065086364746,
        "weight_space_angle": 7.882326602935791,
        "task_vector_magnitude_ratio": -12.583118438720703,
        "singular_value_overlap": -51.556156158447266,
        "subspace_overlap": 19.336524963378906,
        "right_subspace_overlap": -8.17296314239502,
        "encoder_gradient_cosine_similarity": 2.0466208457946777,
        "encoder_gradient_l2_distance": -25.047700881958008,
        "encoder_gradient_dot_product": 18.198028564453125,
        "input_gradient_cosine_similarity": 26.899076461791992,
        "input_gradient_l2_distance": -37.704261779785156,
        "input_gradient_dot_product": -29.531381607055664
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.579966174092056,
      "val_r": 0.48679996125164293,
      "n_iterations": 847,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.1486072987318039,
        "right_subspace_overlap_bottom_k": -0.9435663223266602,
        "interaction_matrix_overlap_top_k": -1.4640766382217407,
        "interaction_matrix_overlap_bottom_k": 1.4903098344802856,
        "effective_rank": 0.4781189262866974,
        "effective_rank_mergeability_score": 0.8408353924751282,
        "stable_rank": 0.3295753300189972,
        "spectral_gap": 0.3973301947116852,
        "singular_value_ratio": 0.4303008019924164,
        "layerwise_effective_rank": 0.2195240706205368,
        "layerwise_effective_rank_mergeability_score": 0.18679897487163544,
        "task_vector_cosine_similarity": -0.4655703008174896,
        "task_vector_l2_distance": -0.3021492063999176,
        "task_vector_dot_product": 0.3631507456302643,
        "weight_space_angle": -0.5819677114486694,
        "task_vector_magnitude_ratio": -0.19536836445331573,
        "singular_value_overlap": -0.3029221296310425,
        "subspace_overlap": 0.17772604525089264,
        "right_subspace_overlap": 0.591036856174469,
        "encoder_gradient_cosine_similarity": -0.018472040072083473,
        "encoder_gradient_l2_distance": -0.11984168738126755,
        "encoder_gradient_dot_product": 0.010038339532911777,
        "input_gradient_cosine_similarity": 0.09410955756902695,
        "input_gradient_l2_distance": -0.2772441506385803,
        "input_gradient_dot_product": -0.08771701157093048
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.30807196273297327,
      "val_r": 0.2773285391322126,
      "n_iterations": 468,
      "coefficients": {
        "right_subspace_overlap_top_k": 130.7686004638672,
        "right_subspace_overlap_bottom_k": 62.0387077331543,
        "interaction_matrix_overlap_top_k": -57.95948028564453,
        "interaction_matrix_overlap_bottom_k": 138.101318359375,
        "effective_rank": -95.37885284423828,
        "effective_rank_mergeability_score": 14.902533531188965,
        "stable_rank": -68.5762939453125,
        "spectral_gap": 43.962913513183594,
        "singular_value_ratio": 25.943735122680664,
        "layerwise_effective_rank": -16.68250846862793,
        "layerwise_effective_rank_mergeability_score": -93.28252410888672,
        "task_vector_cosine_similarity": 8.395706176757812,
        "task_vector_l2_distance": 83.86421203613281,
        "task_vector_dot_product": -46.50307846069336,
        "weight_space_angle": -75.29857635498047,
        "task_vector_magnitude_ratio": 27.581106185913086,
        "singular_value_overlap": -76.0792465209961,
        "subspace_overlap": 51.7332649230957,
        "right_subspace_overlap": 22.63361167907715,
        "encoder_gradient_cosine_similarity": 3.030287027359009,
        "encoder_gradient_l2_distance": -20.232995986938477,
        "encoder_gradient_dot_product": -21.400075912475586,
        "input_gradient_cosine_similarity": 54.47825622558594,
        "input_gradient_l2_distance": -56.36189270019531,
        "input_gradient_dot_product": -38.68196105957031
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.501065650851966,
      "val_r": 0.7885234591937846,
      "n_iterations": 827,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.45708075165748596,
        "right_subspace_overlap_bottom_k": -24.651683807373047,
        "interaction_matrix_overlap_top_k": -19.98405647277832,
        "interaction_matrix_overlap_bottom_k": 122.3342514038086,
        "effective_rank": 5.601956844329834,
        "effective_rank_mergeability_score": 75.49422454833984,
        "stable_rank": 18.2579402923584,
        "spectral_gap": -50.08512878417969,
        "singular_value_ratio": -16.114686965942383,
        "layerwise_effective_rank": 44.413875579833984,
        "layerwise_effective_rank_mergeability_score": -17.022911071777344,
        "task_vector_cosine_similarity": 40.059261322021484,
        "task_vector_l2_distance": -67.31298065185547,
        "task_vector_dot_product": -9.179458618164062,
        "weight_space_angle": 65.38018035888672,
        "task_vector_magnitude_ratio": -77.51123046875,
        "singular_value_overlap": -49.50196075439453,
        "subspace_overlap": -6.73118257522583,
        "right_subspace_overlap": 65.20758056640625,
        "encoder_gradient_cosine_similarity": -23.36789894104004,
        "encoder_gradient_l2_distance": -31.625972747802734,
        "encoder_gradient_dot_product": 20.550329208374023,
        "input_gradient_cosine_similarity": 19.949304580688477,
        "input_gradient_l2_distance": -91.67476654052734,
        "input_gradient_dot_product": 8.056106567382812
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5103951402716695,
      "val_r": -0.12236797934569221,
      "n_iterations": 771,
      "coefficients": {
        "right_subspace_overlap_top_k": 42.279197692871094,
        "right_subspace_overlap_bottom_k": 29.664146423339844,
        "interaction_matrix_overlap_top_k": -12.54101276397705,
        "interaction_matrix_overlap_bottom_k": 23.590370178222656,
        "effective_rank": -14.451151847839355,
        "effective_rank_mergeability_score": 9.533377647399902,
        "stable_rank": 31.096492767333984,
        "spectral_gap": 1.2811329364776611,
        "singular_value_ratio": -19.156038284301758,
        "layerwise_effective_rank": 0.7340141534805298,
        "layerwise_effective_rank_mergeability_score": -0.5556400418281555,
        "task_vector_cosine_similarity": 6.814720630645752,
        "task_vector_l2_distance": -56.55878448486328,
        "task_vector_dot_product": 9.925479888916016,
        "weight_space_angle": 65.87046813964844,
        "task_vector_magnitude_ratio": -22.49587631225586,
        "singular_value_overlap": -24.0910587310791,
        "subspace_overlap": 9.785345077514648,
        "right_subspace_overlap": 16.643905639648438,
        "encoder_gradient_cosine_similarity": 14.168031692504883,
        "encoder_gradient_l2_distance": -56.94136428833008,
        "encoder_gradient_dot_product": 32.49527359008789,
        "input_gradient_cosine_similarity": -3.7216618061065674,
        "input_gradient_l2_distance": -27.988113403320312,
        "input_gradient_dot_product": -54.383155822753906
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.36052520601603,
      "val_r": 0.2017799703031678,
      "n_iterations": 564,
      "coefficients": {
        "right_subspace_overlap_top_k": 162.6822967529297,
        "right_subspace_overlap_bottom_k": 40.73015594482422,
        "interaction_matrix_overlap_top_k": 56.48323059082031,
        "interaction_matrix_overlap_bottom_k": 1.1527973413467407,
        "effective_rank": 77.42587280273438,
        "effective_rank_mergeability_score": -68.17317962646484,
        "stable_rank": 45.50536346435547,
        "spectral_gap": 35.732948303222656,
        "singular_value_ratio": -120.54551696777344,
        "layerwise_effective_rank": -92.60032653808594,
        "layerwise_effective_rank_mergeability_score": 40.35059356689453,
        "task_vector_cosine_similarity": -77.54119873046875,
        "task_vector_l2_distance": 2.7235803604125977,
        "task_vector_dot_product": -151.60519409179688,
        "weight_space_angle": -10.938498497009277,
        "task_vector_magnitude_ratio": 29.817665100097656,
        "singular_value_overlap": -100.14379119873047,
        "subspace_overlap": 63.11049270629883,
        "right_subspace_overlap": 85.23873901367188,
        "encoder_gradient_cosine_similarity": 39.64943313598633,
        "encoder_gradient_l2_distance": 12.539162635803223,
        "encoder_gradient_dot_product": -16.206520080566406,
        "input_gradient_cosine_similarity": 0.9239580035209656,
        "input_gradient_l2_distance": -49.030303955078125,
        "input_gradient_dot_product": -6.284627437591553
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.4626262996150136,
      "val_r": 0.08626025633336071,
      "n_iterations": 562,
      "coefficients": {
        "right_subspace_overlap_top_k": 22.86854362487793,
        "right_subspace_overlap_bottom_k": 29.052242279052734,
        "interaction_matrix_overlap_top_k": 2.8914451599121094,
        "interaction_matrix_overlap_bottom_k": 11.669437408447266,
        "effective_rank": -3.7022366523742676,
        "effective_rank_mergeability_score": 8.753951072692871,
        "stable_rank": -8.223271369934082,
        "spectral_gap": 18.251188278198242,
        "singular_value_ratio": -12.545366287231445,
        "layerwise_effective_rank": 16.745704650878906,
        "layerwise_effective_rank_mergeability_score": -14.779810905456543,
        "task_vector_cosine_similarity": -1.9639562368392944,
        "task_vector_l2_distance": -25.07731819152832,
        "task_vector_dot_product": -18.087566375732422,
        "weight_space_angle": -0.14558765292167664,
        "task_vector_magnitude_ratio": -8.301324844360352,
        "singular_value_overlap": -46.397220611572266,
        "subspace_overlap": 9.588438987731934,
        "right_subspace_overlap": 46.38581466674805,
        "encoder_gradient_cosine_similarity": 40.027976989746094,
        "encoder_gradient_l2_distance": -33.93938446044922,
        "encoder_gradient_dot_product": 27.2001953125,
        "input_gradient_cosine_similarity": 18.871225357055664,
        "input_gradient_l2_distance": -32.4463005065918,
        "input_gradient_dot_product": -45.69949722290039
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.43018916804935015,
      "val_r": 0.3443708159487475,
      "n_iterations": 478,
      "coefficients": {
        "right_subspace_overlap_top_k": 109.91810607910156,
        "right_subspace_overlap_bottom_k": -31.887969970703125,
        "interaction_matrix_overlap_top_k": 53.033607482910156,
        "interaction_matrix_overlap_bottom_k": 151.68173217773438,
        "effective_rank": -70.0858154296875,
        "effective_rank_mergeability_score": 85.3682861328125,
        "stable_rank": -31.735443115234375,
        "spectral_gap": 15.583147048950195,
        "singular_value_ratio": -15.10242748260498,
        "layerwise_effective_rank": 11.590651512145996,
        "layerwise_effective_rank_mergeability_score": -80.56339263916016,
        "task_vector_cosine_similarity": 33.413108825683594,
        "task_vector_l2_distance": -44.22798156738281,
        "task_vector_dot_product": -73.55093383789062,
        "weight_space_angle": 30.21847152709961,
        "task_vector_magnitude_ratio": 38.7833251953125,
        "singular_value_overlap": -76.51423645019531,
        "subspace_overlap": -44.180450439453125,
        "right_subspace_overlap": 65.75931549072266,
        "encoder_gradient_cosine_similarity": 28.24026107788086,
        "encoder_gradient_l2_distance": -96.65394592285156,
        "encoder_gradient_dot_product": 39.627166748046875,
        "input_gradient_cosine_similarity": 19.98988151550293,
        "input_gradient_l2_distance": -35.18590545654297,
        "input_gradient_dot_product": -82.52163696289062
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5278138905116996,
      "val_r": 0.41308973333058924,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.9289132952690125,
        "right_subspace_overlap_bottom_k": 1.747924566268921,
        "interaction_matrix_overlap_top_k": -1.5441263914108276,
        "interaction_matrix_overlap_bottom_k": 2.561368942260742,
        "effective_rank": 0.3748024106025696,
        "effective_rank_mergeability_score": 1.8469417095184326,
        "stable_rank": 0.23585182428359985,
        "spectral_gap": 1.569064736366272,
        "singular_value_ratio": 0.8856971859931946,
        "layerwise_effective_rank": 0.40628114342689514,
        "layerwise_effective_rank_mergeability_score": -0.2704800069332123,
        "task_vector_cosine_similarity": 0.276921808719635,
        "task_vector_l2_distance": -2.6058290004730225,
        "task_vector_dot_product": 0.530279815196991,
        "weight_space_angle": 0.23550084233283997,
        "task_vector_magnitude_ratio": 0.1358768492937088,
        "singular_value_overlap": -2.1662657260894775,
        "subspace_overlap": 0.47068852186203003,
        "right_subspace_overlap": 0.8605725169181824,
        "encoder_gradient_cosine_similarity": -0.09770075231790543,
        "encoder_gradient_l2_distance": -1.4256117343902588,
        "encoder_gradient_dot_product": -0.20953790843486786,
        "input_gradient_cosine_similarity": 0.6213029623031616,
        "input_gradient_l2_distance": -1.9070841073989868,
        "input_gradient_dot_product": -0.6036344170570374
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5161946070826372,
      "val_r": 0.5225564417501579,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -5.518855094909668,
        "right_subspace_overlap_bottom_k": 4.472259044647217,
        "interaction_matrix_overlap_top_k": -11.92236614227295,
        "interaction_matrix_overlap_bottom_k": 36.340152740478516,
        "effective_rank": -4.099583148956299,
        "effective_rank_mergeability_score": 13.049490928649902,
        "stable_rank": -3.0482888221740723,
        "spectral_gap": -2.996523857116699,
        "singular_value_ratio": -24.1809024810791,
        "layerwise_effective_rank": 34.68445587158203,
        "layerwise_effective_rank_mergeability_score": 13.379128456115723,
        "task_vector_cosine_similarity": -35.865966796875,
        "task_vector_l2_distance": -30.150726318359375,
        "task_vector_dot_product": 40.0901985168457,
        "weight_space_angle": 19.57472038269043,
        "task_vector_magnitude_ratio": 6.2103095054626465,
        "singular_value_overlap": -28.33283233642578,
        "subspace_overlap": 33.10106658935547,
        "right_subspace_overlap": -0.43663856387138367,
        "encoder_gradient_cosine_similarity": 3.752599000930786,
        "encoder_gradient_l2_distance": -18.05718421936035,
        "encoder_gradient_dot_product": 0.7705238461494446,
        "input_gradient_cosine_similarity": 7.9250359535217285,
        "input_gradient_l2_distance": -21.743118286132812,
        "input_gradient_dot_product": -25.998279571533203
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.30568408561981003,
      "val_r": 0.20563159363478284,
      "n_iterations": 487,
      "coefficients": {
        "right_subspace_overlap_top_k": 144.8486785888672,
        "right_subspace_overlap_bottom_k": 268.0596618652344,
        "interaction_matrix_overlap_top_k": 136.26754760742188,
        "interaction_matrix_overlap_bottom_k": -49.37776184082031,
        "effective_rank": -143.35818481445312,
        "effective_rank_mergeability_score": -140.46041870117188,
        "stable_rank": 54.77898406982422,
        "spectral_gap": 9.353631973266602,
        "singular_value_ratio": -124.66056060791016,
        "layerwise_effective_rank": -35.83803176879883,
        "layerwise_effective_rank_mergeability_score": -117.64078521728516,
        "task_vector_cosine_similarity": -102.24683380126953,
        "task_vector_l2_distance": -101.19844055175781,
        "task_vector_dot_product": -9.010933876037598,
        "weight_space_angle": 307.7027587890625,
        "task_vector_magnitude_ratio": -50.191219329833984,
        "singular_value_overlap": 4.521020889282227,
        "subspace_overlap": -6.883511066436768,
        "right_subspace_overlap": 17.470035552978516,
        "encoder_gradient_cosine_similarity": 106.6142807006836,
        "encoder_gradient_l2_distance": 109.1449203491211,
        "encoder_gradient_dot_product": 202.94985961914062,
        "input_gradient_cosine_similarity": 29.562210083007812,
        "input_gradient_l2_distance": -218.01287841796875,
        "input_gradient_dot_product": -291.3970947265625
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3785328335015252,
      "val_r": 0.533250629795134,
      "n_iterations": 460,
      "coefficients": {
        "right_subspace_overlap_top_k": 62.11006164550781,
        "right_subspace_overlap_bottom_k": 134.5089569091797,
        "interaction_matrix_overlap_top_k": -31.567453384399414,
        "interaction_matrix_overlap_bottom_k": 3.839534044265747,
        "effective_rank": 135.1576385498047,
        "effective_rank_mergeability_score": 21.524856567382812,
        "stable_rank": -16.38140296936035,
        "spectral_gap": -108.87533569335938,
        "singular_value_ratio": -31.841753005981445,
        "layerwise_effective_rank": -97.14534759521484,
        "layerwise_effective_rank_mergeability_score": 76.30431365966797,
        "task_vector_cosine_similarity": -73.606201171875,
        "task_vector_l2_distance": -84.81754302978516,
        "task_vector_dot_product": 42.99125289916992,
        "weight_space_angle": -7.702002048492432,
        "task_vector_magnitude_ratio": -73.95779418945312,
        "singular_value_overlap": -47.57358932495117,
        "subspace_overlap": 21.47244644165039,
        "right_subspace_overlap": 51.58564758300781,
        "encoder_gradient_cosine_similarity": 22.3166446685791,
        "encoder_gradient_l2_distance": -35.274871826171875,
        "encoder_gradient_dot_product": 54.64216613769531,
        "input_gradient_cosine_similarity": 21.1329402923584,
        "input_gradient_l2_distance": -26.762996673583984,
        "input_gradient_dot_product": -11.083422660827637
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4433133670242425,
      "val_r": 0.4785354534298062,
      "n_iterations": 572,
      "coefficients": {
        "right_subspace_overlap_top_k": 28.396949768066406,
        "right_subspace_overlap_bottom_k": 12.875178337097168,
        "interaction_matrix_overlap_top_k": -53.114280700683594,
        "interaction_matrix_overlap_bottom_k": 76.3102798461914,
        "effective_rank": -46.33253860473633,
        "effective_rank_mergeability_score": 60.363121032714844,
        "stable_rank": -12.166237831115723,
        "spectral_gap": 33.985660552978516,
        "singular_value_ratio": 12.785435676574707,
        "layerwise_effective_rank": 12.433923721313477,
        "layerwise_effective_rank_mergeability_score": -55.007450103759766,
        "task_vector_cosine_similarity": 6.2922892570495605,
        "task_vector_l2_distance": -72.34312438964844,
        "task_vector_dot_product": 57.47235870361328,
        "weight_space_angle": 72.90451049804688,
        "task_vector_magnitude_ratio": 35.9095458984375,
        "singular_value_overlap": -19.434919357299805,
        "subspace_overlap": -14.383398056030273,
        "right_subspace_overlap": 7.94785213470459,
        "encoder_gradient_cosine_similarity": 3.1097183227539062,
        "encoder_gradient_l2_distance": -75.69548034667969,
        "encoder_gradient_dot_product": 7.1040544509887695,
        "input_gradient_cosine_similarity": 4.462813377380371,
        "input_gradient_l2_distance": -49.635929107666016,
        "input_gradient_dot_product": -33.24272918701172
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5030645025087592,
      "val_r": 0.47015844980365146,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 30.430320739746094,
        "right_subspace_overlap_bottom_k": 9.342302322387695,
        "interaction_matrix_overlap_top_k": -10.610379219055176,
        "interaction_matrix_overlap_bottom_k": 29.569334030151367,
        "effective_rank": 17.50119400024414,
        "effective_rank_mergeability_score": 8.9680757522583,
        "stable_rank": 4.15904426574707,
        "spectral_gap": 16.7138614654541,
        "singular_value_ratio": 3.464359760284424,
        "layerwise_effective_rank": 9.963279724121094,
        "layerwise_effective_rank_mergeability_score": 20.05629539489746,
        "task_vector_cosine_similarity": -15.608606338500977,
        "task_vector_l2_distance": -39.64502716064453,
        "task_vector_dot_product": -8.45919418334961,
        "weight_space_angle": 1.4570444822311401,
        "task_vector_magnitude_ratio": -12.994205474853516,
        "singular_value_overlap": -45.4717903137207,
        "subspace_overlap": 32.190731048583984,
        "right_subspace_overlap": 25.35483741760254,
        "encoder_gradient_cosine_similarity": -4.529555320739746,
        "encoder_gradient_l2_distance": -29.989044189453125,
        "encoder_gradient_dot_product": 2.8434348106384277,
        "input_gradient_cosine_similarity": 23.427230834960938,
        "input_gradient_l2_distance": -45.91779327392578,
        "input_gradient_dot_product": -21.217273712158203
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.43497390105830996,
      "val_r": 0.43893015703367433,
      "n_iterations": 502,
      "coefficients": {
        "right_subspace_overlap_top_k": 39.26821517944336,
        "right_subspace_overlap_bottom_k": 34.53630065917969,
        "interaction_matrix_overlap_top_k": 5.755978107452393,
        "interaction_matrix_overlap_bottom_k": 50.7833366394043,
        "effective_rank": 12.63242244720459,
        "effective_rank_mergeability_score": -19.273468017578125,
        "stable_rank": -63.63522720336914,
        "spectral_gap": 5.2849650382995605,
        "singular_value_ratio": -23.802385330200195,
        "layerwise_effective_rank": 7.549988746643066,
        "layerwise_effective_rank_mergeability_score": -22.420076370239258,
        "task_vector_cosine_similarity": 22.635046005249023,
        "task_vector_l2_distance": -54.61371612548828,
        "task_vector_dot_product": 1.950408935546875,
        "weight_space_angle": 1.4450477361679077,
        "task_vector_magnitude_ratio": -5.053354740142822,
        "singular_value_overlap": -91.01947784423828,
        "subspace_overlap": 113.67705535888672,
        "right_subspace_overlap": -11.95635986328125,
        "encoder_gradient_cosine_similarity": 23.4834041595459,
        "encoder_gradient_l2_distance": -22.577468872070312,
        "encoder_gradient_dot_product": 12.386656761169434,
        "input_gradient_cosine_similarity": 56.80369567871094,
        "input_gradient_l2_distance": -17.767169952392578,
        "input_gradient_dot_product": -55.07686233520508
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5376445885751981,
      "val_r": 0.09642133643704012,
      "n_iterations": 631,
      "coefficients": {
        "right_subspace_overlap_top_k": 59.997188568115234,
        "right_subspace_overlap_bottom_k": 43.304691314697266,
        "interaction_matrix_overlap_top_k": -15.09920883178711,
        "interaction_matrix_overlap_bottom_k": 57.66963195800781,
        "effective_rank": 33.4681510925293,
        "effective_rank_mergeability_score": 45.4794921875,
        "stable_rank": 38.84962463378906,
        "spectral_gap": -47.14390182495117,
        "singular_value_ratio": -53.46923828125,
        "layerwise_effective_rank": -11.554999351501465,
        "layerwise_effective_rank_mergeability_score": 23.475278854370117,
        "task_vector_cosine_similarity": 16.741722106933594,
        "task_vector_l2_distance": -48.5473518371582,
        "task_vector_dot_product": -46.494728088378906,
        "weight_space_angle": 28.357898712158203,
        "task_vector_magnitude_ratio": -22.828407287597656,
        "singular_value_overlap": -65.5177001953125,
        "subspace_overlap": 25.114295959472656,
        "right_subspace_overlap": 2.273941993713379,
        "encoder_gradient_cosine_similarity": 14.639039039611816,
        "encoder_gradient_l2_distance": -55.85928726196289,
        "encoder_gradient_dot_product": 8.160496711730957,
        "input_gradient_cosine_similarity": 19.68368148803711,
        "input_gradient_l2_distance": -44.876277923583984,
        "input_gradient_dot_product": -4.826417922973633
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.68519494429954,
      "val_r": 0.5126941103666305,
      "n_iterations": 748,
      "coefficients": {
        "right_subspace_overlap_top_k": 64.12710571289062,
        "right_subspace_overlap_bottom_k": -17.364288330078125,
        "interaction_matrix_overlap_top_k": 18.580259323120117,
        "interaction_matrix_overlap_bottom_k": 11.788349151611328,
        "effective_rank": -5.9719319343566895,
        "effective_rank_mergeability_score": -17.238828659057617,
        "stable_rank": -39.016963958740234,
        "spectral_gap": -5.3347063064575195,
        "singular_value_ratio": 9.357769012451172,
        "layerwise_effective_rank": -5.363479137420654,
        "layerwise_effective_rank_mergeability_score": 16.96213150024414,
        "task_vector_cosine_similarity": 12.859148979187012,
        "task_vector_l2_distance": -2.8919765949249268,
        "task_vector_dot_product": 20.34030532836914,
        "weight_space_angle": 34.219642639160156,
        "task_vector_magnitude_ratio": 11.221487045288086,
        "singular_value_overlap": -19.50408172607422,
        "subspace_overlap": -2.0107338428497314,
        "right_subspace_overlap": -19.48385238647461,
        "encoder_gradient_cosine_similarity": 17.88859748840332,
        "encoder_gradient_l2_distance": -15.101758003234863,
        "encoder_gradient_dot_product": 15.80224609375,
        "input_gradient_cosine_similarity": 5.907066345214844,
        "input_gradient_l2_distance": -60.29434585571289,
        "input_gradient_dot_product": -28.479198455810547
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5749012382276872,
      "val_r": 0.2599602828500406,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -6.387409210205078,
        "right_subspace_overlap_bottom_k": 6.282735824584961,
        "interaction_matrix_overlap_top_k": -3.3746631145477295,
        "interaction_matrix_overlap_bottom_k": 9.426509857177734,
        "effective_rank": 9.773122787475586,
        "effective_rank_mergeability_score": 5.073939800262451,
        "stable_rank": 1.3595784902572632,
        "spectral_gap": -2.620086431503296,
        "singular_value_ratio": -4.467862606048584,
        "layerwise_effective_rank": 4.0462870597839355,
        "layerwise_effective_rank_mergeability_score": 7.379185199737549,
        "task_vector_cosine_similarity": 12.188231468200684,
        "task_vector_l2_distance": -9.334653854370117,
        "task_vector_dot_product": -5.563469409942627,
        "weight_space_angle": 6.208045482635498,
        "task_vector_magnitude_ratio": -5.019260406494141,
        "singular_value_overlap": -6.668161392211914,
        "subspace_overlap": 3.986131191253662,
        "right_subspace_overlap": 1.0283297300338745,
        "encoder_gradient_cosine_similarity": -0.6115270256996155,
        "encoder_gradient_l2_distance": -10.919710159301758,
        "encoder_gradient_dot_product": 2.6051011085510254,
        "input_gradient_cosine_similarity": 2.8058226108551025,
        "input_gradient_l2_distance": -11.520487785339355,
        "input_gradient_dot_product": -4.6759934425354
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}