{
  "aggregate_metrics": {
    "train_r": 0.15923390913506355,
    "train_p": 9.624824492038067e-20,
    "val_r": 0.06408345766701232,
    "val_p": 0.22646350919288885
  },
  "per_fold_stats": {
    "train_r_mean": 0.4490951683665833,
    "train_r_std": 0.09751538772917104,
    "val_r_mean": 0.3367790148432278,
    "val_r_std": 0.19558157311139543
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 16.711137771606445,
    "right_subspace_overlap_bottom_k": 13.105685234069824,
    "interaction_matrix_overlap_top_k": 16.15176010131836,
    "interaction_matrix_overlap_bottom_k": 31.36733627319336,
    "effective_rank": -18.38064956665039,
    "effective_rank_mergeability_score": 7.255045413970947,
    "stable_rank": -13.513788223266602,
    "spectral_gap": -13.051432609558105,
    "singular_value_ratio": -10.776240348815918,
    "layerwise_effective_rank": 14.813491821289062,
    "layerwise_effective_rank_mergeability_score": -3.620401382446289,
    "task_vector_cosine_similarity": 11.677420616149902,
    "task_vector_l2_distance": -19.195262908935547,
    "task_vector_dot_product": 8.681769371032715,
    "weight_space_angle": 3.894869327545166,
    "task_vector_magnitude_ratio": -4.699292182922363,
    "singular_value_overlap": -27.664485931396484,
    "subspace_overlap": 22.26282501220703,
    "right_subspace_overlap": 15.681843757629395,
    "activation_l2_distance": -10.562708854675293,
    "activation_cosine_similarity": 8.936807632446289,
    "activation_magnitude_ratio": -2.692319631576538,
    "activation_dot_product": -6.500173091888428,
    "encoder_gradient_cosine_similarity": 22.75579261779785,
    "encoder_gradient_l2_distance": -25.241466522216797,
    "encoder_gradient_dot_product": 14.642127990722656,
    "input_gradient_cosine_similarity": 15.523633003234863,
    "input_gradient_l2_distance": -42.31437301635742,
    "input_gradient_dot_product": -24.25777244567871
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 23.270946502685547,
    "right_subspace_overlap_bottom_k": 29.048429489135742,
    "interaction_matrix_overlap_top_k": 46.11623001098633,
    "interaction_matrix_overlap_bottom_k": 29.757341384887695,
    "effective_rank": 61.37198257446289,
    "effective_rank_mergeability_score": 21.038925170898438,
    "stable_rank": 44.821956634521484,
    "spectral_gap": 69.1725845336914,
    "singular_value_ratio": 32.227176666259766,
    "layerwise_effective_rank": 44.15179443359375,
    "layerwise_effective_rank_mergeability_score": 44.7409553527832,
    "task_vector_cosine_similarity": 44.80790328979492,
    "task_vector_l2_distance": 20.449169158935547,
    "task_vector_dot_product": 46.0932502746582,
    "weight_space_angle": 24.93490219116211,
    "task_vector_magnitude_ratio": 11.142478942871094,
    "singular_value_overlap": 25.922319412231445,
    "subspace_overlap": 20.240753173828125,
    "right_subspace_overlap": 18.50063133239746,
    "activation_l2_distance": 17.274446487426758,
    "activation_cosine_similarity": 27.9848575592041,
    "activation_magnitude_ratio": 23.907594680786133,
    "activation_dot_product": 32.69023895263672,
    "encoder_gradient_cosine_similarity": 55.465538024902344,
    "encoder_gradient_l2_distance": 24.88446807861328,
    "encoder_gradient_dot_product": 14.228562355041504,
    "input_gradient_cosine_similarity": 21.382102966308594,
    "input_gradient_l2_distance": 74.28459167480469,
    "input_gradient_dot_product": 22.06572914123535
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.1833975609579077,
      "val_r": 0.39472848928251697,
      "n_iterations": 354,
      "coefficients": {
        "right_subspace_overlap_top_k": 33.7823600769043,
        "right_subspace_overlap_bottom_k": -69.57169342041016,
        "interaction_matrix_overlap_top_k": 199.81246948242188,
        "interaction_matrix_overlap_bottom_k": 120.3124771118164,
        "effective_rank": -274.7010192871094,
        "effective_rank_mergeability_score": 77.66661834716797,
        "stable_rank": -193.24765014648438,
        "spectral_gap": -310.7374267578125,
        "singular_value_ratio": -74.87483978271484,
        "layerwise_effective_rank": 191.6025390625,
        "layerwise_effective_rank_mergeability_score": -190.6361083984375,
        "task_vector_cosine_similarity": 196.01956176757812,
        "task_vector_l2_distance": -27.867036819458008,
        "task_vector_dot_product": 167.78515625,
        "weight_space_angle": -81.51100158691406,
        "task_vector_magnitude_ratio": -12.517769813537598,
        "singular_value_overlap": 32.64427185058594,
        "subspace_overlap": 61.79294967651367,
        "right_subspace_overlap": -19.856090545654297,
        "activation_l2_distance": -35.579708099365234,
        "activation_cosine_similarity": 107.58941650390625,
        "activation_magnitude_ratio": 88.62698364257812,
        "activation_dot_product": 102.60125732421875,
        "encoder_gradient_cosine_similarity": 255.64112854003906,
        "encoder_gradient_l2_distance": -8.122688293457031,
        "encoder_gradient_dot_product": -4.031628131866455,
        "input_gradient_cosine_similarity": 20.801353454589844,
        "input_gradient_l2_distance": -348.14495849609375,
        "input_gradient_dot_product": -4.283113956451416
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3739725214703364,
      "val_r": 0.2360915961707123,
      "n_iterations": 523,
      "coefficients": {
        "right_subspace_overlap_top_k": 72.94263458251953,
        "right_subspace_overlap_bottom_k": 66.43067932128906,
        "interaction_matrix_overlap_top_k": -25.66248893737793,
        "interaction_matrix_overlap_bottom_k": 74.74834442138672,
        "effective_rank": -33.95208740234375,
        "effective_rank_mergeability_score": -23.532194137573242,
        "stable_rank": 3.2701594829559326,
        "spectral_gap": -5.491231441497803,
        "singular_value_ratio": -106.6242904663086,
        "layerwise_effective_rank": 31.509178161621094,
        "layerwise_effective_rank_mergeability_score": 8.745226860046387,
        "task_vector_cosine_similarity": -10.892016410827637,
        "task_vector_l2_distance": -25.692081451416016,
        "task_vector_dot_product": 95.55133819580078,
        "weight_space_angle": 36.03120803833008,
        "task_vector_magnitude_ratio": -4.725044250488281,
        "singular_value_overlap": -33.52662658691406,
        "subspace_overlap": 30.662120819091797,
        "right_subspace_overlap": 29.317180633544922,
        "activation_l2_distance": -14.539753913879395,
        "activation_cosine_similarity": 20.2861270904541,
        "activation_magnitude_ratio": -21.39057159423828,
        "activation_dot_product": -37.706382751464844,
        "encoder_gradient_cosine_similarity": -6.81953239440918,
        "encoder_gradient_l2_distance": -56.40570068359375,
        "encoder_gradient_dot_product": 14.173310279846191,
        "input_gradient_cosine_similarity": -14.739147186279297,
        "input_gradient_l2_distance": -23.21975326538086,
        "input_gradient_dot_product": -37.75159454345703
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5156823370794328,
      "val_r": 0.3783146444000464,
      "n_iterations": 558,
      "coefficients": {
        "right_subspace_overlap_top_k": -3.9985666275024414,
        "right_subspace_overlap_bottom_k": 38.556793212890625,
        "interaction_matrix_overlap_top_k": 50.10338592529297,
        "interaction_matrix_overlap_bottom_k": 26.77780532836914,
        "effective_rank": 10.737663269042969,
        "effective_rank_mergeability_score": 4.803597450256348,
        "stable_rank": -14.856518745422363,
        "spectral_gap": 0.3185539245605469,
        "singular_value_ratio": -5.507349491119385,
        "layerwise_effective_rank": 11.136432647705078,
        "layerwise_effective_rank_mergeability_score": 20.980138778686523,
        "task_vector_cosine_similarity": 5.049074172973633,
        "task_vector_l2_distance": -38.813785552978516,
        "task_vector_dot_product": -1.4611616134643555,
        "weight_space_angle": 18.424457550048828,
        "task_vector_magnitude_ratio": -9.801222801208496,
        "singular_value_overlap": -67.53485870361328,
        "subspace_overlap": 17.98138999938965,
        "right_subspace_overlap": 25.319116592407227,
        "activation_l2_distance": 2.284151554107666,
        "activation_cosine_similarity": 20.452939987182617,
        "activation_magnitude_ratio": -19.400653839111328,
        "activation_dot_product": -39.105499267578125,
        "encoder_gradient_cosine_similarity": 4.962991714477539,
        "encoder_gradient_l2_distance": -21.347015380859375,
        "encoder_gradient_dot_product": 17.172964096069336,
        "input_gradient_cosine_similarity": 25.638885498046875,
        "input_gradient_l2_distance": -36.91345977783203,
        "input_gradient_dot_product": -40.9627571105957
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.48284558014968276,
      "val_r": 0.41254803928917605,
      "n_iterations": 296,
      "coefficients": {
        "right_subspace_overlap_top_k": 11.946456909179688,
        "right_subspace_overlap_bottom_k": 18.537273406982422,
        "interaction_matrix_overlap_top_k": 7.867680072784424,
        "interaction_matrix_overlap_bottom_k": 38.11231231689453,
        "effective_rank": 8.113991737365723,
        "effective_rank_mergeability_score": 11.163917541503906,
        "stable_rank": -31.219018936157227,
        "spectral_gap": -8.63302230834961,
        "singular_value_ratio": -3.8380343914031982,
        "layerwise_effective_rank": 36.71833038330078,
        "layerwise_effective_rank_mergeability_score": 20.084243774414062,
        "task_vector_cosine_similarity": -20.624277114868164,
        "task_vector_l2_distance": -33.68889617919922,
        "task_vector_dot_product": 7.199121475219727,
        "weight_space_angle": 28.809728622436523,
        "task_vector_magnitude_ratio": -12.399049758911133,
        "singular_value_overlap": -35.44363784790039,
        "subspace_overlap": 46.84593200683594,
        "right_subspace_overlap": 28.16006088256836,
        "activation_l2_distance": -38.48590087890625,
        "activation_cosine_similarity": -35.88306427001953,
        "activation_magnitude_ratio": -23.962703704833984,
        "activation_dot_product": -1.1806741952896118,
        "encoder_gradient_cosine_similarity": 6.251875877380371,
        "encoder_gradient_l2_distance": -20.40985679626465,
        "encoder_gradient_dot_product": 7.928750038146973,
        "input_gradient_cosine_similarity": 25.333663940429688,
        "input_gradient_l2_distance": -27.561195373535156,
        "input_gradient_dot_product": -8.748588562011719
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4119895664963937,
      "val_r": 0.36492827926740956,
      "n_iterations": 75,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.015289306640625,
        "right_subspace_overlap_bottom_k": 10.613809585571289,
        "interaction_matrix_overlap_top_k": 12.023971557617188,
        "interaction_matrix_overlap_bottom_k": 4.645997524261475,
        "effective_rank": 0.16854725778102875,
        "effective_rank_mergeability_score": -5.947492599487305,
        "stable_rank": -2.8025453090667725,
        "spectral_gap": 1.5257140398025513,
        "singular_value_ratio": -1.4469791650772095,
        "layerwise_effective_rank": -0.47397881746292114,
        "layerwise_effective_rank_mergeability_score": 1.8035624027252197,
        "task_vector_cosine_similarity": -1.4057060480117798,
        "task_vector_l2_distance": -1.9719911813735962,
        "task_vector_dot_product": -4.768651008605957,
        "weight_space_angle": -5.011664390563965,
        "task_vector_magnitude_ratio": -2.4422945976257324,
        "singular_value_overlap": -8.003402709960938,
        "subspace_overlap": -1.6826368570327759,
        "right_subspace_overlap": -1.2331578731536865,
        "activation_l2_distance": 1.2034714221954346,
        "activation_cosine_similarity": 8.802454948425293,
        "activation_magnitude_ratio": -3.4923269748687744,
        "activation_dot_product": -8.517318725585938,
        "encoder_gradient_cosine_similarity": 1.0312381982803345,
        "encoder_gradient_l2_distance": -5.488320350646973,
        "encoder_gradient_dot_product": 6.5371012687683105,
        "input_gradient_cosine_similarity": 7.74590539932251,
        "input_gradient_l2_distance": -1.6428099870681763,
        "input_gradient_dot_product": -5.810729503631592
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.40849001135696245,
      "val_r": 0.6423990667547053,
      "n_iterations": 347,
      "coefficients": {
        "right_subspace_overlap_top_k": 19.378311157226562,
        "right_subspace_overlap_bottom_k": 4.414000988006592,
        "interaction_matrix_overlap_top_k": 41.93049621582031,
        "interaction_matrix_overlap_bottom_k": 5.625819683074951,
        "effective_rank": 3.85734224319458,
        "effective_rank_mergeability_score": -0.27780115604400635,
        "stable_rank": -4.890145778656006,
        "spectral_gap": 31.810508728027344,
        "singular_value_ratio": -10.301708221435547,
        "layerwise_effective_rank": 14.856878280639648,
        "layerwise_effective_rank_mergeability_score": 16.488033294677734,
        "task_vector_cosine_similarity": 22.7652587890625,
        "task_vector_l2_distance": -17.33884048461914,
        "task_vector_dot_product": -14.419088363647461,
        "weight_space_angle": 8.306761741638184,
        "task_vector_magnitude_ratio": 10.774910926818848,
        "singular_value_overlap": -29.758319854736328,
        "subspace_overlap": 11.716530799865723,
        "right_subspace_overlap": 50.197967529296875,
        "activation_l2_distance": -57.716983795166016,
        "activation_cosine_similarity": -8.004096031188965,
        "activation_magnitude_ratio": -1.4646905660629272,
        "activation_dot_product": -44.882450103759766,
        "encoder_gradient_cosine_similarity": 27.984472274780273,
        "encoder_gradient_l2_distance": -38.32186508178711,
        "encoder_gradient_dot_product": 22.624216079711914,
        "input_gradient_cosine_similarity": 56.35320281982422,
        "input_gradient_l2_distance": -67.30731964111328,
        "input_gradient_dot_product": -53.40552520751953
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5658595915502538,
      "val_r": -0.022928866360455186,
      "n_iterations": 55,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.1832762956619263,
        "right_subspace_overlap_bottom_k": 1.991315484046936,
        "interaction_matrix_overlap_top_k": -0.4341607689857483,
        "interaction_matrix_overlap_bottom_k": -0.1340404599905014,
        "effective_rank": 0.48029839992523193,
        "effective_rank_mergeability_score": 1.4233580827713013,
        "stable_rank": 1.030864953994751,
        "spectral_gap": 0.6115174293518066,
        "singular_value_ratio": -0.18882526457309723,
        "layerwise_effective_rank": 0.5712195634841919,
        "layerwise_effective_rank_mergeability_score": 0.7579072117805481,
        "task_vector_cosine_similarity": -0.3237886130809784,
        "task_vector_l2_distance": -1.4155635833740234,
        "task_vector_dot_product": -0.14483240246772766,
        "weight_space_angle": 1.3876525163650513,
        "task_vector_magnitude_ratio": 0.04405241087079048,
        "singular_value_overlap": -1.0571798086166382,
        "subspace_overlap": -0.18653754889965057,
        "right_subspace_overlap": -0.08427130430936813,
        "activation_l2_distance": -0.9333290457725525,
        "activation_cosine_similarity": -0.17748425900936127,
        "activation_magnitude_ratio": 0.63581782579422,
        "activation_dot_product": -1.123655915260315,
        "encoder_gradient_cosine_similarity": 0.6008909344673157,
        "encoder_gradient_l2_distance": -1.7693984508514404,
        "encoder_gradient_dot_product": 0.9170799255371094,
        "input_gradient_cosine_similarity": -0.15627992153167725,
        "input_gradient_l2_distance": -1.5000227689743042,
        "input_gradient_dot_product": -1.020963191986084
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3287826675719953,
      "val_r": 0.20363637023794195,
      "n_iterations": 52,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.7538300156593323,
        "right_subspace_overlap_bottom_k": 2.650587320327759,
        "interaction_matrix_overlap_top_k": 2.0247106552124023,
        "interaction_matrix_overlap_bottom_k": 1.5301768779754639,
        "effective_rank": -2.895443916320801,
        "effective_rank_mergeability_score": 0.5461181402206421,
        "stable_rank": -0.3121621012687683,
        "spectral_gap": -0.8636996746063232,
        "singular_value_ratio": -0.6636722087860107,
        "layerwise_effective_rank": -0.224516823887825,
        "layerwise_effective_rank_mergeability_score": 0.9221826195716858,
        "task_vector_cosine_similarity": 0.9458122253417969,
        "task_vector_l2_distance": 0.46004417538642883,
        "task_vector_dot_product": -0.6260153651237488,
        "weight_space_angle": 0.000138787436299026,
        "task_vector_magnitude_ratio": 0.23976805806159973,
        "singular_value_overlap": -1.8596471548080444,
        "subspace_overlap": 0.6172904372215271,
        "right_subspace_overlap": 2.5274925231933594,
        "activation_l2_distance": -2.2903900146484375,
        "activation_cosine_similarity": 0.019401533529162407,
        "activation_magnitude_ratio": -0.3165777325630188,
        "activation_dot_product": -1.9649147987365723,
        "encoder_gradient_cosine_similarity": 1.2865123748779297,
        "encoder_gradient_l2_distance": -0.6622827649116516,
        "encoder_gradient_dot_product": 0.022748731076717377,
        "input_gradient_cosine_similarity": 1.296571135520935,
        "input_gradient_l2_distance": -3.097426414489746,
        "input_gradient_dot_product": 0.9024064540863037
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.39946606048476685,
      "val_r": -0.08151487152080722,
      "n_iterations": 404,
      "coefficients": {
        "right_subspace_overlap_top_k": 46.54082489013672,
        "right_subspace_overlap_bottom_k": 12.19614315032959,
        "interaction_matrix_overlap_top_k": 14.784226417541504,
        "interaction_matrix_overlap_bottom_k": 36.04286193847656,
        "effective_rank": -18.386022567749023,
        "effective_rank_mergeability_score": 1.3801661729812622,
        "stable_rank": -45.930721282958984,
        "spectral_gap": 12.900588989257812,
        "singular_value_ratio": -6.0085272789001465,
        "layerwise_effective_rank": 0.9368610382080078,
        "layerwise_effective_rank_mergeability_score": -17.180408477783203,
        "task_vector_cosine_similarity": -3.973141670227051,
        "task_vector_l2_distance": 5.5567474365234375,
        "task_vector_dot_product": 17.523204803466797,
        "weight_space_angle": -17.192842483520508,
        "task_vector_magnitude_ratio": -1.0495620965957642,
        "singular_value_overlap": -39.776817321777344,
        "subspace_overlap": 13.36234188079834,
        "right_subspace_overlap": 57.34178924560547,
        "activation_l2_distance": -18.023637771606445,
        "activation_cosine_similarity": 34.18147277832031,
        "activation_magnitude_ratio": -16.839643478393555,
        "activation_dot_product": -62.91304397583008,
        "encoder_gradient_cosine_similarity": 61.469642639160156,
        "encoder_gradient_l2_distance": -34.20729446411133,
        "encoder_gradient_dot_product": 58.269412994384766,
        "input_gradient_cosine_similarity": 2.793572425842285,
        "input_gradient_l2_distance": -41.77680587768555,
        "input_gradient_dot_product": -51.02519607543945
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.49043479888401886,
      "val_r": 0.5506082377068063,
      "n_iterations": 83,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.9741798639297485,
        "right_subspace_overlap_bottom_k": 4.125815391540527,
        "interaction_matrix_overlap_top_k": 1.0604592561721802,
        "interaction_matrix_overlap_bottom_k": 1.0310685634613037,
        "effective_rank": 1.810408115386963,
        "effective_rank_mergeability_score": 0.025593632832169533,
        "stable_rank": 1.2235087156295776,
        "spectral_gap": 3.171002149581909,
        "singular_value_ratio": -0.9892452359199524,
        "layerwise_effective_rank": -0.07573864609003067,
        "layerwise_effective_rank_mergeability_score": -0.09369350224733353,
        "task_vector_cosine_similarity": -0.6112645268440247,
        "task_vector_l2_distance": -3.748342275619507,
        "task_vector_dot_product": 0.3495250344276428,
        "weight_space_angle": 0.5068994760513306,
        "task_vector_magnitude_ratio": -1.460881233215332,
        "singular_value_overlap": -3.9121885299682617,
        "subspace_overlap": 3.4261159896850586,
        "right_subspace_overlap": 1.148666262626648,
        "activation_l2_distance": -1.3125237226486206,
        "activation_cosine_similarity": 4.225404739379883,
        "activation_magnitude_ratio": -1.9595775604248047,
        "activation_dot_product": -4.006145477294922,
        "encoder_gradient_cosine_similarity": 0.3649369180202484,
        "encoder_gradient_l2_distance": -1.9661049842834473,
        "encoder_gradient_dot_product": 4.585156440734863,
        "input_gradient_cosine_similarity": 2.121958017349243,
        "input_gradient_l2_distance": -6.049075603485107,
        "input_gradient_dot_product": -3.981506586074829
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.38152863231153894,
      "val_r": 0.3429694725967123,
      "n_iterations": 229,
      "coefficients": {
        "right_subspace_overlap_top_k": 31.98041534423828,
        "right_subspace_overlap_bottom_k": 10.36723804473877,
        "interaction_matrix_overlap_top_k": -29.062082290649414,
        "interaction_matrix_overlap_bottom_k": 52.27055740356445,
        "effective_rank": 2.1884706020355225,
        "effective_rank_mergeability_score": -10.186333656311035,
        "stable_rank": -26.33251190185547,
        "spectral_gap": -18.57233238220215,
        "singular_value_ratio": -44.46134948730469,
        "layerwise_effective_rank": 9.721098899841309,
        "layerwise_effective_rank_mergeability_score": -3.944652795791626,
        "task_vector_cosine_similarity": -10.182296752929688,
        "task_vector_l2_distance": -36.111244201660156,
        "task_vector_dot_product": 22.169553756713867,
        "weight_space_angle": 5.884143829345703,
        "task_vector_magnitude_ratio": 7.463071823120117,
        "singular_value_overlap": -37.588191986083984,
        "subspace_overlap": 9.277053833007812,
        "right_subspace_overlap": 10.095389366149902,
        "activation_l2_distance": -3.7143990993499756,
        "activation_cosine_similarity": -14.559370040893555,
        "activation_magnitude_ratio": -3.056083917617798,
        "activation_dot_product": 12.588951110839844,
        "encoder_gradient_cosine_similarity": 19.95241928100586,
        "encoder_gradient_l2_distance": -20.090373992919922,
        "encoder_gradient_dot_product": 23.302303314208984,
        "input_gradient_cosine_similarity": 20.85140609741211,
        "input_gradient_l2_distance": 5.044073581695557,
        "input_gradient_dot_product": 15.699126243591309
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5014431024144844,
      "val_r": 0.49442561432316096,
      "n_iterations": 592,
      "coefficients": {
        "right_subspace_overlap_top_k": -37.45170593261719,
        "right_subspace_overlap_bottom_k": 54.20201110839844,
        "interaction_matrix_overlap_top_k": 24.594135284423828,
        "interaction_matrix_overlap_bottom_k": 18.896392822265625,
        "effective_rank": 18.60120391845703,
        "effective_rank_mergeability_score": 22.886627197265625,
        "stable_rank": -23.528329849243164,
        "spectral_gap": -14.60195255279541,
        "singular_value_ratio": -12.206375122070312,
        "layerwise_effective_rank": 49.30796813964844,
        "layerwise_effective_rank_mergeability_score": 40.54175567626953,
        "task_vector_cosine_similarity": -23.688207626342773,
        "task_vector_l2_distance": -56.30147171020508,
        "task_vector_dot_product": 31.81476593017578,
        "weight_space_angle": 33.25682830810547,
        "task_vector_magnitude_ratio": -5.621145725250244,
        "singular_value_overlap": -59.69763946533203,
        "subspace_overlap": 61.9791374206543,
        "right_subspace_overlap": 12.245176315307617,
        "activation_l2_distance": -10.525601387023926,
        "activation_cosine_similarity": -7.837285995483398,
        "activation_magnitude_ratio": -12.457656860351562,
        "activation_dot_product": -14.776416778564453,
        "encoder_gradient_cosine_similarity": 10.642220497131348,
        "encoder_gradient_l2_distance": -28.820161819458008,
        "encoder_gradient_dot_product": 11.052775382995605,
        "input_gradient_cosine_similarity": -21.203720092773438,
        "input_gradient_l2_distance": -30.56589698791504,
        "input_gradient_dot_product": -29.739776611328125
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.42686453382225215,
      "val_r": 0.3045971781955734,
      "n_iterations": 83,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.49407508969306946,
        "right_subspace_overlap_bottom_k": 3.642632246017456,
        "interaction_matrix_overlap_top_k": 0.7825307250022888,
        "interaction_matrix_overlap_bottom_k": 4.3103766441345215,
        "effective_rank": 3.3544981479644775,
        "effective_rank_mergeability_score": 0.28021714091300964,
        "stable_rank": -1.1846860647201538,
        "spectral_gap": 1.1597906351089478,
        "singular_value_ratio": -1.1987006664276123,
        "layerwise_effective_rank": -3.5145530700683594,
        "layerwise_effective_rank_mergeability_score": -0.49723324179649353,
        "task_vector_cosine_similarity": 2.6719372272491455,
        "task_vector_l2_distance": -0.5307047367095947,
        "task_vector_dot_product": -0.7946443557739258,
        "weight_space_angle": -0.6564778089523315,
        "task_vector_magnitude_ratio": -0.9169272184371948,
        "singular_value_overlap": -5.955835342407227,
        "subspace_overlap": 2.785759210586548,
        "right_subspace_overlap": 3.961338758468628,
        "activation_l2_distance": -1.7527810335159302,
        "activation_cosine_similarity": 0.03218934312462807,
        "activation_magnitude_ratio": -1.143847107887268,
        "activation_dot_product": -2.6460180282592773,
        "encoder_gradient_cosine_similarity": 2.1690826416015625,
        "encoder_gradient_l2_distance": -3.1594648361206055,
        "encoder_gradient_dot_product": 4.147167682647705,
        "input_gradient_cosine_similarity": 2.8029050827026367,
        "input_gradient_l2_distance": -2.286545991897583,
        "input_gradient_dot_product": -4.385603427886963
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4816740455917171,
      "val_r": 0.5824645144763154,
      "n_iterations": 383,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.917211532592773,
        "right_subspace_overlap_bottom_k": 30.297874450683594,
        "interaction_matrix_overlap_top_k": 12.0886869430542,
        "interaction_matrix_overlap_bottom_k": 48.959495544433594,
        "effective_rank": -14.176939964294434,
        "effective_rank_mergeability_score": 25.70057487487793,
        "stable_rank": 4.500184535980225,
        "spectral_gap": 21.455434799194336,
        "singular_value_ratio": 15.65548324584961,
        "layerwise_effective_rank": -0.11762456595897675,
        "layerwise_effective_rank_mergeability_score": -10.250749588012695,
        "task_vector_cosine_similarity": 24.724864959716797,
        "task_vector_l2_distance": -37.62361526489258,
        "task_vector_dot_product": -30.357229232788086,
        "weight_space_angle": 6.851110458374023,
        "task_vector_magnitude_ratio": 6.202269077301025,
        "singular_value_overlap": -32.18167495727539,
        "subspace_overlap": 32.438968658447266,
        "right_subspace_overlap": 3.0932705402374268,
        "activation_l2_distance": -12.127423286437988,
        "activation_cosine_similarity": 3.832002639770508,
        "activation_magnitude_ratio": -14.259940147399902,
        "activation_dot_product": -32.91957092285156,
        "encoder_gradient_cosine_similarity": 16.220521926879883,
        "encoder_gradient_l2_distance": -40.2974967956543,
        "encoder_gradient_dot_product": 18.84444808959961,
        "input_gradient_cosine_similarity": 23.241491317749023,
        "input_gradient_l2_distance": -38.251468658447266,
        "input_gradient_dot_product": -40.46385955810547
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4592168282268681,
      "val_r": 0.5334924202178155,
      "n_iterations": 445,
      "coefficients": {
        "right_subspace_overlap_top_k": 18.274494171142578,
        "right_subspace_overlap_bottom_k": 1.2132484912872314,
        "interaction_matrix_overlap_top_k": 17.20093536376953,
        "interaction_matrix_overlap_bottom_k": 23.978368759155273,
        "effective_rank": -12.496602058410645,
        "effective_rank_mergeability_score": 2.9384570121765137,
        "stable_rank": 29.233970642089844,
        "spectral_gap": 1.7921323776245117,
        "singular_value_ratio": -6.228879451751709,
        "layerwise_effective_rank": -5.237371444702148,
        "layerwise_effective_rank_mergeability_score": 6.152126312255859,
        "task_vector_cosine_similarity": -3.0214052200317383,
        "task_vector_l2_distance": -12.369407653808594,
        "task_vector_dot_product": -45.606109619140625,
        "weight_space_angle": 17.026296615600586,
        "task_vector_magnitude_ratio": -12.599416732788086,
        "singular_value_overlap": -37.33936309814453,
        "subspace_overlap": 50.71487808227539,
        "right_subspace_overlap": 6.132899284362793,
        "activation_l2_distance": 0.28788942098617554,
        "activation_cosine_similarity": 4.967314720153809,
        "activation_magnitude_ratio": -9.416576385498047,
        "activation_dot_product": -0.4163101017475128,
        "encoder_gradient_cosine_similarity": -0.29084986448287964,
        "encoder_gradient_l2_distance": -6.6208295822143555,
        "encoder_gradient_dot_product": 12.573670387268066,
        "input_gradient_cosine_similarity": 15.716835975646973,
        "input_gradient_l2_distance": -28.12563133239746,
        "input_gradient_dot_product": -27.438013076782227
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.45771788023423765,
      "val_r": 0.38211522660184133,
      "n_iterations": 327,
      "coefficients": {
        "right_subspace_overlap_top_k": 16.95616912841797,
        "right_subspace_overlap_bottom_k": 19.075435638427734,
        "interaction_matrix_overlap_top_k": 14.339154243469238,
        "interaction_matrix_overlap_bottom_k": 34.0393180847168,
        "effective_rank": -0.9842838644981384,
        "effective_rank_mergeability_score": 3.788036346435547,
        "stable_rank": 3.3644936084747314,
        "spectral_gap": 8.648632049560547,
        "singular_value_ratio": 5.190222263336182,
        "layerwise_effective_rank": -3.2651336193084717,
        "layerwise_effective_rank_mergeability_score": 5.076052188873291,
        "task_vector_cosine_similarity": 9.035706520080566,
        "task_vector_l2_distance": -32.5142707824707,
        "task_vector_dot_product": -7.154217720031738,
        "weight_space_angle": -19.190488815307617,
        "task_vector_magnitude_ratio": -15.159873962402344,
        "singular_value_overlap": -38.907161712646484,
        "subspace_overlap": 13.604887008666992,
        "right_subspace_overlap": 27.939285278320312,
        "activation_l2_distance": -1.360852837562561,
        "activation_cosine_similarity": 4.982470989227295,
        "activation_magnitude_ratio": -10.949188232421875,
        "activation_dot_product": -8.288644790649414,
        "encoder_gradient_cosine_similarity": -3.5315539836883545,
        "encoder_gradient_l2_distance": -22.439239501953125,
        "encoder_gradient_dot_product": 18.381723403930664,
        "input_gradient_cosine_similarity": 36.192840576171875,
        "input_gradient_l2_distance": -24.140111923217773,
        "input_gradient_dot_product": -31.733888626098633
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4237078814565544,
      "val_r": 0.2939549697525012,
      "n_iterations": 69,
      "coefficients": {
        "right_subspace_overlap_top_k": 8.493319511413574,
        "right_subspace_overlap_bottom_k": 4.375002861022949,
        "interaction_matrix_overlap_top_k": 4.263698577880859,
        "interaction_matrix_overlap_bottom_k": 4.7767791748046875,
        "effective_rank": -1.0288420915603638,
        "effective_rank_mergeability_score": -0.011696141213178635,
        "stable_rank": -0.42826366424560547,
        "spectral_gap": -2.1651854515075684,
        "singular_value_ratio": -3.7297136783599854,
        "layerwise_effective_rank": -0.6103392839431763,
        "layerwise_effective_rank_mergeability_score": 1.3732361793518066,
        "task_vector_cosine_similarity": 5.384461879730225,
        "task_vector_l2_distance": 1.329774260520935,
        "task_vector_dot_product": -8.659636497497559,
        "weight_space_angle": 2.983250856399536,
        "task_vector_magnitude_ratio": 0.5105645656585693,
        "singular_value_overlap": -4.226054668426514,
        "subspace_overlap": 4.043556213378906,
        "right_subspace_overlap": -2.654179811477661,
        "activation_l2_distance": -1.6168017387390137,
        "activation_cosine_similarity": 2.5176503658294678,
        "activation_magnitude_ratio": -3.6561381816864014,
        "activation_dot_product": -3.1909666061401367,
        "encoder_gradient_cosine_similarity": 2.9168548583984375,
        "encoder_gradient_l2_distance": -3.522364854812622,
        "encoder_gradient_dot_product": 1.712082028388977,
        "input_gradient_cosine_similarity": 1.8004425764083862,
        "input_gradient_l2_distance": -4.697752952575684,
        "input_gradient_dot_product": -5.306332588195801
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5064839226065346,
      "val_r": 0.1341706087719138,
      "n_iterations": 742,
      "coefficients": {
        "right_subspace_overlap_top_k": 46.08221435546875,
        "right_subspace_overlap_bottom_k": 28.12645149230957,
        "interaction_matrix_overlap_top_k": -18.217077255249023,
        "interaction_matrix_overlap_bottom_k": 54.59599685668945,
        "effective_rank": 19.662059783935547,
        "effective_rank_mergeability_score": 41.69078826904297,
        "stable_rank": 19.610450744628906,
        "spectral_gap": 1.3119865655899048,
        "singular_value_ratio": -26.926753997802734,
        "layerwise_effective_rank": -7.126412868499756,
        "layerwise_effective_rank_mergeability_score": 16.55692481994629,
        "task_vector_cosine_similarity": -8.148802757263184,
        "task_vector_l2_distance": -44.07896041870117,
        "task_vector_dot_product": -14.090201377868652,
        "weight_space_angle": 36.52285385131836,
        "task_vector_magnitude_ratio": 8.909921646118164,
        "singular_value_overlap": -42.3029899597168,
        "subspace_overlap": 41.870540618896484,
        "right_subspace_overlap": 30.65882682800293,
        "activation_l2_distance": -32.58709716796875,
        "activation_cosine_similarity": -14.493130683898926,
        "activation_magnitude_ratio": -0.7191047668457031,
        "activation_dot_product": -16.436798095703125,
        "encoder_gradient_cosine_similarity": 14.844064712524414,
        "encoder_gradient_l2_distance": -106.2369155883789,
        "encoder_gradient_dot_product": 15.386117935180664,
        "input_gradient_cosine_similarity": 28.393749237060547,
        "input_gradient_l2_distance": -18.92140007019043,
        "input_gradient_dot_product": -52.93935775756836
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.69046721308676,
      "val_r": 0.52725021921383,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 42.635440826416016,
        "right_subspace_overlap_bottom_k": -31.6908016204834,
        "interaction_matrix_overlap_top_k": -3.7355265617370605,
        "interaction_matrix_overlap_bottom_k": 20.989294052124023,
        "effective_rank": -19.224437713623047,
        "effective_rank_mergeability_score": -9.105240821838379,
        "stable_rank": -10.378081321716309,
        "spectral_gap": 11.379907608032227,
        "singular_value_ratio": 20.572433471679688,
        "layerwise_effective_rank": 6.686361312866211,
        "layerwise_effective_rank_mergeability_score": 17.64106559753418,
        "task_vector_cosine_similarity": 7.0078277587890625,
        "task_vector_l2_distance": 21.29562759399414,
        "task_vector_dot_product": -5.0510711669921875,
        "weight_space_angle": -1.1894237995147705,
        "task_vector_magnitude_ratio": -8.079097747802734,
        "singular_value_overlap": -24.154699325561523,
        "subspace_overlap": 24.90361976623535,
        "right_subspace_overlap": 24.533540725708008,
        "activation_l2_distance": 2.6257853507995605,
        "activation_cosine_similarity": 40.38064193725586,
        "activation_magnitude_ratio": -25.94561767578125,
        "activation_dot_product": 6.319622039794922,
        "encoder_gradient_cosine_similarity": 25.189748764038086,
        "encoder_gradient_l2_distance": -44.6574592590332,
        "encoder_gradient_dot_product": 18.171892166137695,
        "input_gradient_cosine_similarity": 5.210176467895508,
        "input_gradient_l2_distance": -51.479736328125,
        "input_gradient_dot_product": -59.85340118408203
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4918786315789689,
      "val_r": 0.06132908748684063,
      "n_iterations": 515,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.310709476470947,
        "right_subspace_overlap_bottom_k": 52.55989074707031,
        "interaction_matrix_overlap_top_k": -2.72997784614563,
        "interaction_matrix_overlap_bottom_k": 55.83734893798828,
        "effective_rank": -58.741756439208984,
        "effective_rank_mergeability_score": -0.13239647448062897,
        "stable_rank": 22.601255416870117,
        "spectral_gap": 3.9504551887512207,
        "singular_value_ratio": 48.252281188964844,
        "layerwise_effective_rank": -36.13141632080078,
        "layerwise_effective_rank_mergeability_score": -6.927633762359619,
        "task_vector_cosine_similarity": 42.8148193359375,
        "task_vector_l2_distance": -42.48125457763672,
        "task_vector_dot_product": -35.6243896484375,
        "weight_space_angle": 6.657950401306152,
        "task_vector_magnitude_ratio": -41.35811996459961,
        "singular_value_overlap": -82.70774841308594,
        "subspace_overlap": 19.10258674621582,
        "right_subspace_overlap": 24.792564392089844,
        "activation_l2_distance": 14.911738395690918,
        "activation_cosine_similarity": 7.421091556549072,
        "activation_magnitude_ratio": 27.321704864501953,
        "activation_dot_product": 28.561506271362305,
        "encoder_gradient_cosine_similarity": 14.22923755645752,
        "encoder_gradient_l2_distance": -40.284481048583984,
        "encoder_gradient_dot_product": 41.071231842041016,
        "input_gradient_cosine_similarity": 70.27684020996094,
        "input_gradient_l2_distance": -95.65013885498047,
        "input_gradient_dot_product": -42.90678024291992
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}