{
  "excluded_metrics": [
    "interaction_matrix_overlap_bottom_k",
    "interaction_matrix_overlap_top_k",
    "right_subspace_overlap",
    "right_subspace_overlap_bottom_k",
    "right_subspace_overlap_top_k",
    "singular_value_overlap",
    "subspace_overlap"
  ],
  "n_metrics_used": 22,
  "metrics_used": [
    "effective_rank",
    "effective_rank_mergeability_score",
    "stable_rank",
    "spectral_gap",
    "singular_value_ratio",
    "layerwise_effective_rank",
    "layerwise_effective_rank_mergeability_score",
    "task_vector_cosine_similarity",
    "task_vector_l2_distance",
    "task_vector_dot_product",
    "weight_space_angle",
    "task_vector_magnitude_ratio",
    "activation_l2_distance",
    "activation_cosine_similarity",
    "activation_magnitude_ratio",
    "activation_dot_product",
    "encoder_gradient_cosine_similarity",
    "encoder_gradient_l2_distance",
    "encoder_gradient_dot_product",
    "input_gradient_cosine_similarity",
    "input_gradient_l2_distance",
    "input_gradient_dot_product"
  ],
  "methods": {
    "weight_avg": {
      "aggregate_metrics": {
        "train_r": 0.1877017706451737,
        "train_p": 6.191276262081849e-27,
        "val_r": 0.20103644198545956,
        "val_p": 0.000128322958206954
      },
      "per_fold_stats": {
        "train_r_mean": 0.5736383681723893,
        "train_r_std": 0.2504042175751728,
        "val_r_mean": 0.42438359588747876,
        "val_r_std": 0.30383915831625213
      },
      "average_coefficients": {
        "effective_rank": -3.758315324783325,
        "effective_rank_mergeability_score": 10.188277244567871,
        "stable_rank": 12.04945182800293,
        "spectral_gap": -0.4523714482784271,
        "singular_value_ratio": -7.618811130523682,
        "layerwise_effective_rank": 0.8052960634231567,
        "layerwise_effective_rank_mergeability_score": -3.4298012256622314,
        "task_vector_cosine_similarity": 2.7382891178131104,
        "task_vector_l2_distance": 8.70966911315918,
        "task_vector_dot_product": 6.554912567138672,
        "weight_space_angle": -5.9695234298706055,
        "task_vector_magnitude_ratio": -3.175868511199951,
        "activation_l2_distance": -18.18015480041504,
        "activation_cosine_similarity": 18.22173500061035,
        "activation_magnitude_ratio": -8.906698226928711,
        "activation_dot_product": 21.860380172729492,
        "encoder_gradient_cosine_similarity": 16.869836807250977,
        "encoder_gradient_l2_distance": -34.13471221923828,
        "encoder_gradient_dot_product": 13.468910217285156,
        "input_gradient_cosine_similarity": 16.162302017211914,
        "input_gradient_l2_distance": -27.80255699157715,
        "input_gradient_dot_product": -13.201458930969238
      },
      "coefficient_std": {
        "effective_rank": 28.364273071289062,
        "effective_rank_mergeability_score": 25.32481575012207,
        "stable_rank": 36.753089904785156,
        "spectral_gap": 31.437013626098633,
        "singular_value_ratio": 33.98372268676758,
        "layerwise_effective_rank": 26.955015182495117,
        "layerwise_effective_rank_mergeability_score": 25.97682762145996,
        "task_vector_cosine_similarity": 24.003971099853516,
        "task_vector_l2_distance": 35.304710388183594,
        "task_vector_dot_product": 18.406095504760742,
        "weight_space_angle": 33.33672332763672,
        "task_vector_magnitude_ratio": 44.85594940185547,
        "activation_l2_distance": 49.084022521972656,
        "activation_cosine_similarity": 36.91358184814453,
        "activation_magnitude_ratio": 15.024666786193848,
        "activation_dot_product": 28.548110961914062,
        "encoder_gradient_cosine_similarity": 26.470966339111328,
        "encoder_gradient_l2_distance": 46.92348098754883,
        "encoder_gradient_dot_product": 28.15730857849121,
        "input_gradient_cosine_similarity": 26.776174545288086,
        "input_gradient_l2_distance": 33.43470764160156,
        "input_gradient_dot_product": 24.107622146606445
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": -0.04570349493905039,
          "val_r": -0.2655955553301436,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": -6.949795722961426,
            "effective_rank_mergeability_score": -1.0722306966781616,
            "stable_rank": -0.3663243353366852,
            "spectral_gap": 7.193935394287109,
            "singular_value_ratio": 2.2558093070983887,
            "layerwise_effective_rank": 11.354029655456543,
            "layerwise_effective_rank_mergeability_score": -4.5637006759643555,
            "task_vector_cosine_similarity": 5.827106475830078,
            "task_vector_l2_distance": 1.9217569828033447,
            "task_vector_dot_product": -3.097933530807495,
            "weight_space_angle": -5.164436340332031,
            "task_vector_magnitude_ratio": 2.2463619709014893,
            "activation_l2_distance": -7.017400741577148,
            "activation_cosine_similarity": -2.840245246887207,
            "activation_magnitude_ratio": -3.1762888431549072,
            "activation_dot_product": 2.335317611694336,
            "encoder_gradient_cosine_similarity": -7.037820816040039,
            "encoder_gradient_l2_distance": 2.635085105895996,
            "encoder_gradient_dot_product": 2.0204784870147705,
            "input_gradient_cosine_similarity": -3.161983013153076,
            "input_gradient_l2_distance": 2.919093370437622,
            "input_gradient_dot_product": 4.744661331176758
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5665840230496599,
          "val_r": 0.5365080894438957,
          "n_iterations": 567,
          "coefficients": {
            "effective_rank": -12.735401153564453,
            "effective_rank_mergeability_score": 15.218719482421875,
            "stable_rank": 59.3719482421875,
            "spectral_gap": -28.869367599487305,
            "singular_value_ratio": -8.715813636779785,
            "layerwise_effective_rank": -65.8265609741211,
            "layerwise_effective_rank_mergeability_score": -26.35480499267578,
            "task_vector_cosine_similarity": 13.026275634765625,
            "task_vector_l2_distance": 37.4151496887207,
            "task_vector_dot_product": 11.764007568359375,
            "weight_space_angle": -32.50175476074219,
            "task_vector_magnitude_ratio": -47.713401794433594,
            "activation_l2_distance": 23.41571807861328,
            "activation_cosine_similarity": 67.39183044433594,
            "activation_magnitude_ratio": -10.120556831359863,
            "activation_dot_product": 84.1650619506836,
            "encoder_gradient_cosine_similarity": 13.738377571105957,
            "encoder_gradient_l2_distance": -50.75181198120117,
            "encoder_gradient_dot_product": 8.385309219360352,
            "input_gradient_cosine_similarity": 43.25615692138672,
            "input_gradient_l2_distance": -59.33909225463867,
            "input_gradient_dot_product": -33.222633361816406
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7413273336041792,
          "val_r": 0.7877816588842264,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -0.3649028539657593,
            "effective_rank_mergeability_score": -0.22556251287460327,
            "stable_rank": 0.2013067901134491,
            "spectral_gap": 0.03234105929732323,
            "singular_value_ratio": -0.08523250371217728,
            "layerwise_effective_rank": 0.08781342208385468,
            "layerwise_effective_rank_mergeability_score": 0.37714946269989014,
            "task_vector_cosine_similarity": 0.35829538106918335,
            "task_vector_l2_distance": -0.3388618528842926,
            "task_vector_dot_product": 0.27355778217315674,
            "weight_space_angle": 0.39137348532676697,
            "task_vector_magnitude_ratio": 0.11453243345022202,
            "activation_l2_distance": 0.7842167615890503,
            "activation_cosine_similarity": 1.2099906206130981,
            "activation_magnitude_ratio": -0.06738349795341492,
            "activation_dot_product": -0.045404329895973206,
            "encoder_gradient_cosine_similarity": 0.07473544031381607,
            "encoder_gradient_l2_distance": -1.006628155708313,
            "encoder_gradient_dot_product": -0.0015703901881352067,
            "input_gradient_cosine_similarity": 0.10164427757263184,
            "input_gradient_l2_distance": -0.6312002539634705,
            "input_gradient_dot_product": -0.24112094938755035
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7075922234420882,
          "val_r": 0.7160018846534751,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -0.23121590912342072,
            "effective_rank_mergeability_score": 2.474454879760742,
            "stable_rank": -3.4062139987945557,
            "spectral_gap": -0.42015790939331055,
            "singular_value_ratio": -2.3911094665527344,
            "layerwise_effective_rank": 5.2779693603515625,
            "layerwise_effective_rank_mergeability_score": 4.700900077819824,
            "task_vector_cosine_similarity": 2.631774425506592,
            "task_vector_l2_distance": -4.677471160888672,
            "task_vector_dot_product": -0.14680632948875427,
            "weight_space_angle": 1.092189908027649,
            "task_vector_magnitude_ratio": 5.185915946960449,
            "activation_l2_distance": 0.3761330544948578,
            "activation_cosine_similarity": 1.6574604511260986,
            "activation_magnitude_ratio": -0.8073009848594666,
            "activation_dot_product": 8.348931312561035,
            "encoder_gradient_cosine_similarity": 2.1305737495422363,
            "encoder_gradient_l2_distance": -11.978658676147461,
            "encoder_gradient_dot_product": 1.0248342752456665,
            "input_gradient_cosine_similarity": 1.7160557508468628,
            "input_gradient_l2_distance": -8.407828330993652,
            "input_gradient_dot_product": -3.1515562534332275
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.10022738710244423,
          "val_r": -0.07701753833697958,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": -0.9401532411575317,
            "effective_rank_mergeability_score": -1.3012603521347046,
            "stable_rank": -0.15514208376407623,
            "spectral_gap": 1.2369917631149292,
            "singular_value_ratio": -0.6772366166114807,
            "layerwise_effective_rank": -0.4603213667869568,
            "layerwise_effective_rank_mergeability_score": -0.13396714627742767,
            "task_vector_cosine_similarity": -0.5090071558952332,
            "task_vector_l2_distance": 0.16105154156684875,
            "task_vector_dot_product": 0.8895413279533386,
            "weight_space_angle": -0.09055211395025253,
            "task_vector_magnitude_ratio": -0.35916754603385925,
            "activation_l2_distance": -0.8851715922355652,
            "activation_cosine_similarity": 1.3389396667480469,
            "activation_magnitude_ratio": -1.0900251865386963,
            "activation_dot_product": 0.8791757822036743,
            "encoder_gradient_cosine_similarity": 0.7938652038574219,
            "encoder_gradient_l2_distance": 0.4734978675842285,
            "encoder_gradient_dot_product": -0.2634439468383789,
            "input_gradient_cosine_similarity": 1.5306851863861084,
            "input_gradient_l2_distance": 0.8481109142303467,
            "input_gradient_dot_product": -0.2755057215690613
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.7522254105869997,
          "val_r": 0.6821063637247817,
          "n_iterations": 648,
          "coefficients": {
            "effective_rank": 1.575722575187683,
            "effective_rank_mergeability_score": 1.9396976232528687,
            "stable_rank": -1.1992484331130981,
            "spectral_gap": 1.5045520067214966,
            "singular_value_ratio": 0.9300130605697632,
            "layerwise_effective_rank": 2.0287182331085205,
            "layerwise_effective_rank_mergeability_score": 1.7616239786148071,
            "task_vector_cosine_similarity": -1.458923578262329,
            "task_vector_l2_distance": -1.7877644300460815,
            "task_vector_dot_product": -0.0005375179462134838,
            "weight_space_angle": -2.1197142601013184,
            "task_vector_magnitude_ratio": 0.8031673431396484,
            "activation_l2_distance": 0.5405551195144653,
            "activation_cosine_similarity": 2.817683458328247,
            "activation_magnitude_ratio": -0.5600684285163879,
            "activation_dot_product": 1.13280189037323,
            "encoder_gradient_cosine_similarity": 1.1609570980072021,
            "encoder_gradient_l2_distance": -5.058168411254883,
            "encoder_gradient_dot_product": 0.1939309686422348,
            "input_gradient_cosine_similarity": 0.32158660888671875,
            "input_gradient_l2_distance": -1.8817228078842163,
            "input_gradient_dot_product": -1.6453171968460083
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.6945833569333495,
          "val_r": 0.44039274093916303,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 2.7429468631744385,
            "effective_rank_mergeability_score": 4.487942695617676,
            "stable_rank": 1.8231000900268555,
            "spectral_gap": -4.431467056274414,
            "singular_value_ratio": -12.218056678771973,
            "layerwise_effective_rank": -0.1968882828950882,
            "layerwise_effective_rank_mergeability_score": 9.729141235351562,
            "task_vector_cosine_similarity": 1.0256016254425049,
            "task_vector_l2_distance": -18.214839935302734,
            "task_vector_dot_product": 11.541658401489258,
            "weight_space_angle": 4.619645118713379,
            "task_vector_magnitude_ratio": 7.916584491729736,
            "activation_l2_distance": 7.922162055969238,
            "activation_cosine_similarity": 9.785309791564941,
            "activation_magnitude_ratio": 2.330739974975586,
            "activation_dot_product": 18.155248641967773,
            "encoder_gradient_cosine_similarity": 6.9235944747924805,
            "encoder_gradient_l2_distance": -23.18515968322754,
            "encoder_gradient_dot_product": 10.362251281738281,
            "input_gradient_cosine_similarity": 2.6389403343200684,
            "input_gradient_l2_distance": -22.903993606567383,
            "input_gradient_dot_product": -19.85575294494629
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6753603263933059,
          "val_r": 0.3166362502700752,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -4.504055500030518,
            "effective_rank_mergeability_score": 2.7466118335723877,
            "stable_rank": -0.3147001266479492,
            "spectral_gap": 1.2045644521713257,
            "singular_value_ratio": 8.103690147399902,
            "layerwise_effective_rank": 0.16506701707839966,
            "layerwise_effective_rank_mergeability_score": 0.32962408661842346,
            "task_vector_cosine_similarity": 3.1390833854675293,
            "task_vector_l2_distance": -9.991339683532715,
            "task_vector_dot_product": 3.884503126144409,
            "weight_space_angle": 0.1785837560892105,
            "task_vector_magnitude_ratio": -3.201083183288574,
            "activation_l2_distance": 0.9438455104827881,
            "activation_cosine_similarity": 6.2935967445373535,
            "activation_magnitude_ratio": -1.1573708057403564,
            "activation_dot_product": 8.038196563720703,
            "encoder_gradient_cosine_similarity": 3.9913787841796875,
            "encoder_gradient_l2_distance": -17.140262603759766,
            "encoder_gradient_dot_product": 1.5664867162704468,
            "input_gradient_cosine_similarity": 5.140308856964111,
            "input_gradient_l2_distance": -9.323247909545898,
            "input_gradient_dot_product": 0.9051271677017212
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.5913383378101329,
          "val_r": 0.13267521279605204,
          "n_iterations": 597,
          "coefficients": {
            "effective_rank": -81.54327392578125,
            "effective_rank_mergeability_score": 8.344572067260742,
            "stable_rank": 142.29393005371094,
            "spectral_gap": 60.94699478149414,
            "singular_value_ratio": -111.27411651611328,
            "layerwise_effective_rank": 30.585689544677734,
            "layerwise_effective_rank_mergeability_score": 67.91785430908203,
            "task_vector_cosine_similarity": 1.5191971063613892,
            "task_vector_l2_distance": 52.79710388183594,
            "task_vector_dot_product": -42.286415100097656,
            "weight_space_angle": -119.47195434570312,
            "task_vector_magnitude_ratio": 114.42793273925781,
            "activation_l2_distance": -133.89114379882812,
            "activation_cosine_similarity": -32.87437057495117,
            "activation_magnitude_ratio": -27.159887313842773,
            "activation_dot_product": 34.72404098510742,
            "encoder_gradient_cosine_similarity": 58.23405075073242,
            "encoder_gradient_l2_distance": -86.10266876220703,
            "encoder_gradient_dot_product": 88.7999267578125,
            "input_gradient_cosine_similarity": 47.94587707519531,
            "input_gradient_l2_distance": -120.04664611816406,
            "input_gradient_dot_product": 47.11080551147461
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6976095816175445,
          "val_r": 0.6612809177523373,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -0.030795244500041008,
            "effective_rank_mergeability_score": -4.232767581939697,
            "stable_rank": 3.9849536418914795,
            "spectral_gap": 5.6027421951293945,
            "singular_value_ratio": 8.616925239562988,
            "layerwise_effective_rank": -1.860262155532837,
            "layerwise_effective_rank_mergeability_score": 9.56264877319336,
            "task_vector_cosine_similarity": 3.670053005218506,
            "task_vector_l2_distance": -3.8961966037750244,
            "task_vector_dot_product": 0.8722373843193054,
            "weight_space_angle": -0.20459435880184174,
            "task_vector_magnitude_ratio": -3.2421088218688965,
            "activation_l2_distance": 2.2164204120635986,
            "activation_cosine_similarity": 0.7599062323570251,
            "activation_magnitude_ratio": -0.795062780380249,
            "activation_dot_product": -1.9859087467193604,
            "encoder_gradient_cosine_similarity": 2.431565284729004,
            "encoder_gradient_l2_distance": -7.66160774230957,
            "encoder_gradient_dot_product": 2.865762233734131,
            "input_gradient_cosine_similarity": 1.0382747650146484,
            "input_gradient_l2_distance": -12.71165657043457,
            "input_gradient_dot_product": -4.0013203620910645
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5634000240488231,
          "val_r": 0.18843624410595536,
          "n_iterations": 595,
          "coefficients": {
            "effective_rank": 47.31863784790039,
            "effective_rank_mergeability_score": 76.16912841796875,
            "stable_rank": 68.15062713623047,
            "spectral_gap": -98.12654113769531,
            "singular_value_ratio": -85.1376953125,
            "layerwise_effective_rank": -19.52223777770996,
            "layerwise_effective_rank_mergeability_score": -71.71187591552734,
            "task_vector_cosine_similarity": 75.66146087646484,
            "task_vector_l2_distance": 72.3773193359375,
            "task_vector_dot_product": -0.5964272618293762,
            "weight_space_angle": 49.12101745605469,
            "task_vector_magnitude_ratio": -110.31140899658203,
            "activation_l2_distance": -156.07664489746094,
            "activation_cosine_similarity": 61.7389030456543,
            "activation_magnitude_ratio": -30.626718521118164,
            "activation_dot_product": 66.25082397460938,
            "encoder_gradient_cosine_similarity": 46.5970344543457,
            "encoder_gradient_l2_distance": -66.67843627929688,
            "encoder_gradient_dot_product": 101.19176483154297,
            "input_gradient_cosine_similarity": 109.85391998291016,
            "input_gradient_l2_distance": -76.24470520019531,
            "input_gradient_dot_product": -58.400550842285156
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.511798372788252,
          "val_r": 0.38668013176381283,
          "n_iterations": 825,
          "coefficients": {
            "effective_rank": 42.571998596191406,
            "effective_rank_mergeability_score": 82.29194641113281,
            "stable_rank": -20.95009422302246,
            "spectral_gap": -22.969633102416992,
            "singular_value_ratio": 2.5435657501220703,
            "layerwise_effective_rank": 83.7514419555664,
            "layerwise_effective_rank_mergeability_score": -43.73118209838867,
            "task_vector_cosine_similarity": -61.075496673583984,
            "task_vector_l2_distance": 122.17794799804688,
            "task_vector_dot_product": 56.89876937866211,
            "weight_space_angle": 6.170718669891357,
            "task_vector_magnitude_ratio": -99.17805480957031,
            "activation_l2_distance": -96.24658966064453,
            "activation_cosine_similarity": 148.08656311035156,
            "activation_magnitude_ratio": -52.848854064941406,
            "activation_dot_product": 1.3877410888671875,
            "encoder_gradient_cosine_similarity": 100.23208618164062,
            "encoder_gradient_l2_distance": -197.03726196289062,
            "encoder_gradient_dot_product": 6.9785943031311035,
            "input_gradient_cosine_similarity": 46.36387252807617,
            "input_gradient_l2_distance": -52.99732208251953,
            "input_gradient_dot_product": -51.42272186279297
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.6690102945587899,
          "val_r": 0.6859282297554661,
          "n_iterations": 946,
          "coefficients": {
            "effective_rank": -72.79582214355469,
            "effective_rank_mergeability_score": -27.16938018798828,
            "stable_rank": 16.297893524169922,
            "spectral_gap": 67.76978302001953,
            "singular_value_ratio": 51.72367477416992,
            "layerwise_effective_rank": -36.8642578125,
            "layerwise_effective_rank_mergeability_score": -30.19085693359375,
            "task_vector_cosine_similarity": -22.196128845214844,
            "task_vector_l2_distance": -22.596548080444336,
            "task_vector_dot_product": 20.96973991394043,
            "weight_space_angle": 38.75796127319336,
            "task_vector_magnitude_ratio": 35.5713996887207,
            "activation_l2_distance": 11.644025802612305,
            "activation_cosine_similarity": 31.06305694580078,
            "activation_magnitude_ratio": -5.548069953918457,
            "activation_dot_product": 91.24530029296875,
            "encoder_gradient_cosine_similarity": 35.39712905883789,
            "encoder_gradient_l2_distance": -68.7265396118164,
            "encoder_gradient_dot_product": 3.9178781509399414,
            "input_gradient_cosine_similarity": 16.988983154296875,
            "input_gradient_l2_distance": -76.63126373291016,
            "input_gradient_dot_product": -57.62953567504883
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6137718421764532,
          "val_r": 0.7026975873426619,
          "n_iterations": 708,
          "coefficients": {
            "effective_rank": 3.6961402893066406,
            "effective_rank_mergeability_score": 33.45564270019531,
            "stable_rank": -15.029562950134277,
            "spectral_gap": -1.8778594732284546,
            "singular_value_ratio": -20.813060760498047,
            "layerwise_effective_rank": 6.8393425941467285,
            "layerwise_effective_rank_mergeability_score": -5.426224708557129,
            "task_vector_cosine_similarity": 34.584781646728516,
            "task_vector_l2_distance": 3.360539436340332,
            "task_vector_dot_product": 35.675174713134766,
            "weight_space_angle": -59.53836441040039,
            "task_vector_magnitude_ratio": 30.146320343017578,
            "activation_l2_distance": -43.17163848876953,
            "activation_cosine_similarity": 30.492406845092773,
            "activation_magnitude_ratio": -37.39933395385742,
            "activation_dot_product": 45.0956916809082,
            "encoder_gradient_cosine_similarity": 48.318939208984375,
            "encoder_gradient_l2_distance": -66.04785919189453,
            "encoder_gradient_dot_product": 30.89417266845703,
            "input_gradient_cosine_similarity": 24.642187118530273,
            "input_gradient_l2_distance": -49.0650749206543,
            "input_gradient_dot_product": -27.8346004486084
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": -0.03970473271585378,
          "val_r": -0.1511793277544313,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 0.830409049987793,
            "effective_rank_mergeability_score": -2.661609649658203,
            "stable_rank": 3.0075395107269287,
            "spectral_gap": -1.5491690635681152,
            "singular_value_ratio": 0.7800021171569824,
            "layerwise_effective_rank": 1.6299763917922974,
            "layerwise_effective_rank_mergeability_score": -0.9022207260131836,
            "task_vector_cosine_similarity": -1.2814470529556274,
            "task_vector_l2_distance": -2.004441499710083,
            "task_vector_dot_product": -0.4576821029186249,
            "weight_space_angle": -3.245635509490967,
            "task_vector_magnitude_ratio": 0.795712947845459,
            "activation_l2_distance": 0.30780407786369324,
            "activation_cosine_similarity": -0.05037865787744522,
            "activation_magnitude_ratio": -0.4225356876850128,
            "activation_dot_product": 1.6404343843460083,
            "encoder_gradient_cosine_similarity": 1.2621870040893555,
            "encoder_gradient_l2_distance": 0.5777586102485657,
            "encoder_gradient_dot_product": 1.7120712995529175,
            "input_gradient_cosine_similarity": -0.8866254091262817,
            "input_gradient_l2_distance": 1.7024327516555786,
            "input_gradient_dot_product": 0.20060384273529053
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.6894583706806239,
          "val_r": 0.4858532638027599,
          "n_iterations": 986,
          "coefficients": {
            "effective_rank": -3.1518750190734863,
            "effective_rank_mergeability_score": 9.670104026794434,
            "stable_rank": -20.075687408447266,
            "spectral_gap": -11.33110237121582,
            "singular_value_ratio": -17.646406173706055,
            "layerwise_effective_rank": 13.213006973266602,
            "layerwise_effective_rank_mergeability_score": 4.452528476715088,
            "task_vector_cosine_similarity": -13.836134910583496,
            "task_vector_l2_distance": -26.892019271850586,
            "task_vector_dot_product": 22.05367088317871,
            "weight_space_angle": -4.032810211181641,
            "task_vector_magnitude_ratio": 21.28520393371582,
            "activation_l2_distance": 22.37901496887207,
            "activation_cosine_similarity": 11.697956085205078,
            "activation_magnitude_ratio": 1.0518873929977417,
            "activation_dot_product": 36.405296325683594,
            "encoder_gradient_cosine_similarity": 11.164202690124512,
            "encoder_gradient_l2_distance": -16.08236312866211,
            "encoder_gradient_dot_product": 3.695988416671753,
            "input_gradient_cosine_similarity": 10.16010570526123,
            "input_gradient_l2_distance": -28.882610321044922,
            "input_gradient_dot_product": -24.299467086791992
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7390691608469998,
          "val_r": 0.6752293526568118,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 0.3897587060928345,
            "effective_rank_mergeability_score": 0.29904016852378845,
            "stable_rank": -0.3840450644493103,
            "spectral_gap": -0.3466546833515167,
            "singular_value_ratio": 0.13420459628105164,
            "layerwise_effective_rank": -0.09884587675333023,
            "layerwise_effective_rank_mergeability_score": -0.03964102268218994,
            "task_vector_cosine_similarity": 0.3904103636741638,
            "task_vector_l2_distance": -0.4015405774116516,
            "task_vector_dot_product": 0.25419238209724426,
            "weight_space_angle": 0.29612788558006287,
            "task_vector_magnitude_ratio": -0.2870313227176666,
            "activation_l2_distance": 1.083980679512024,
            "activation_cosine_similarity": 1.4938150644302368,
            "activation_magnitude_ratio": -0.050917524844408035,
            "activation_dot_product": -0.11348061263561249,
            "encoder_gradient_cosine_similarity": 0.16159731149673462,
            "encoder_gradient_l2_distance": -0.9700100421905518,
            "encoder_gradient_dot_product": 0.04685400053858757,
            "input_gradient_cosine_similarity": 0.0983530655503273,
            "input_gradient_l2_distance": -0.6857722997665405,
            "input_gradient_dot_product": -0.2714727520942688
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6931023119062545,
          "val_r": 0.5529627667132346,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -2.3305320739746094,
            "effective_rank_mergeability_score": 3.3806779384613037,
            "stable_rank": 11.036053657531738,
            "spectral_gap": 0.1119564101099968,
            "singular_value_ratio": 1.8640007972717285,
            "layerwise_effective_rank": -2.532717227935791,
            "layerwise_effective_rank_mergeability_score": 12.932897567749023,
            "task_vector_cosine_similarity": 8.716341018676758,
            "task_vector_l2_distance": -7.15388298034668,
            "task_vector_dot_product": 1.9672504663467407,
            "weight_space_angle": 0.9765522480010986,
            "task_vector_magnitude_ratio": 0.723284900188446,
            "activation_l2_distance": -5.489625453948975,
            "activation_cosine_similarity": 5.9504618644714355,
            "activation_magnitude_ratio": -0.8027223944664001,
            "activation_dot_product": 8.984910011291504,
            "encoder_gradient_cosine_similarity": 5.575728416442871,
            "encoder_gradient_l2_distance": -7.123638153076172,
            "encoder_gradient_dot_product": 10.508809089660645,
            "input_gradient_cosine_similarity": 5.841558933258057,
            "input_gradient_l2_distance": -35.408382415771484,
            "input_gradient_dot_product": -16.730314254760742
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7731158680527156,
          "val_r": 0.3813973449483575,
          "n_iterations": 925,
          "coefficients": {
            "effective_rank": 1.297696590423584,
            "effective_rank_mergeability_score": 0.1372118890285492,
            "stable_rank": -1.4690734148025513,
            "spectral_gap": 0.10496644675731659,
            "singular_value_ratio": 1.0013130903244019,
            "layerwise_effective_rank": -0.22739651799201965,
            "layerwise_effective_rank_mergeability_score": -0.04985108971595764,
            "task_vector_cosine_similarity": -0.026922084391117096,
            "task_vector_l2_distance": -0.28480350971221924,
            "task_vector_dot_product": 0.24237589538097382,
            "weight_space_angle": -0.08423373103141785,
            "task_vector_magnitude_ratio": -0.4741450548171997,
            "activation_l2_distance": 0.8731260895729065,
            "activation_cosine_similarity": 1.0758699178695679,
            "activation_magnitude_ratio": 0.018250644207000732,
            "activation_dot_product": 0.013223580084741116,
            "encoder_gradient_cosine_similarity": 0.12333594262599945,
            "encoder_gradient_l2_distance": -0.6911313533782959,
            "encoder_gradient_dot_product": 0.015363299287855625,
            "input_gradient_cosine_similarity": 0.04365519806742668,
            "input_gradient_l2_distance": -0.47013726830482483,
            "input_gradient_dot_product": -0.1697412133216858
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7786013655040758,
          "val_r": 0.6488962996180625,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 9.988219261169434,
            "effective_rank_mergeability_score": -0.18740002810955048,
            "stable_rank": -1.8282643556594849,
            "spectral_gap": 15.165698051452637,
            "singular_value_ratio": 28.629323959350586,
            "layerwise_effective_rank": -11.237648010253906,
            "layerwise_effective_rank_mergeability_score": 2.743936777114868,
            "task_vector_cosine_similarity": 4.599456310272217,
            "task_vector_l2_distance": -17.777786254882812,
            "task_vector_dot_product": 10.397370338439941,
            "weight_space_angle": 5.459417343139648,
            "task_vector_magnitude_ratio": -17.96738052368164,
            "activation_l2_distance": 6.688107967376709,
            "activation_cosine_similarity": 17.34593391418457,
            "activation_magnitude_ratio": -8.901750564575195,
            "activation_dot_product": 30.55018424987793,
            "encoder_gradient_cosine_similarity": 6.123223781585693,
            "encoder_gradient_l2_distance": -60.138423919677734,
            "encoder_gradient_dot_product": -4.537242412567139,
            "input_gradient_cosine_similarity": 9.612516403198242,
            "input_gradient_l2_distance": -5.890133380889893,
            "input_gradient_dot_product": -17.83876609802246
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "arithmetic": {
      "aggregate_metrics": {
        "train_r": 0.11989877115907766,
        "train_p": 8.624129626892462e-12,
        "val_r": 0.03167337870997225,
        "val_p": 0.5502787458501001
      },
      "per_fold_stats": {
        "train_r_mean": 0.39984438152613216,
        "train_r_std": 0.14591528928086744,
        "val_r_mean": 0.348391256903991,
        "val_r_std": 0.24639741274160554
      },
      "average_coefficients": {
        "effective_rank": 36.58692932128906,
        "effective_rank_mergeability_score": 49.86984634399414,
        "stable_rank": -47.9909782409668,
        "spectral_gap": -1.8941634893417358,
        "singular_value_ratio": 2.690798282623291,
        "layerwise_effective_rank": 39.98095703125,
        "layerwise_effective_rank_mergeability_score": 33.17683029174805,
        "task_vector_cosine_similarity": 62.764320373535156,
        "task_vector_l2_distance": -156.59698486328125,
        "task_vector_dot_product": 78.24459838867188,
        "weight_space_angle": -75.9563217163086,
        "task_vector_magnitude_ratio": 70.54661560058594,
        "activation_l2_distance": 48.70585632324219,
        "activation_cosine_similarity": 38.83490753173828,
        "activation_magnitude_ratio": -3.5970263481140137,
        "activation_dot_product": 62.0295295715332,
        "encoder_gradient_cosine_similarity": 70.27272033691406,
        "encoder_gradient_l2_distance": -76.24400329589844,
        "encoder_gradient_dot_product": 14.345242500305176,
        "input_gradient_cosine_similarity": 28.78887939453125,
        "input_gradient_l2_distance": -140.75328063964844,
        "input_gradient_dot_product": -132.80809020996094
      },
      "coefficient_std": {
        "effective_rank": 128.8020782470703,
        "effective_rank_mergeability_score": 111.16791534423828,
        "stable_rank": 220.61192321777344,
        "spectral_gap": 111.37564086914062,
        "singular_value_ratio": 55.24403762817383,
        "layerwise_effective_rank": 160.09373474121094,
        "layerwise_effective_rank_mergeability_score": 125.38443756103516,
        "task_vector_cosine_similarity": 152.69479370117188,
        "task_vector_l2_distance": 522.4150390625,
        "task_vector_dot_product": 235.315185546875,
        "weight_space_angle": 235.9313507080078,
        "task_vector_magnitude_ratio": 311.0113220214844,
        "activation_l2_distance": 356.7044982910156,
        "activation_cosine_similarity": 115.6213607788086,
        "activation_magnitude_ratio": 37.12839126586914,
        "activation_dot_product": 116.90392303466797,
        "encoder_gradient_cosine_similarity": 254.7305145263672,
        "encoder_gradient_l2_distance": 127.1515121459961,
        "encoder_gradient_dot_product": 198.50059509277344,
        "input_gradient_cosine_similarity": 73.70551300048828,
        "input_gradient_l2_distance": 425.0874328613281,
        "input_gradient_dot_product": 394.3180236816406
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.4438611153698801,
          "val_r": 0.42726140131801427,
          "n_iterations": 664,
          "coefficients": {
            "effective_rank": 11.522387504577637,
            "effective_rank_mergeability_score": 1.877713680267334,
            "stable_rank": -63.525394439697266,
            "spectral_gap": 20.77401351928711,
            "singular_value_ratio": 53.676822662353516,
            "layerwise_effective_rank": 40.02324295043945,
            "layerwise_effective_rank_mergeability_score": -5.998660564422607,
            "task_vector_cosine_similarity": 45.03112030029297,
            "task_vector_l2_distance": -8.10644245147705,
            "task_vector_dot_product": -14.899109840393066,
            "weight_space_angle": -19.235204696655273,
            "task_vector_magnitude_ratio": -38.80952072143555,
            "activation_l2_distance": 9.549771308898926,
            "activation_cosine_similarity": 42.58867263793945,
            "activation_magnitude_ratio": 0.2462863028049469,
            "activation_dot_product": 31.067115783691406,
            "encoder_gradient_cosine_similarity": 31.91367530822754,
            "encoder_gradient_l2_distance": -14.720356941223145,
            "encoder_gradient_dot_product": 21.651647567749023,
            "input_gradient_cosine_similarity": 15.257891654968262,
            "input_gradient_l2_distance": -89.0084457397461,
            "input_gradient_dot_product": -69.87953186035156
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.46893534122299874,
          "val_r": 0.2943846439895879,
          "n_iterations": 929,
          "coefficients": {
            "effective_rank": 94.54259490966797,
            "effective_rank_mergeability_score": 93.60623168945312,
            "stable_rank": -30.248332977294922,
            "spectral_gap": 8.985761642456055,
            "singular_value_ratio": -59.70964813232422,
            "layerwise_effective_rank": -5.116936683654785,
            "layerwise_effective_rank_mergeability_score": -57.65451431274414,
            "task_vector_cosine_similarity": 22.18362045288086,
            "task_vector_l2_distance": -47.33681869506836,
            "task_vector_dot_product": 77.1306381225586,
            "weight_space_angle": 45.05107879638672,
            "task_vector_magnitude_ratio": 31.2720890045166,
            "activation_l2_distance": -13.134604454040527,
            "activation_cosine_similarity": 60.89194869995117,
            "activation_magnitude_ratio": -44.00535583496094,
            "activation_dot_product": -30.856502532958984,
            "encoder_gradient_cosine_similarity": 0.6652258038520813,
            "encoder_gradient_l2_distance": -42.33258819580078,
            "encoder_gradient_dot_product": 49.2602653503418,
            "input_gradient_cosine_similarity": -43.450740814208984,
            "input_gradient_l2_distance": -98.39612579345703,
            "input_gradient_dot_product": -10.348896980285645
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.3465829905602539,
          "val_r": 0.41241579402927947,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 570.3150024414062,
            "effective_rank_mergeability_score": 419.3130798339844,
            "stable_rank": -971.017822265625,
            "spectral_gap": 351.4214172363281,
            "singular_value_ratio": 31.529081344604492,
            "layerwise_effective_rank": 712.2073974609375,
            "layerwise_effective_rank_mergeability_score": 521.8646850585938,
            "task_vector_cosine_similarity": 706.1134643554688,
            "task_vector_l2_distance": -2373.045166015625,
            "task_vector_dot_product": 1091.702392578125,
            "weight_space_angle": -1080.5303955078125,
            "task_vector_magnitude_ratio": 1418.97607421875,
            "activation_l2_distance": 1571.2705078125,
            "activation_cosine_similarity": 523.877685546875,
            "activation_magnitude_ratio": 106.41976165771484,
            "activation_dot_product": 548.6272583007812,
            "encoder_gradient_cosine_similarity": 1165.515869140625,
            "encoder_gradient_l2_distance": -603.9276123046875,
            "encoder_gradient_dot_product": -775.4651489257812,
            "input_gradient_cosine_similarity": -147.00355529785156,
            "input_gradient_l2_distance": -1989.133544921875,
            "input_gradient_dot_product": -1798.0302734375
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.44167097641528974,
          "val_r": 0.3094787440449513,
          "n_iterations": 645,
          "coefficients": {
            "effective_rank": 13.110542297363281,
            "effective_rank_mergeability_score": 13.154526710510254,
            "stable_rank": -27.801420211791992,
            "spectral_gap": 42.79903030395508,
            "singular_value_ratio": 12.714822769165039,
            "layerwise_effective_rank": -26.213098526000977,
            "layerwise_effective_rank_mergeability_score": -42.61034393310547,
            "task_vector_cosine_similarity": 47.50958251953125,
            "task_vector_l2_distance": -26.41152572631836,
            "task_vector_dot_product": 3.464379072189331,
            "weight_space_angle": -3.7230358123779297,
            "task_vector_magnitude_ratio": 16.94635581970215,
            "activation_l2_distance": 7.163827896118164,
            "activation_cosine_similarity": -5.784586429595947,
            "activation_magnitude_ratio": 11.066012382507324,
            "activation_dot_product": 59.96067428588867,
            "encoder_gradient_cosine_similarity": 14.070479393005371,
            "encoder_gradient_l2_distance": -65.07678985595703,
            "encoder_gradient_dot_product": 28.12376594543457,
            "input_gradient_cosine_similarity": 26.1127986907959,
            "input_gradient_l2_distance": -34.41925811767578,
            "input_gradient_dot_product": -63.15913772583008
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.3171835310227603,
          "val_r": 0.40717349630863436,
          "n_iterations": 759,
          "coefficients": {
            "effective_rank": -20.001880645751953,
            "effective_rank_mergeability_score": 51.547420501708984,
            "stable_rank": 62.24293518066406,
            "spectral_gap": 27.11090850830078,
            "singular_value_ratio": -37.93608856201172,
            "layerwise_effective_rank": -20.20271873474121,
            "layerwise_effective_rank_mergeability_score": -8.312212944030762,
            "task_vector_cosine_similarity": 23.36859703063965,
            "task_vector_l2_distance": -19.544944763183594,
            "task_vector_dot_product": 32.74728775024414,
            "weight_space_angle": -151.11373901367188,
            "task_vector_magnitude_ratio": 50.10537338256836,
            "activation_l2_distance": -67.9867935180664,
            "activation_cosine_similarity": -1.9953041076660156,
            "activation_magnitude_ratio": -17.032054901123047,
            "activation_dot_product": 73.05899810791016,
            "encoder_gradient_cosine_similarity": 36.95292282104492,
            "encoder_gradient_l2_distance": -54.261878967285156,
            "encoder_gradient_dot_product": 38.00862121582031,
            "input_gradient_cosine_similarity": 70.24324035644531,
            "input_gradient_l2_distance": -19.814626693725586,
            "input_gradient_dot_product": -46.18621063232422
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.5005322545881656,
          "val_r": 0.6932907653856077,
          "n_iterations": 831,
          "coefficients": {
            "effective_rank": -12.21310806274414,
            "effective_rank_mergeability_score": 2.8198211193084717,
            "stable_rank": 0.5987972617149353,
            "spectral_gap": 14.875252723693848,
            "singular_value_ratio": 5.097167015075684,
            "layerwise_effective_rank": 2.0063822269439697,
            "layerwise_effective_rank_mergeability_score": -9.985251426696777,
            "task_vector_cosine_similarity": -0.8864018321037292,
            "task_vector_l2_distance": -22.070877075195312,
            "task_vector_dot_product": 25.19261932373047,
            "weight_space_angle": 7.838959217071533,
            "task_vector_magnitude_ratio": 2.3208072185516357,
            "activation_l2_distance": 2.247128486633301,
            "activation_cosine_similarity": 10.570873260498047,
            "activation_magnitude_ratio": 1.5092041492462158,
            "activation_dot_product": 3.9521420001983643,
            "encoder_gradient_cosine_similarity": 8.34498405456543,
            "encoder_gradient_l2_distance": -14.247291564941406,
            "encoder_gradient_dot_product": 15.963883399963379,
            "input_gradient_cosine_similarity": 6.135110378265381,
            "input_gradient_l2_distance": -27.012256622314453,
            "input_gradient_dot_product": -22.059688568115234
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.05569506230738391,
          "val_r": 0.09792043263638915,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 0.5903240442276001,
            "effective_rank_mergeability_score": -1.7493128776550293,
            "stable_rank": -0.7755810022354126,
            "spectral_gap": -0.8314911723136902,
            "singular_value_ratio": -1.5841809511184692,
            "layerwise_effective_rank": -2.016813039779663,
            "layerwise_effective_rank_mergeability_score": -2.247765302658081,
            "task_vector_cosine_similarity": 0.14108771085739136,
            "task_vector_l2_distance": -2.4977827072143555,
            "task_vector_dot_product": 0.18863685429096222,
            "weight_space_angle": 2.4207794666290283,
            "task_vector_magnitude_ratio": 0.6661447286605835,
            "activation_l2_distance": -7.948389053344727,
            "activation_cosine_similarity": 0.8555179238319397,
            "activation_magnitude_ratio": 1.7959336042404175,
            "activation_dot_product": 4.125377655029297,
            "encoder_gradient_cosine_similarity": -8.766348838806152,
            "encoder_gradient_l2_distance": 0.8416219353675842,
            "encoder_gradient_dot_product": 3.032325267791748,
            "input_gradient_cosine_similarity": 11.668514251708984,
            "input_gradient_l2_distance": 3.116330146789551,
            "input_gradient_dot_product": -0.04001419618725777
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.29051012177103125,
          "val_r": -0.5304582150887321,
          "n_iterations": 405,
          "coefficients": {
            "effective_rank": 76.83485412597656,
            "effective_rank_mergeability_score": -31.386690139770508,
            "stable_rank": -86.94820404052734,
            "spectral_gap": -58.95900344848633,
            "singular_value_ratio": -16.149564743041992,
            "layerwise_effective_rank": -39.816444396972656,
            "layerwise_effective_rank_mergeability_score": 69.23486328125,
            "task_vector_cosine_similarity": -5.652651786804199,
            "task_vector_l2_distance": 31.35320281982422,
            "task_vector_dot_product": 38.92640686035156,
            "weight_space_angle": -145.8230743408203,
            "task_vector_magnitude_ratio": -2.921239137649536,
            "activation_l2_distance": -51.45842742919922,
            "activation_cosine_similarity": 81.33026885986328,
            "activation_magnitude_ratio": 10.755301475524902,
            "activation_dot_product": 34.07033920288086,
            "encoder_gradient_cosine_similarity": 105.10743713378906,
            "encoder_gradient_l2_distance": -172.917724609375,
            "encoder_gradient_dot_product": 50.466217041015625,
            "input_gradient_cosine_similarity": 6.982125282287598,
            "input_gradient_l2_distance": -0.9318314790725708,
            "input_gradient_dot_product": 108.90028381347656
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.12742071581117764,
          "val_r": 0.45325255520416646,
          "n_iterations": 713,
          "coefficients": {
            "effective_rank": 53.96982955932617,
            "effective_rank_mergeability_score": 288.89404296875,
            "stable_rank": 196.3185577392578,
            "spectral_gap": -304.2197265625,
            "singular_value_ratio": 178.17308044433594,
            "layerwise_effective_rank": 124.07943725585938,
            "layerwise_effective_rank_mergeability_score": 177.45843505859375,
            "task_vector_cosine_similarity": 133.8064727783203,
            "task_vector_l2_distance": -539.8726806640625,
            "task_vector_dot_product": 111.38871765136719,
            "weight_space_angle": -3.110382556915283,
            "task_vector_magnitude_ratio": -17.504573822021484,
            "activation_l2_distance": -323.7209167480469,
            "activation_cosine_similarity": -46.603492736816406,
            "activation_magnitude_ratio": -56.564361572265625,
            "activation_dot_product": 102.45729064941406,
            "encoder_gradient_cosine_similarity": -139.01345825195312,
            "encoder_gradient_l2_distance": -29.908493041992188,
            "encoder_gradient_dot_product": 391.57464599609375,
            "input_gradient_cosine_similarity": 220.6424560546875,
            "input_gradient_l2_distance": -83.12076568603516,
            "input_gradient_dot_product": -434.1262512207031
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.2256165951237116,
          "val_r": 0.23400230368873354,
          "n_iterations": 819,
          "coefficients": {
            "effective_rank": 43.74525451660156,
            "effective_rank_mergeability_score": 126.18656921386719,
            "stable_rank": -103.92466735839844,
            "spectral_gap": -141.79595947265625,
            "singular_value_ratio": 90.884033203125,
            "layerwise_effective_rank": -82.99783325195312,
            "layerwise_effective_rank_mergeability_score": 85.21517181396484,
            "task_vector_cosine_similarity": -17.33927345275879,
            "task_vector_l2_distance": 91.95073699951172,
            "task_vector_dot_product": -53.23705291748047,
            "weight_space_angle": -78.48451232910156,
            "task_vector_magnitude_ratio": 26.835529327392578,
            "activation_l2_distance": -89.86837768554688,
            "activation_cosine_similarity": 26.795068740844727,
            "activation_magnitude_ratio": -89.08637237548828,
            "activation_dot_product": 87.09565734863281,
            "encoder_gradient_cosine_similarity": 47.85027313232422,
            "encoder_gradient_l2_distance": -77.07657623291016,
            "encoder_gradient_dot_product": 75.46017456054688,
            "input_gradient_cosine_similarity": 195.6053009033203,
            "input_gradient_l2_distance": -91.89893341064453,
            "input_gradient_dot_product": -70.91619873046875
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.4989752766026555,
          "val_r": 0.22233011270769393,
          "n_iterations": 844,
          "coefficients": {
            "effective_rank": 0.3194844722747803,
            "effective_rank_mergeability_score": 13.568696975708008,
            "stable_rank": 9.754338264465332,
            "spectral_gap": 7.487887859344482,
            "singular_value_ratio": 3.9786665439605713,
            "layerwise_effective_rank": 4.452559947967529,
            "layerwise_effective_rank_mergeability_score": -2.657721757888794,
            "task_vector_cosine_similarity": 0.4392014443874359,
            "task_vector_l2_distance": -19.388851165771484,
            "task_vector_dot_product": 21.149328231811523,
            "weight_space_angle": 8.612858772277832,
            "task_vector_magnitude_ratio": -11.074357032775879,
            "activation_l2_distance": -7.888173580169678,
            "activation_cosine_similarity": 16.06208038330078,
            "activation_magnitude_ratio": -0.053869038820266724,
            "activation_dot_product": 0.4520449936389923,
            "encoder_gradient_cosine_similarity": 1.770403265953064,
            "encoder_gradient_l2_distance": -31.82434844970703,
            "encoder_gradient_dot_product": 15.217584609985352,
            "input_gradient_cosine_similarity": 13.765948295593262,
            "input_gradient_l2_distance": -21.592084884643555,
            "input_gradient_dot_product": -21.553438186645508
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.48303612786295147,
          "val_r": 0.39284292730195225,
          "n_iterations": 643,
          "coefficients": {
            "effective_rank": -47.423702239990234,
            "effective_rank_mergeability_score": -4.977130889892578,
            "stable_rank": 35.52070617675781,
            "spectral_gap": 21.407268524169922,
            "singular_value_ratio": -23.760244369506836,
            "layerwise_effective_rank": 29.823341369628906,
            "layerwise_effective_rank_mergeability_score": 3.999809741973877,
            "task_vector_cosine_similarity": -2.398223638534546,
            "task_vector_l2_distance": -28.68212890625,
            "task_vector_dot_product": 36.13691329956055,
            "weight_space_angle": -8.62051773071289,
            "task_vector_magnitude_ratio": 13.484651565551758,
            "activation_l2_distance": 8.134636878967285,
            "activation_cosine_similarity": 18.841625213623047,
            "activation_magnitude_ratio": -0.43072977662086487,
            "activation_dot_product": 14.68933391571045,
            "encoder_gradient_cosine_similarity": 15.547368049621582,
            "encoder_gradient_l2_distance": -43.329959869384766,
            "encoder_gradient_dot_product": 25.550201416015625,
            "input_gradient_cosine_similarity": 17.76214599609375,
            "input_gradient_l2_distance": -36.842960357666016,
            "input_gradient_dot_product": -43.434730529785156
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.46831402439110137,
          "val_r": 0.30211218604648254,
          "n_iterations": 794,
          "coefficients": {
            "effective_rank": -1.469751000404358,
            "effective_rank_mergeability_score": 18.181066513061523,
            "stable_rank": 21.50086212158203,
            "spectral_gap": 15.301765441894531,
            "singular_value_ratio": -7.238900661468506,
            "layerwise_effective_rank": -3.047292470932007,
            "layerwise_effective_rank_mergeability_score": -12.989472389221191,
            "task_vector_cosine_similarity": 18.031442642211914,
            "task_vector_l2_distance": -6.340893268585205,
            "task_vector_dot_product": -7.105930805206299,
            "weight_space_angle": -26.25352668762207,
            "task_vector_magnitude_ratio": 7.712460517883301,
            "activation_l2_distance": 2.497655153274536,
            "activation_cosine_similarity": 2.7601020336151123,
            "activation_magnitude_ratio": 2.800525426864624,
            "activation_dot_product": 15.073871612548828,
            "encoder_gradient_cosine_similarity": 11.942789077758789,
            "encoder_gradient_l2_distance": -20.21106719970703,
            "encoder_gradient_dot_product": 17.383317947387695,
            "input_gradient_cosine_similarity": 6.923612117767334,
            "input_gradient_l2_distance": -20.778987884521484,
            "input_gradient_dot_product": -33.675575256347656
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.49655281357208,
          "val_r": 0.5462681643631968,
          "n_iterations": 702,
          "coefficients": {
            "effective_rank": 8.36268424987793,
            "effective_rank_mergeability_score": 16.441072463989258,
            "stable_rank": -6.453282356262207,
            "spectral_gap": 0.794687032699585,
            "singular_value_ratio": -10.014398574829102,
            "layerwise_effective_rank": 28.433942794799805,
            "layerwise_effective_rank_mergeability_score": 9.445757865905762,
            "task_vector_cosine_similarity": 18.17560386657715,
            "task_vector_l2_distance": -23.91951560974121,
            "task_vector_dot_product": 11.076075553894043,
            "weight_space_angle": 3.378910779953003,
            "task_vector_magnitude_ratio": -3.032137393951416,
            "activation_l2_distance": -12.439441680908203,
            "activation_cosine_similarity": -4.897181510925293,
            "activation_magnitude_ratio": 3.3624677658081055,
            "activation_dot_product": 17.63648796081543,
            "encoder_gradient_cosine_similarity": 6.267938137054443,
            "encoder_gradient_l2_distance": -47.52074432373047,
            "encoder_gradient_dot_product": 33.74204635620117,
            "input_gradient_cosine_similarity": 5.900745868682861,
            "input_gradient_l2_distance": -25.878734588623047,
            "input_gradient_dot_product": -27.865123748779297
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.3977930815768109,
          "val_r": 0.5751242235768522,
          "n_iterations": 711,
          "coefficients": {
            "effective_rank": 1.6542221307754517,
            "effective_rank_mergeability_score": 19.363590240478516,
            "stable_rank": -11.617297172546387,
            "spectral_gap": 30.42929458618164,
            "singular_value_ratio": 5.558468818664551,
            "layerwise_effective_rank": 37.40480422973633,
            "layerwise_effective_rank_mergeability_score": -49.939178466796875,
            "task_vector_cosine_similarity": 65.03766632080078,
            "task_vector_l2_distance": -30.978296279907227,
            "task_vector_dot_product": 13.720391273498535,
            "weight_space_angle": -39.93062210083008,
            "task_vector_magnitude_ratio": -56.80855178833008,
            "activation_l2_distance": 3.633378505706787,
            "activation_cosine_similarity": 3.7756054401397705,
            "activation_magnitude_ratio": -9.216941833496094,
            "activation_dot_product": 61.49060821533203,
            "encoder_gradient_cosine_similarity": 27.983619689941406,
            "encoder_gradient_l2_distance": -64.75077819824219,
            "encoder_gradient_dot_product": 62.3950080871582,
            "input_gradient_cosine_similarity": 16.403438568115234,
            "input_gradient_l2_distance": -24.508386611938477,
            "input_gradient_dot_product": -60.10230255126953
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.49952778189992814,
          "val_r": 0.5604858615723668,
          "n_iterations": 639,
          "coefficients": {
            "effective_rank": -46.10905838012695,
            "effective_rank_mergeability_score": 38.749244689941406,
            "stable_rank": 24.186315536499023,
            "spectral_gap": -2.7594470977783203,
            "singular_value_ratio": -16.185941696166992,
            "layerwise_effective_rank": 57.761295318603516,
            "layerwise_effective_rank_mergeability_score": -32.9878044128418,
            "task_vector_cosine_similarity": 51.082969665527344,
            "task_vector_l2_distance": -72.98905944824219,
            "task_vector_dot_product": 42.72322082519531,
            "weight_space_angle": 21.795551300048828,
            "task_vector_magnitude_ratio": -34.51123809814453,
            "activation_l2_distance": -6.580506324768066,
            "activation_cosine_similarity": -5.934782981872559,
            "activation_magnitude_ratio": -9.285561561584473,
            "activation_dot_product": 42.252418518066406,
            "encoder_gradient_cosine_similarity": 7.324460506439209,
            "encoder_gradient_l2_distance": -116.82479858398438,
            "encoder_gradient_dot_product": 26.511388778686523,
            "input_gradient_cosine_similarity": 31.1885986328125,
            "input_gradient_l2_distance": -31.5720272064209,
            "input_gradient_dot_product": 33.162391662597656
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.3548142707957168,
          "val_r": 0.35332169888066045,
          "n_iterations": 572,
          "coefficients": {
            "effective_rank": -59.94084167480469,
            "effective_rank_mergeability_score": -10.572295188903809,
            "stable_rank": 37.0619010925293,
            "spectral_gap": -13.77512264251709,
            "singular_value_ratio": -90.91879272460938,
            "layerwise_effective_rank": 0.11634908616542816,
            "layerwise_effective_rank_mergeability_score": -53.54697799682617,
            "task_vector_cosine_similarity": 102.2153549194336,
            "task_vector_l2_distance": 11.870901107788086,
            "task_vector_dot_product": 51.81676483154297,
            "weight_space_angle": -30.182939529418945,
            "task_vector_magnitude_ratio": 11.320893287658691,
            "activation_l2_distance": -46.2264518737793,
            "activation_cosine_similarity": 35.54795837402344,
            "activation_magnitude_ratio": -20.0711612701416,
            "activation_dot_product": 22.047863006591797,
            "encoder_gradient_cosine_similarity": 26.890605926513672,
            "encoder_gradient_l2_distance": -21.060222625732422,
            "encoder_gradient_dot_product": 84.59445190429688,
            "input_gradient_cosine_similarity": 36.608909606933594,
            "input_gradient_l2_distance": -58.75551223754883,
            "input_gradient_dot_product": -14.04434871673584
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.3276541995756133,
          "val_r": 0.25268024178001336,
          "n_iterations": 487,
          "coefficients": {
            "effective_rank": -29.5704345703125,
            "effective_rank_mergeability_score": -75.5811767578125,
            "stable_rank": 27.503028869628906,
            "spectral_gap": -56.50215148925781,
            "singular_value_ratio": -31.55864715576172,
            "layerwise_effective_rank": 2.063833475112915,
            "layerwise_effective_rank_mergeability_score": 90.74849700927734,
            "task_vector_cosine_similarity": -27.580350875854492,
            "task_vector_l2_distance": -47.96099090576172,
            "task_vector_dot_product": 79.71768188476562,
            "weight_space_angle": -55.57450485229492,
            "task_vector_magnitude_ratio": -65.78694915771484,
            "activation_l2_distance": -15.021506309509277,
            "activation_cosine_similarity": -53.7012825012207,
            "activation_magnitude_ratio": 46.547523498535156,
            "activation_dot_product": 104.15943908691406,
            "encoder_gradient_cosine_similarity": 19.851804733276367,
            "encoder_gradient_l2_distance": -7.1219282150268555,
            "encoder_gradient_dot_product": 94.74552917480469,
            "input_gradient_cosine_similarity": 72.24774932861328,
            "input_gradient_l2_distance": -41.851253509521484,
            "input_gradient_dot_product": -28.776994705200195
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7043287693935265,
          "val_r": 0.5753823871850702,
          "n_iterations": 652,
          "coefficients": {
            "effective_rank": 60.95164489746094,
            "effective_rank_mergeability_score": -5.786910057067871,
            "stable_rank": -73.265380859375,
            "spectral_gap": -9.36495304107666,
            "singular_value_ratio": -38.982051849365234,
            "layerwise_effective_rank": -65.03795623779297,
            "layerwise_effective_rank_mergeability_score": -15.315803527832031,
            "task_vector_cosine_similarity": 63.94851303100586,
            "task_vector_l2_distance": 33.69394302368164,
            "task_vector_dot_product": -13.703190803527832,
            "weight_space_angle": 37.85324478149414,
            "task_vector_magnitude_ratio": 70.4179916381836,
            "activation_l2_distance": 8.374897003173828,
            "activation_cosine_similarity": 51.541038513183594,
            "activation_magnitude_ratio": -11.694485664367676,
            "activation_dot_product": 36.80942153930664,
            "encoder_gradient_cosine_similarity": 12.205265998840332,
            "encoder_gradient_l2_distance": -50.55784606933594,
            "encoder_gradient_dot_product": 0.4357925057411194,
            "input_gradient_cosine_similarity": -4.584902286529541,
            "input_gradient_l2_distance": -84.11106872558594,
            "input_gradient_dot_product": -2.829526424407959
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5478825806596075,
          "val_r": 0.3885554131488997,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 12.548609733581543,
            "effective_rank_mergeability_score": 23.747203826904297,
            "stable_rank": 1.0704610347747803,
            "spectral_gap": 8.937307357788086,
            "singular_value_ratio": 6.242284774780273,
            "layerwise_effective_rank": 5.695487022399902,
            "layerwise_effective_rank_mergeability_score": -0.18472668528556824,
            "task_vector_cosine_similarity": 12.05854606628418,
            "task_vector_l2_distance": -31.662307739257812,
            "task_vector_dot_product": 16.755937576293945,
            "weight_space_angle": -3.495429039001465,
            "task_vector_magnitude_ratio": -8.67730712890625,
            "activation_l2_distance": 3.5189006328582764,
            "activation_cosine_similarity": 20.176368713378906,
            "activation_magnitude_ratio": 0.9973644018173218,
            "activation_dot_product": 12.42073917388916,
            "encoder_gradient_cosine_similarity": 13.02911376953125,
            "encoder_gradient_l2_distance": -48.0506477355957,
            "encoder_gradient_dot_product": 28.25307273864746,
            "input_gradient_cosine_similarity": 17.36819076538086,
            "input_gradient_l2_distance": -38.55495071411133,
            "input_gradient_dot_product": -51.19572830200195
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "tsv": {
      "aggregate_metrics": {
        "train_r": 0.10512498175792483,
        "train_p": 2.211759828377331e-09,
        "val_r": -0.20795638683990952,
        "val_p": 7.358594285931861e-05
      },
      "per_fold_stats": {
        "train_r_mean": 0.51176696134267,
        "train_r_std": 0.29008324648464356,
        "val_r_mean": 0.3678835402333416,
        "val_r_std": 0.29355196368293435
      },
      "average_coefficients": {
        "effective_rank": -6.7596845626831055,
        "effective_rank_mergeability_score": 25.623905181884766,
        "stable_rank": -34.09730911254883,
        "spectral_gap": -18.90238380432129,
        "singular_value_ratio": 31.581707000732422,
        "layerwise_effective_rank": -8.113748550415039,
        "layerwise_effective_rank_mergeability_score": -4.397496700286865,
        "task_vector_cosine_similarity": 18.963287353515625,
        "task_vector_l2_distance": -27.08485984802246,
        "task_vector_dot_product": 38.52593231201172,
        "weight_space_angle": -17.436185836791992,
        "task_vector_magnitude_ratio": 44.63688278198242,
        "activation_l2_distance": 11.489348411560059,
        "activation_cosine_similarity": 1.7216180562973022,
        "activation_magnitude_ratio": -15.763181686401367,
        "activation_dot_product": 8.83303165435791,
        "encoder_gradient_cosine_similarity": 31.801311492919922,
        "encoder_gradient_l2_distance": -3.2287392616271973,
        "encoder_gradient_dot_product": -21.128162384033203,
        "input_gradient_cosine_similarity": 20.456689834594727,
        "input_gradient_l2_distance": -59.281646728515625,
        "input_gradient_dot_product": -16.442514419555664
      },
      "coefficient_std": {
        "effective_rank": 134.74508666992188,
        "effective_rank_mergeability_score": 164.36509704589844,
        "stable_rank": 68.34293365478516,
        "spectral_gap": 103.76392364501953,
        "singular_value_ratio": 80.11180877685547,
        "layerwise_effective_rank": 79.97417449951172,
        "layerwise_effective_rank_mergeability_score": 127.98417663574219,
        "task_vector_cosine_similarity": 88.9659423828125,
        "task_vector_l2_distance": 97.79913330078125,
        "task_vector_dot_product": 85.00641632080078,
        "weight_space_angle": 68.32349395751953,
        "task_vector_magnitude_ratio": 168.19471740722656,
        "activation_l2_distance": 71.74549102783203,
        "activation_cosine_similarity": 55.12752151489258,
        "activation_magnitude_ratio": 82.23844909667969,
        "activation_dot_product": 69.12869262695312,
        "encoder_gradient_cosine_similarity": 107.16895294189453,
        "encoder_gradient_l2_distance": 114.82402801513672,
        "encoder_gradient_dot_product": 153.18353271484375,
        "input_gradient_cosine_similarity": 95.20022583007812,
        "input_gradient_l2_distance": 121.63509368896484,
        "input_gradient_dot_product": 60.941898345947266
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7481721488399978,
          "val_r": 0.6018898403943618,
          "n_iterations": 645,
          "coefficients": {
            "effective_rank": 0.11993422359228134,
            "effective_rank_mergeability_score": -0.017164992168545723,
            "stable_rank": -0.2841717004776001,
            "spectral_gap": 0.0032211607322096825,
            "singular_value_ratio": 0.2787041962146759,
            "layerwise_effective_rank": 0.14321628212928772,
            "layerwise_effective_rank_mergeability_score": 0.05329161137342453,
            "task_vector_cosine_similarity": 0.398360937833786,
            "task_vector_l2_distance": -0.060205794870853424,
            "task_vector_dot_product": 0.02139865979552269,
            "weight_space_angle": 0.3027231693267822,
            "task_vector_magnitude_ratio": -0.2137582153081894,
            "activation_l2_distance": 0.25280508399009705,
            "activation_cosine_similarity": 0.3491460680961609,
            "activation_magnitude_ratio": -0.020172931253910065,
            "activation_dot_product": -0.07224773615598679,
            "encoder_gradient_cosine_similarity": 0.017629852518439293,
            "encoder_gradient_l2_distance": -0.1505742073059082,
            "encoder_gradient_dot_product": -0.009000930935144424,
            "input_gradient_cosine_similarity": 0.015327959321439266,
            "input_gradient_l2_distance": -0.08844441920518875,
            "input_gradient_dot_product": -0.03951291739940643
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6408355309294762,
          "val_r": 0.38917456020486474,
          "n_iterations": 880,
          "coefficients": {
            "effective_rank": 8.272721290588379,
            "effective_rank_mergeability_score": -3.1155734062194824,
            "stable_rank": 44.69996643066406,
            "spectral_gap": 40.560672760009766,
            "singular_value_ratio": -0.134681835770607,
            "layerwise_effective_rank": -43.39711380004883,
            "layerwise_effective_rank_mergeability_score": -10.99774169921875,
            "task_vector_cosine_similarity": 57.1016731262207,
            "task_vector_l2_distance": 3.3561532497406006,
            "task_vector_dot_product": -6.6539692878723145,
            "weight_space_angle": 8.717500686645508,
            "task_vector_magnitude_ratio": 6.858828067779541,
            "activation_l2_distance": -38.89628219604492,
            "activation_cosine_similarity": 10.133366584777832,
            "activation_magnitude_ratio": -15.109967231750488,
            "activation_dot_product": 5.654765605926514,
            "encoder_gradient_cosine_similarity": 4.011516571044922,
            "encoder_gradient_l2_distance": -66.4718246459961,
            "encoder_gradient_dot_product": 24.29950714111328,
            "input_gradient_cosine_similarity": 2.3976638317108154,
            "input_gradient_l2_distance": -47.683067321777344,
            "input_gradient_dot_product": 17.394136428833008
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7540677384964971,
          "val_r": 0.8149353205223813,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 0.9645697474479675,
            "effective_rank_mergeability_score": -0.4875011146068573,
            "stable_rank": -1.3121994733810425,
            "spectral_gap": -0.12957827746868134,
            "singular_value_ratio": 0.8683691620826721,
            "layerwise_effective_rank": -0.08395214378833771,
            "layerwise_effective_rank_mergeability_score": 0.6048736572265625,
            "task_vector_cosine_similarity": -0.19943250715732574,
            "task_vector_l2_distance": -0.4209572374820709,
            "task_vector_dot_product": 0.5918575525283813,
            "weight_space_angle": -0.08741956204175949,
            "task_vector_magnitude_ratio": -0.6276937127113342,
            "activation_l2_distance": 1.3358632326126099,
            "activation_cosine_similarity": 1.7155100107192993,
            "activation_magnitude_ratio": -0.039914801716804504,
            "activation_dot_product": -0.18930044770240784,
            "encoder_gradient_cosine_similarity": 0.05092654004693031,
            "encoder_gradient_l2_distance": -0.8668689727783203,
            "encoder_gradient_dot_product": -0.12619958817958832,
            "input_gradient_cosine_similarity": 0.07721798121929169,
            "input_gradient_l2_distance": -0.5255029201507568,
            "input_gradient_dot_product": -0.1140933558344841
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6916077702110865,
          "val_r": 0.6981613449355816,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 1.214691400527954,
            "effective_rank_mergeability_score": 0.058426085859537125,
            "stable_rank": -9.45583724975586,
            "spectral_gap": 3.971817970275879,
            "singular_value_ratio": -1.5932486057281494,
            "layerwise_effective_rank": 3.3467016220092773,
            "layerwise_effective_rank_mergeability_score": 4.83644962310791,
            "task_vector_cosine_similarity": 9.51919174194336,
            "task_vector_l2_distance": -6.574027061462402,
            "task_vector_dot_product": 0.8171913623809814,
            "weight_space_angle": 0.12524648010730743,
            "task_vector_magnitude_ratio": 12.480134963989258,
            "activation_l2_distance": -0.322563499212265,
            "activation_cosine_similarity": 3.6677989959716797,
            "activation_magnitude_ratio": -3.0699093341827393,
            "activation_dot_product": 10.60316276550293,
            "encoder_gradient_cosine_similarity": 4.848352909088135,
            "encoder_gradient_l2_distance": -17.00718879699707,
            "encoder_gradient_dot_product": -0.5588138103485107,
            "input_gradient_cosine_similarity": 2.8724069595336914,
            "input_gradient_l2_distance": -9.826242446899414,
            "input_gradient_dot_product": -8.954766273498535
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6805225528225028,
          "val_r": 0.641595200822922,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -1.4520230293273926,
            "effective_rank_mergeability_score": -0.26598110795021057,
            "stable_rank": -5.1679253578186035,
            "spectral_gap": 3.488807201385498,
            "singular_value_ratio": 8.008700370788574,
            "layerwise_effective_rank": -3.1059470176696777,
            "layerwise_effective_rank_mergeability_score": 0.6405285596847534,
            "task_vector_cosine_similarity": 6.40254545211792,
            "task_vector_l2_distance": -11.626130104064941,
            "task_vector_dot_product": 9.118964195251465,
            "weight_space_angle": 4.498887538909912,
            "task_vector_magnitude_ratio": 1.3584519624710083,
            "activation_l2_distance": 0.7339187860488892,
            "activation_cosine_similarity": 1.2133890390396118,
            "activation_magnitude_ratio": -1.6491811275482178,
            "activation_dot_product": 17.069087982177734,
            "encoder_gradient_cosine_similarity": 4.470393180847168,
            "encoder_gradient_l2_distance": -12.322340965270996,
            "encoder_gradient_dot_product": -0.13672377169132233,
            "input_gradient_cosine_similarity": 4.96412992477417,
            "input_gradient_l2_distance": -14.318805694580078,
            "input_gradient_dot_product": -10.923911094665527
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.5297484094928,
          "val_r": 0.5073161782653899,
          "n_iterations": 721,
          "coefficients": {
            "effective_rank": -162.93545532226562,
            "effective_rank_mergeability_score": -82.37456512451172,
            "stable_rank": -70.89096069335938,
            "spectral_gap": -75.96859741210938,
            "singular_value_ratio": 55.321571350097656,
            "layerwise_effective_rank": 264.1982727050781,
            "layerwise_effective_rank_mergeability_score": 156.35797119140625,
            "task_vector_cosine_similarity": 100.38443756103516,
            "task_vector_l2_distance": -21.06255340576172,
            "task_vector_dot_product": 213.5886993408203,
            "weight_space_angle": -83.89837646484375,
            "task_vector_magnitude_ratio": 4.382890224456787,
            "activation_l2_distance": -211.02577209472656,
            "activation_cosine_similarity": -2.1474545001983643,
            "activation_magnitude_ratio": -210.45419311523438,
            "activation_dot_product": 151.1349639892578,
            "encoder_gradient_cosine_similarity": 187.39608764648438,
            "encoder_gradient_l2_distance": -161.18675231933594,
            "encoder_gradient_dot_product": 157.78189086914062,
            "input_gradient_cosine_similarity": 50.71920394897461,
            "input_gradient_l2_distance": -37.20635986328125,
            "input_gradient_dot_product": -221.1171417236328
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.003931856678251495,
          "val_r": 0.09127026063280433,
          "n_iterations": 414,
          "coefficients": {
            "effective_rank": 460.442626953125,
            "effective_rank_mergeability_score": 712.1309814453125,
            "stable_rank": -243.30633544921875,
            "spectral_gap": -429.93133544921875,
            "singular_value_ratio": 293.56317138671875,
            "layerwise_effective_rank": -146.95289611816406,
            "layerwise_effective_rank_mergeability_score": 396.09423828125,
            "task_vector_cosine_similarity": 87.87913513183594,
            "task_vector_l2_distance": -351.7728271484375,
            "task_vector_dot_product": -45.89754867553711,
            "weight_space_angle": -40.94861602783203,
            "task_vector_magnitude_ratio": 738.4496459960938,
            "activation_l2_distance": 113.7435073852539,
            "activation_cosine_similarity": -25.376527786254883,
            "activation_magnitude_ratio": 46.33535385131836,
            "activation_dot_product": -196.68186950683594,
            "encoder_gradient_cosine_similarity": -289.23876953125,
            "encoder_gradient_l2_distance": 443.3898620605469,
            "encoder_gradient_dot_product": -644.1069946289062,
            "input_gradient_cosine_similarity": -306.2356872558594,
            "input_gradient_l2_distance": -444.0614013671875,
            "input_gradient_dot_product": -126.52117156982422
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5966765546063836,
          "val_r": 0.030085053410448787,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": -5.773185729980469,
            "effective_rank_mergeability_score": -13.762384414672852,
            "stable_rank": -92.1949234008789,
            "spectral_gap": -40.641048431396484,
            "singular_value_ratio": 16.54241943359375,
            "layerwise_effective_rank": 35.27704620361328,
            "layerwise_effective_rank_mergeability_score": 20.95935821533203,
            "task_vector_cosine_similarity": 53.92375946044922,
            "task_vector_l2_distance": -37.201290130615234,
            "task_vector_dot_product": -19.52410316467285,
            "weight_space_angle": -53.668975830078125,
            "task_vector_magnitude_ratio": 7.1351423263549805,
            "activation_l2_distance": 28.592666625976562,
            "activation_cosine_similarity": 32.80476379394531,
            "activation_magnitude_ratio": -30.34326171875,
            "activation_dot_product": 94.25540924072266,
            "encoder_gradient_cosine_similarity": 38.556800842285156,
            "encoder_gradient_l2_distance": -44.77205276489258,
            "encoder_gradient_dot_product": -48.1733512878418,
            "input_gradient_cosine_similarity": 41.01254653930664,
            "input_gradient_l2_distance": -19.22270965576172,
            "input_gradient_dot_product": 37.21578598022461
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.7542069227946022,
          "val_r": 0.24350064661915213,
          "n_iterations": 461,
          "coefficients": {
            "effective_rank": -0.12426590919494629,
            "effective_rank_mergeability_score": 0.15055862069129944,
            "stable_rank": 0.20181038975715637,
            "spectral_gap": -0.0335465632379055,
            "singular_value_ratio": 0.279875248670578,
            "layerwise_effective_rank": -0.10520857572555542,
            "layerwise_effective_rank_mergeability_score": -0.008172321133315563,
            "task_vector_cosine_similarity": 0.0707727000117302,
            "task_vector_l2_distance": -0.16496849060058594,
            "task_vector_dot_product": 0.20432499051094055,
            "weight_space_angle": 0.10335812717676163,
            "task_vector_magnitude_ratio": -0.25611796975135803,
            "activation_l2_distance": 0.5480182766914368,
            "activation_cosine_similarity": 0.6584582924842834,
            "activation_magnitude_ratio": 0.006974932737648487,
            "activation_dot_product": -0.06777205318212509,
            "encoder_gradient_cosine_similarity": 0.056088224053382874,
            "encoder_gradient_l2_distance": -0.27543899416923523,
            "encoder_gradient_dot_product": -0.026051292195916176,
            "input_gradient_cosine_similarity": 0.04165274649858475,
            "input_gradient_l2_distance": -0.21444399654865265,
            "input_gradient_dot_product": -0.0464903824031353
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.2943119588054739,
          "val_r": -0.20261207626554667,
          "n_iterations": 595,
          "coefficients": {
            "effective_rank": -21.779916763305664,
            "effective_rank_mergeability_score": -13.159993171691895,
            "stable_rank": -188.0994110107422,
            "spectral_gap": 129.45858764648438,
            "singular_value_ratio": 60.03900146484375,
            "layerwise_effective_rank": -138.46697998046875,
            "layerwise_effective_rank_mergeability_score": -227.4042510986328,
            "task_vector_cosine_similarity": -250.73326110839844,
            "task_vector_l2_distance": 45.25629806518555,
            "task_vector_dot_product": 116.31920623779297,
            "weight_space_angle": 164.7511749267578,
            "task_vector_magnitude_ratio": 110.08290100097656,
            "activation_l2_distance": 76.90904235839844,
            "activation_cosine_similarity": -198.67640686035156,
            "activation_magnitude_ratio": 110.74219512939453,
            "activation_dot_product": -34.729862213134766,
            "encoder_gradient_cosine_similarity": 130.0487060546875,
            "encoder_gradient_l2_distance": 91.38394927978516,
            "encoder_gradient_dot_product": 130.9420623779297,
            "input_gradient_cosine_similarity": 148.53652954101562,
            "input_gradient_l2_distance": -325.1041564941406,
            "input_gradient_dot_product": 84.68199920654297
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.2915619559982968,
          "val_r": 0.31991432736322767,
          "n_iterations": 496,
          "coefficients": {
            "effective_rank": -122.46147918701172,
            "effective_rank_mergeability_score": 50.72157669067383,
            "stable_rank": -63.10405349731445,
            "spectral_gap": -73.95372772216797,
            "singular_value_ratio": -56.18706130981445,
            "layerwise_effective_rank": 45.55643844604492,
            "layerwise_effective_rank_mergeability_score": -283.2310485839844,
            "task_vector_cosine_similarity": -40.75299072265625,
            "task_vector_l2_distance": 141.0513916015625,
            "task_vector_dot_product": 147.26930236816406,
            "weight_space_angle": -143.14657592773438,
            "task_vector_magnitude_ratio": -100.16131591796875,
            "activation_l2_distance": 174.2706756591797,
            "activation_cosine_similarity": 117.26646423339844,
            "activation_magnitude_ratio": 140.72442626953125,
            "activation_dot_product": -68.5719985961914,
            "encoder_gradient_cosine_similarity": 275.6909484863281,
            "encoder_gradient_l2_distance": -79.78544616699219,
            "encoder_gradient_dot_product": 48.738773345947266,
            "input_gradient_cosine_similarity": 97.25777435302734,
            "input_gradient_l2_distance": -219.60926818847656,
            "input_gradient_dot_product": 13.414176940917969
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.3124545273894275,
          "val_r": 0.18542335761656137,
          "n_iterations": 861,
          "coefficients": {
            "effective_rank": -327.1493835449219,
            "effective_rank_mergeability_score": -188.57044982910156,
            "stable_rank": -44.98722839355469,
            "spectral_gap": 77.7498550415039,
            "singular_value_ratio": 224.79971313476562,
            "layerwise_effective_rank": -92.7832260131836,
            "layerwise_effective_rank_mergeability_score": -111.82417297363281,
            "task_vector_cosine_similarity": 263.79754638671875,
            "task_vector_l2_distance": -237.79684448242188,
            "task_vector_dot_product": 271.4932861328125,
            "weight_space_angle": -183.5919189453125,
            "task_vector_magnitude_ratio": 181.87094116210938,
            "activation_l2_distance": 87.08587646484375,
            "activation_cosine_similarity": -41.59576416015625,
            "activation_magnitude_ratio": -238.3144073486328,
            "activation_dot_product": 101.65911102294922,
            "encoder_gradient_cosine_similarity": 185.50209045410156,
            "encoder_gradient_l2_distance": -87.02581024169922,
            "encoder_gradient_dot_product": -123.58011627197266,
            "input_gradient_cosine_similarity": 234.96934509277344,
            "input_gradient_l2_distance": 53.43426513671875,
            "input_gradient_dot_product": -4.1445207595825195
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.7479483218564886,
          "val_r": 0.5981065524536718,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 0.2371327131986618,
            "effective_rank_mergeability_score": 0.0242390725761652,
            "stable_rank": -0.12237421423196793,
            "spectral_gap": -0.0400029718875885,
            "singular_value_ratio": 0.3462737500667572,
            "layerwise_effective_rank": -0.04213166609406471,
            "layerwise_effective_rank_mergeability_score": 0.11886557191610336,
            "task_vector_cosine_similarity": 0.14832639694213867,
            "task_vector_l2_distance": -0.05506758764386177,
            "task_vector_dot_product": -0.07881398499011993,
            "weight_space_angle": -0.19861534237861633,
            "task_vector_magnitude_ratio": -0.33420178294181824,
            "activation_l2_distance": 0.6890080571174622,
            "activation_cosine_similarity": 0.7797138690948486,
            "activation_magnitude_ratio": 0.008410442620515823,
            "activation_dot_product": -0.09591100364923477,
            "encoder_gradient_cosine_similarity": 0.05840502679347992,
            "encoder_gradient_l2_distance": -0.22534023225307465,
            "encoder_gradient_dot_product": -0.027957117184996605,
            "input_gradient_cosine_similarity": 0.0381387397646904,
            "input_gradient_l2_distance": -0.1708085834980011,
            "input_gradient_dot_product": -0.06232370808720589
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7355025981748119,
          "val_r": 0.788144461569927,
          "n_iterations": 524,
          "coefficients": {
            "effective_rank": 0.6055701375007629,
            "effective_rank_mergeability_score": -0.15882427990436554,
            "stable_rank": -0.8840710520744324,
            "spectral_gap": -0.1479475200176239,
            "singular_value_ratio": 0.33525872230529785,
            "layerwise_effective_rank": 0.2505667507648468,
            "layerwise_effective_rank_mergeability_score": 0.39523452520370483,
            "task_vector_cosine_similarity": 0.24942485988140106,
            "task_vector_l2_distance": -0.14528891444206238,
            "task_vector_dot_product": 0.16178685426712036,
            "weight_space_angle": 0.24782101809978485,
            "task_vector_magnitude_ratio": -0.2532159984111786,
            "activation_l2_distance": 0.4015260338783264,
            "activation_cosine_similarity": 0.5484245419502258,
            "activation_magnitude_ratio": -0.010640530847012997,
            "activation_dot_product": -0.02820897102355957,
            "encoder_gradient_cosine_similarity": 0.048840124160051346,
            "encoder_gradient_l2_distance": -0.33320266008377075,
            "encoder_gradient_dot_product": -0.0350823849439621,
            "input_gradient_cosine_similarity": 0.018144497647881508,
            "input_gradient_l2_distance": -0.20479674637317657,
            "input_gradient_dot_product": -0.07146249711513519
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.14297509930968721,
          "val_r": 0.057574929742201714,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": -0.31477299332618713,
            "effective_rank_mergeability_score": 0.8208369612693787,
            "stable_rank": -0.7623541951179504,
            "spectral_gap": 0.437674343585968,
            "singular_value_ratio": 0.046748679131269455,
            "layerwise_effective_rank": 0.31609711050987244,
            "layerwise_effective_rank_mergeability_score": 0.4520571231842041,
            "task_vector_cosine_similarity": 1.0107792615890503,
            "task_vector_l2_distance": -0.4226069152355194,
            "task_vector_dot_product": 1.1185022592544556,
            "weight_space_angle": 0.07086968421936035,
            "task_vector_magnitude_ratio": -0.41757386922836304,
            "activation_l2_distance": -0.6784181594848633,
            "activation_cosine_similarity": 0.1138995885848999,
            "activation_magnitude_ratio": -0.34349626302719116,
            "activation_dot_product": 0.11872871220111847,
            "encoder_gradient_cosine_similarity": 0.05411722883582115,
            "encoder_gradient_l2_distance": 0.18688692152500153,
            "encoder_gradient_dot_product": 0.7240839600563049,
            "input_gradient_cosine_similarity": -1.2398725748062134,
            "input_gradient_l2_distance": 0.07660845667123795,
            "input_gradient_dot_product": -0.36346352100372314
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.6421093027127428,
          "val_r": 0.307580642063504,
          "n_iterations": 961,
          "coefficients": {
            "effective_rank": -27.220674514770508,
            "effective_rank_mergeability_score": 16.324604034423828,
            "stable_rank": 7.979809761047363,
            "spectral_gap": -4.927052974700928,
            "singular_value_ratio": 20.795141220092773,
            "layerwise_effective_rank": -9.472759246826172,
            "layerwise_effective_rank_mergeability_score": 9.297720909118652,
            "task_vector_cosine_similarity": 42.4770622253418,
            "task_vector_l2_distance": -31.867816925048828,
            "task_vector_dot_product": 39.63405990600586,
            "weight_space_angle": -30.27631950378418,
            "task_vector_magnitude_ratio": 8.325090408325195,
            "activation_l2_distance": -2.0526039600372314,
            "activation_cosine_similarity": 31.044069290161133,
            "activation_magnitude_ratio": -28.267515182495117,
            "activation_dot_product": 40.176876068115234,
            "encoder_gradient_cosine_similarity": 28.898149490356445,
            "encoder_gradient_l2_distance": -41.48698043823242,
            "encoder_gradient_dot_product": 4.322728633880615,
            "input_gradient_cosine_similarity": 23.999507904052734,
            "input_gradient_l2_distance": -39.72296905517578,
            "input_gradient_dot_product": -56.981746673583984
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": -0.31913276631971144,
          "val_r": -0.1955568131523215,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 38.576988220214844,
            "effective_rank_mergeability_score": -2.525904417037964,
            "stable_rank": -2.5189151763916016,
            "spectral_gap": 6.717258453369141,
            "singular_value_ratio": -4.930355548858643,
            "layerwise_effective_rank": -39.7415771484375,
            "layerwise_effective_rank_mergeability_score": -30.402835845947266,
            "task_vector_cosine_similarity": -46.41017532348633,
            "task_vector_l2_distance": -3.2263662815093994,
            "task_vector_dot_product": -46.26909255981445,
            "weight_space_angle": 63.73862838745117,
            "task_vector_magnitude_ratio": -45.989341735839844,
            "activation_l2_distance": 30.7739315032959,
            "activation_cosine_similarity": 31.86696434020996,
            "activation_magnitude_ratio": -44.924991607666016,
            "activation_dot_product": -44.105125427246094,
            "encoder_gradient_cosine_similarity": 28.55419921875,
            "encoder_gradient_l2_distance": 23.5854434967041,
            "encoder_gradient_dot_product": 21.652788162231445,
            "input_gradient_cosine_similarity": 28.37063980102539,
            "input_gradient_l2_distance": 23.905303955078125,
            "input_gradient_dot_product": 14.295334815979004
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5730087970460933,
          "val_r": 0.5050268241239677,
          "n_iterations": 656,
          "coefficients": {
            "effective_rank": -6.13053035736084,
            "effective_rank_mergeability_score": 4.0025224685668945,
            "stable_rank": 9.684576988220215,
            "spectral_gap": -7.388463020324707,
            "singular_value_ratio": 27.057693481445312,
            "layerwise_effective_rank": -51.81120681762695,
            "layerwise_effective_rank_mergeability_score": -20.373668670654297,
            "task_vector_cosine_similarity": 28.696434020996094,
            "task_vector_l2_distance": -0.6787588596343994,
            "task_vector_dot_product": 113.9786148071289,
            "weight_space_angle": -29.64109992980957,
            "task_vector_magnitude_ratio": -49.495182037353516,
            "activation_l2_distance": -30.726268768310547,
            "activation_cosine_similarity": 30.455106735229492,
            "activation_magnitude_ratio": -10.077750205993652,
            "activation_dot_product": 79.07794189453125,
            "encoder_gradient_cosine_similarity": 20.39826774597168,
            "encoder_gradient_l2_distance": -99.04806518554688,
            "encoder_gradient_dot_product": -8.77365493774414,
            "input_gradient_cosine_similarity": 53.791568756103516,
            "input_gradient_l2_distance": -14.37897777557373,
            "input_gradient_dot_product": -37.62146759033203
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.6787545040585448,
          "val_r": 0.5273134110997005,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 5.627866268157959,
            "effective_rank_mergeability_score": 6.205799102783203,
            "stable_rank": -5.9042792320251465,
            "spectral_gap": 4.225013256072998,
            "singular_value_ratio": 1.5865910053253174,
            "layerwise_effective_rank": -6.338498115539551,
            "layerwise_effective_rank_mergeability_score": -6.204732894897461,
            "task_vector_cosine_similarity": 19.255653381347656,
            "task_vector_l2_distance": -2.184088706970215,
            "task_vector_dot_product": -15.629992485046387,
            "weight_space_angle": -2.453291654586792,
            "task_vector_magnitude_ratio": 8.718740463256836,
            "activation_l2_distance": 2.10265851020813,
            "activation_cosine_similarity": 6.611632823944092,
            "activation_magnitude_ratio": -1.2638654708862305,
            "activation_dot_product": 9.181187629699707,
            "encoder_gradient_cosine_similarity": 2.21889591217041,
            "encoder_gradient_l2_distance": -7.888227939605713,
            "encoder_gradient_dot_product": 0.6486199498176575,
            "input_gradient_cosine_similarity": 4.539358139038086,
            "input_gradient_l2_distance": -18.694395065307617,
            "input_gradient_dot_product": -3.361841917037964
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.7360754429499452,
          "val_r": 0.44882678224403294,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 24.08588218688965,
            "effective_rank_mergeability_score": 26.476839065551758,
            "stable_rank": -15.517219543457031,
            "spectral_gap": -11.499252319335938,
            "singular_value_ratio": -15.389694213867188,
            "layerwise_effective_rank": 20.938182830810547,
            "layerwise_effective_rank_mergeability_score": 12.686118125915527,
            "task_vector_cosine_similarity": 46.04654312133789,
            "task_vector_l2_distance": -26.101184844970703,
            "task_vector_dot_product": -9.745064735412598,
            "weight_space_angle": -23.368749618530273,
            "task_vector_magnitude_ratio": 10.823453903198242,
            "activation_l2_distance": -3.9506189823150635,
            "activation_cosine_similarity": 32.99980926513672,
            "activation_magnitude_ratio": -29.191734313964844,
            "activation_dot_product": 12.271684646606445,
            "encoder_gradient_cosine_similarity": 14.384653091430664,
            "encoder_gradient_l2_distance": -4.2748026847839355,
            "encoder_gradient_dot_product": 13.880173683166504,
            "input_gradient_cosine_similarity": 22.988168716430664,
            "input_gradient_l2_distance": -72.01683807373047,
            "input_gradient_dot_product": -25.527856826782227
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    },
    "isotropic": {
      "aggregate_metrics": {
        "train_r": 0.08872492019430087,
        "train_p": 4.552822674513971e-07,
        "val_r": 0.024868989864025123,
        "val_p": 0.6390908612707774
      },
      "per_fold_stats": {
        "train_r_mean": 0.25677858233075146,
        "train_r_std": 0.15588662091747357,
        "val_r_mean": 0.16483813788403423,
        "val_r_std": 0.2302128065569296
      },
      "average_coefficients": {
        "effective_rank": -10.80048942565918,
        "effective_rank_mergeability_score": -6.478586673736572,
        "stable_rank": 1.3593772649765015,
        "spectral_gap": 4.041551113128662,
        "singular_value_ratio": 9.968103408813477,
        "layerwise_effective_rank": 3.6772568225860596,
        "layerwise_effective_rank_mergeability_score": 26.155597686767578,
        "task_vector_cosine_similarity": 25.824661254882812,
        "task_vector_l2_distance": -9.518388748168945,
        "task_vector_dot_product": 20.27986717224121,
        "weight_space_angle": -33.73535919189453,
        "task_vector_magnitude_ratio": 3.848508358001709,
        "activation_l2_distance": -3.6844191551208496,
        "activation_cosine_similarity": 32.29011535644531,
        "activation_magnitude_ratio": 37.90198516845703,
        "activation_dot_product": -48.47354507446289,
        "encoder_gradient_cosine_similarity": 21.530977249145508,
        "encoder_gradient_l2_distance": -32.021461486816406,
        "encoder_gradient_dot_product": 32.019954681396484,
        "input_gradient_cosine_similarity": 7.986054420471191,
        "input_gradient_l2_distance": -69.92407989501953,
        "input_gradient_dot_product": -11.251485824584961
      },
      "coefficient_std": {
        "effective_rank": 20.556961059570312,
        "effective_rank_mergeability_score": 71.43891143798828,
        "stable_rank": 37.77174377441406,
        "spectral_gap": 48.42186737060547,
        "singular_value_ratio": 50.678585052490234,
        "layerwise_effective_rank": 53.10415267944336,
        "layerwise_effective_rank_mergeability_score": 51.12163162231445,
        "task_vector_cosine_similarity": 33.73120880126953,
        "task_vector_l2_distance": 37.87248611450195,
        "task_vector_dot_product": 32.0881233215332,
        "weight_space_angle": 48.09120559692383,
        "task_vector_magnitude_ratio": 33.026302337646484,
        "activation_l2_distance": 55.54478454589844,
        "activation_cosine_similarity": 56.498836517333984,
        "activation_magnitude_ratio": 128.53671264648438,
        "activation_dot_product": 56.62746047973633,
        "encoder_gradient_cosine_similarity": 38.40305709838867,
        "encoder_gradient_l2_distance": 33.630165100097656,
        "encoder_gradient_dot_product": 40.79428482055664,
        "input_gradient_cosine_similarity": 34.76774215698242,
        "input_gradient_l2_distance": 115.29247283935547,
        "input_gradient_dot_product": 61.867576599121094
      },
      "fold_results": [
        {
          "fold": 0,
          "held_out_task": "SUN397",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.26035486434525507,
          "val_r": 0.3837354747480434,
          "n_iterations": 691,
          "coefficients": {
            "effective_rank": -9.379380226135254,
            "effective_rank_mergeability_score": 33.258975982666016,
            "stable_rank": -42.218753814697266,
            "spectral_gap": -18.423826217651367,
            "singular_value_ratio": -93.44426727294922,
            "layerwise_effective_rank": 166.7705078125,
            "layerwise_effective_rank_mergeability_score": 117.4383544921875,
            "task_vector_cosine_similarity": -5.997125148773193,
            "task_vector_l2_distance": -60.20436096191406,
            "task_vector_dot_product": 82.88141632080078,
            "weight_space_angle": -81.17196655273438,
            "task_vector_magnitude_ratio": 63.56058883666992,
            "activation_l2_distance": -75.66233825683594,
            "activation_cosine_similarity": 55.14962387084961,
            "activation_magnitude_ratio": -71.43194580078125,
            "activation_dot_product": -102.56514739990234,
            "encoder_gradient_cosine_similarity": 74.87606048583984,
            "encoder_gradient_l2_distance": -37.05782699584961,
            "encoder_gradient_dot_product": 75.28214263916016,
            "input_gradient_cosine_similarity": 67.98141479492188,
            "input_gradient_l2_distance": -52.65443801879883,
            "input_gradient_dot_product": -85.99004364013672
          }
        },
        {
          "fold": 1,
          "held_out_task": "Cars",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.3956059949189469,
          "val_r": 0.19655810365561469,
          "n_iterations": 716,
          "coefficients": {
            "effective_rank": 3.5524613857269287,
            "effective_rank_mergeability_score": 8.307768821716309,
            "stable_rank": 4.002786159515381,
            "spectral_gap": 2.576845169067383,
            "singular_value_ratio": -4.766049861907959,
            "layerwise_effective_rank": 7.755194187164307,
            "layerwise_effective_rank_mergeability_score": 3.5147924423217773,
            "task_vector_cosine_similarity": 1.2830075025558472,
            "task_vector_l2_distance": -0.8977473974227905,
            "task_vector_dot_product": 1.5666910409927368,
            "weight_space_angle": -0.8586974740028381,
            "task_vector_magnitude_ratio": 2.2377586364746094,
            "activation_l2_distance": -7.590982437133789,
            "activation_cosine_similarity": 1.2974430322647095,
            "activation_magnitude_ratio": -1.3527358770370483,
            "activation_dot_product": -8.309470176696777,
            "encoder_gradient_cosine_similarity": -0.5103645920753479,
            "encoder_gradient_l2_distance": -6.594935894012451,
            "encoder_gradient_dot_product": 4.190763473510742,
            "input_gradient_cosine_similarity": 0.8515767455101013,
            "input_gradient_l2_distance": -6.887408256530762,
            "input_gradient_dot_product": -2.370262622833252
          }
        },
        {
          "fold": 2,
          "held_out_task": "RESISC45",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.36080676654172655,
          "val_r": 0.39868655080121806,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 12.32761001586914,
            "effective_rank_mergeability_score": -0.4845329821109772,
            "stable_rank": -7.716809272766113,
            "spectral_gap": 10.672194480895996,
            "singular_value_ratio": -3.2863049507141113,
            "layerwise_effective_rank": 10.836698532104492,
            "layerwise_effective_rank_mergeability_score": 6.700889587402344,
            "task_vector_cosine_similarity": 6.884379863739014,
            "task_vector_l2_distance": -11.308721542358398,
            "task_vector_dot_product": 16.416400909423828,
            "weight_space_angle": 6.403611660003662,
            "task_vector_magnitude_ratio": -5.233791351318359,
            "activation_l2_distance": 4.385684490203857,
            "activation_cosine_similarity": 26.27412986755371,
            "activation_magnitude_ratio": 0.2369871288537979,
            "activation_dot_product": -25.702423095703125,
            "encoder_gradient_cosine_similarity": -0.4003746509552002,
            "encoder_gradient_l2_distance": -25.871788024902344,
            "encoder_gradient_dot_product": 13.81275749206543,
            "input_gradient_cosine_similarity": 3.666515350341797,
            "input_gradient_l2_distance": -25.97797393798828,
            "input_gradient_dot_product": -11.636483192443848
          }
        },
        {
          "fold": 3,
          "held_out_task": "EuroSAT",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.15432945497111938,
          "val_r": 0.37115587221327456,
          "n_iterations": 603,
          "coefficients": {
            "effective_rank": -42.01506423950195,
            "effective_rank_mergeability_score": -156.0621337890625,
            "stable_rank": 61.52558517456055,
            "spectral_gap": 143.9169921875,
            "singular_value_ratio": -22.097110748291016,
            "layerwise_effective_rank": 34.240882873535156,
            "layerwise_effective_rank_mergeability_score": 70.55458068847656,
            "task_vector_cosine_similarity": 53.730777740478516,
            "task_vector_l2_distance": -29.733558654785156,
            "task_vector_dot_product": -11.954333305358887,
            "weight_space_angle": -112.3812026977539,
            "task_vector_magnitude_ratio": -37.08302688598633,
            "activation_l2_distance": -23.109939575195312,
            "activation_cosine_similarity": 111.98150634765625,
            "activation_magnitude_ratio": 184.51222229003906,
            "activation_dot_product": -19.680185317993164,
            "encoder_gradient_cosine_similarity": 56.0048828125,
            "encoder_gradient_l2_distance": -54.12747573852539,
            "encoder_gradient_dot_product": -70.21294403076172,
            "input_gradient_cosine_similarity": -35.178016662597656,
            "input_gradient_l2_distance": -198.51068115234375,
            "input_gradient_dot_product": 96.6758041381836
          }
        },
        {
          "fold": 4,
          "held_out_task": "SVHN",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.257010269101957,
          "val_r": 0.21973852412243672,
          "n_iterations": 501,
          "coefficients": {
            "effective_rank": -2.304438829421997,
            "effective_rank_mergeability_score": 36.34036636352539,
            "stable_rank": 31.53438949584961,
            "spectral_gap": 5.685209274291992,
            "singular_value_ratio": -17.679048538208008,
            "layerwise_effective_rank": 17.120925903320312,
            "layerwise_effective_rank_mergeability_score": -13.319721221923828,
            "task_vector_cosine_similarity": 20.295503616333008,
            "task_vector_l2_distance": 52.26874542236328,
            "task_vector_dot_product": 26.30342674255371,
            "weight_space_angle": -22.345388412475586,
            "task_vector_magnitude_ratio": -56.122371673583984,
            "activation_l2_distance": -65.13882446289062,
            "activation_cosine_similarity": 46.18889236450195,
            "activation_magnitude_ratio": 44.01821517944336,
            "activation_dot_product": -31.037628173828125,
            "encoder_gradient_cosine_similarity": 2.8889362812042236,
            "encoder_gradient_l2_distance": -43.88055419921875,
            "encoder_gradient_dot_product": 29.312654495239258,
            "input_gradient_cosine_similarity": 42.02341842651367,
            "input_gradient_l2_distance": -80.9242172241211,
            "input_gradient_dot_product": -20.231597900390625
          }
        },
        {
          "fold": 5,
          "held_out_task": "GTSRB",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.2572694119313133,
          "val_r": 0.31923322227178963,
          "n_iterations": 588,
          "coefficients": {
            "effective_rank": -19.795656204223633,
            "effective_rank_mergeability_score": 50.803104400634766,
            "stable_rank": 1.0877180099487305,
            "spectral_gap": 1.9959293603897095,
            "singular_value_ratio": 21.425302505493164,
            "layerwise_effective_rank": -54.41064453125,
            "layerwise_effective_rank_mergeability_score": -18.775615692138672,
            "task_vector_cosine_similarity": 16.634977340698242,
            "task_vector_l2_distance": -18.609264373779297,
            "task_vector_dot_product": 17.466373443603516,
            "weight_space_angle": -2.457412004470825,
            "task_vector_magnitude_ratio": 29.201616287231445,
            "activation_l2_distance": -29.976205825805664,
            "activation_cosine_similarity": 37.813697814941406,
            "activation_magnitude_ratio": 13.071243286132812,
            "activation_dot_product": 12.121170043945312,
            "encoder_gradient_cosine_similarity": 40.876468658447266,
            "encoder_gradient_l2_distance": -6.451660633087158,
            "encoder_gradient_dot_product": 33.16566848754883,
            "input_gradient_cosine_similarity": 10.29902172088623,
            "input_gradient_l2_distance": -101.67066192626953,
            "input_gradient_dot_product": -32.81783676147461
          }
        },
        {
          "fold": 6,
          "held_out_task": "MNIST",
          "n_train_pairs": 164,
          "n_val_pairs": 15,
          "train_r": 0.461250594533448,
          "val_r": -0.2035103088196885,
          "n_iterations": 1000,
          "coefficients": {
            "effective_rank": 13.735724449157715,
            "effective_rank_mergeability_score": -12.735374450683594,
            "stable_rank": -33.18803787231445,
            "spectral_gap": 34.506370544433594,
            "singular_value_ratio": 10.161706924438477,
            "layerwise_effective_rank": 12.053010940551758,
            "layerwise_effective_rank_mergeability_score": 13.864381790161133,
            "task_vector_cosine_similarity": -9.723039627075195,
            "task_vector_l2_distance": -16.663713455200195,
            "task_vector_dot_product": 12.861859321594238,
            "weight_space_angle": 6.3721160888671875,
            "task_vector_magnitude_ratio": 21.643253326416016,
            "activation_l2_distance": -11.467597007751465,
            "activation_cosine_similarity": 22.657970428466797,
            "activation_magnitude_ratio": 17.87261390686035,
            "activation_dot_product": -35.135921478271484,
            "encoder_gradient_cosine_similarity": 10.208192825317383,
            "encoder_gradient_l2_distance": -33.18538284301758,
            "encoder_gradient_dot_product": 31.134485244750977,
            "input_gradient_cosine_similarity": -3.235677719116211,
            "input_gradient_l2_distance": -26.91900634765625,
            "input_gradient_dot_product": -23.81943130493164
          }
        },
        {
          "fold": 7,
          "held_out_task": "DTD",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.2672464289518627,
          "val_r": -0.22635007759635523,
          "n_iterations": 493,
          "coefficients": {
            "effective_rank": -19.438758850097656,
            "effective_rank_mergeability_score": 14.83936882019043,
            "stable_rank": -40.31891632080078,
            "spectral_gap": -5.01287841796875,
            "singular_value_ratio": 23.008607864379883,
            "layerwise_effective_rank": 32.21460723876953,
            "layerwise_effective_rank_mergeability_score": 22.898473739624023,
            "task_vector_cosine_similarity": 28.95951271057129,
            "task_vector_l2_distance": -45.87144088745117,
            "task_vector_dot_product": 43.585845947265625,
            "weight_space_angle": -23.830524444580078,
            "task_vector_magnitude_ratio": -0.2853022515773773,
            "activation_l2_distance": -32.168670654296875,
            "activation_cosine_similarity": 32.1949462890625,
            "activation_magnitude_ratio": -1.0812760591506958,
            "activation_dot_product": -40.17976379394531,
            "encoder_gradient_cosine_similarity": 23.270877838134766,
            "encoder_gradient_l2_distance": -66.94290161132812,
            "encoder_gradient_dot_product": 5.470191478729248,
            "input_gradient_cosine_similarity": 43.38280487060547,
            "input_gradient_l2_distance": -11.150717735290527,
            "input_gradient_dot_product": 17.45275115966797
          }
        },
        {
          "fold": 8,
          "held_out_task": "Flowers102",
          "n_train_pairs": 163,
          "n_val_pairs": 16,
          "train_r": 0.24380436494383645,
          "val_r": -0.394515548301132,
          "n_iterations": 885,
          "coefficients": {
            "effective_rank": 9.771594047546387,
            "effective_rank_mergeability_score": -5.036811351776123,
            "stable_rank": -69.5433120727539,
            "spectral_gap": -18.335763931274414,
            "singular_value_ratio": 13.579228401184082,
            "layerwise_effective_rank": -79.7848892211914,
            "layerwise_effective_rank_mergeability_score": 13.139817237854004,
            "task_vector_cosine_similarity": 44.586997985839844,
            "task_vector_l2_distance": -26.655609130859375,
            "task_vector_dot_product": 7.02794885635376,
            "weight_space_angle": -54.945003509521484,
            "task_vector_magnitude_ratio": 1.7581331729888916,
            "activation_l2_distance": 53.58051681518555,
            "activation_cosine_similarity": 90.36537170410156,
            "activation_magnitude_ratio": -1.7269307374954224,
            "activation_dot_product": -53.93113327026367,
            "encoder_gradient_cosine_similarity": 135.5409698486328,
            "encoder_gradient_l2_distance": -97.95687103271484,
            "encoder_gradient_dot_product": 39.07370376586914,
            "input_gradient_cosine_similarity": 13.467183113098145,
            "input_gradient_l2_distance": -10.429537773132324,
            "input_gradient_dot_product": -2.5475971698760986
          }
        },
        {
          "fold": 9,
          "held_out_task": "PCAM",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.03817246519827602,
          "val_r": 0.08118719798434594,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 0.5738957524299622,
            "effective_rank_mergeability_score": 2.8444552421569824,
            "stable_rank": -2.074944257736206,
            "spectral_gap": 3.054564952850342,
            "singular_value_ratio": 1.55677330493927,
            "layerwise_effective_rank": -1.0399295091629028,
            "layerwise_effective_rank_mergeability_score": -0.47284403443336487,
            "task_vector_cosine_similarity": 4.958956241607666,
            "task_vector_l2_distance": 0.05471362918615341,
            "task_vector_dot_product": -0.6067521572113037,
            "weight_space_angle": -6.674012184143066,
            "task_vector_magnitude_ratio": 1.9768409729003906,
            "activation_l2_distance": -1.0860674381256104,
            "activation_cosine_similarity": -0.6448934674263,
            "activation_magnitude_ratio": -0.020432135090231895,
            "activation_dot_product": -1.6259827613830566,
            "encoder_gradient_cosine_similarity": -4.736143112182617,
            "encoder_gradient_l2_distance": -1.5387176275253296,
            "encoder_gradient_dot_product": 1.6308043003082275,
            "input_gradient_cosine_similarity": 1.1442235708236694,
            "input_gradient_l2_distance": 4.518240928649902,
            "input_gradient_dot_product": -0.7995033264160156
          }
        },
        {
          "fold": 10,
          "held_out_task": "FER2013",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.019260567128470622,
          "val_r": 0.11538517624300004,
          "n_iterations": 410,
          "coefficients": {
            "effective_rank": -1.7426605224609375,
            "effective_rank_mergeability_score": -235.68560791015625,
            "stable_rank": 48.961158752441406,
            "spectral_gap": -128.84185791015625,
            "singular_value_ratio": 191.7373809814453,
            "layerwise_effective_rank": -99.08219146728516,
            "layerwise_effective_rank_mergeability_score": 187.78640747070312,
            "task_vector_cosine_similarity": 124.40535736083984,
            "task_vector_l2_distance": 25.891637802124023,
            "task_vector_dot_product": -54.96097946166992,
            "weight_space_angle": -169.13143920898438,
            "task_vector_magnitude_ratio": 90.24247741699219,
            "activation_l2_distance": 179.7671661376953,
            "activation_cosine_similarity": -165.52894592285156,
            "activation_magnitude_ratio": 559.1296997070312,
            "activation_dot_product": -233.97032165527344,
            "encoder_gradient_cosine_similarity": -62.88045120239258,
            "encoder_gradient_l2_distance": 39.54617691040039,
            "encoder_gradient_dot_product": 139.5505828857422,
            "input_gradient_cosine_similarity": -109.69853210449219,
            "input_gradient_l2_distance": -523.9965209960938,
            "input_gradient_dot_product": 199.4980926513672
          }
        },
        {
          "fold": 11,
          "held_out_task": "OxfordIIITPet",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.27245061762696,
          "val_r": 0.2637488589642212,
          "n_iterations": 438,
          "coefficients": {
            "effective_rank": 3.833472728729248,
            "effective_rank_mergeability_score": -6.022435665130615,
            "stable_rank": 1.2280066013336182,
            "spectral_gap": 59.012996673583984,
            "singular_value_ratio": -17.539398193359375,
            "layerwise_effective_rank": -13.08182144165039,
            "layerwise_effective_rank_mergeability_score": -18.612701416015625,
            "task_vector_cosine_similarity": -3.025402784347534,
            "task_vector_l2_distance": -11.572588920593262,
            "task_vector_dot_product": 21.56768798828125,
            "weight_space_angle": -15.273694038391113,
            "task_vector_magnitude_ratio": 30.94744300842285,
            "activation_l2_distance": -17.463722229003906,
            "activation_cosine_similarity": 6.067774772644043,
            "activation_magnitude_ratio": 33.494056701660156,
            "activation_dot_product": -9.244593620300293,
            "encoder_gradient_cosine_similarity": 40.08864974975586,
            "encoder_gradient_l2_distance": -69.0750961303711,
            "encoder_gradient_dot_product": 56.95918655395508,
            "input_gradient_cosine_similarity": 23.515073776245117,
            "input_gradient_l2_distance": -34.71204376220703,
            "input_gradient_dot_product": -60.09419250488281
          }
        },
        {
          "fold": 12,
          "held_out_task": "STL10",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": -0.020407105194264308,
          "val_r": 0.02880541506430536,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 3.9555532932281494,
            "effective_rank_mergeability_score": 3.240473747253418,
            "stable_rank": -0.30727148056030273,
            "spectral_gap": -5.984139442443848,
            "singular_value_ratio": 7.445952415466309,
            "layerwise_effective_rank": -18.229938507080078,
            "layerwise_effective_rank_mergeability_score": -3.658081531524658,
            "task_vector_cosine_similarity": 20.420270919799805,
            "task_vector_l2_distance": -9.194098472595215,
            "task_vector_dot_product": -2.8897695541381836,
            "weight_space_angle": -4.54027795791626,
            "task_vector_magnitude_ratio": 3.447073221206665,
            "activation_l2_distance": -3.3152966499328613,
            "activation_cosine_similarity": 4.336251735687256,
            "activation_magnitude_ratio": -16.116147994995117,
            "activation_dot_product": 1.8457907438278198,
            "encoder_gradient_cosine_similarity": 18.13555908203125,
            "encoder_gradient_l2_distance": -2.094114065170288,
            "encoder_gradient_dot_product": 2.7138280868530273,
            "input_gradient_cosine_similarity": -14.476668357849121,
            "input_gradient_l2_distance": 11.919195175170898,
            "input_gradient_dot_product": 4.332502365112305
          }
        },
        {
          "fold": 13,
          "held_out_task": "CIFAR100",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.20955612821794461,
          "val_r": 0.36685588836299526,
          "n_iterations": 704,
          "coefficients": {
            "effective_rank": 0.32297399640083313,
            "effective_rank_mergeability_score": -8.489228248596191,
            "stable_rank": -34.247413635253906,
            "spectral_gap": -48.067138671875,
            "singular_value_ratio": -10.626395225524902,
            "layerwise_effective_rank": -58.06534957885742,
            "layerwise_effective_rank_mergeability_score": 37.668827056884766,
            "task_vector_cosine_similarity": 65.498291015625,
            "task_vector_l2_distance": 57.998714447021484,
            "task_vector_dot_product": 20.528844833374023,
            "weight_space_angle": -67.1917953491211,
            "task_vector_magnitude_ratio": -29.847131729125977,
            "activation_l2_distance": 56.098304748535156,
            "activation_cosine_similarity": 95.7363052368164,
            "activation_magnitude_ratio": 48.683021545410156,
            "activation_dot_product": -49.25899887084961,
            "encoder_gradient_cosine_similarity": 37.460575103759766,
            "encoder_gradient_l2_distance": 0.2547230124473572,
            "encoder_gradient_dot_product": 58.00896072387695,
            "input_gradient_cosine_similarity": 35.41811752319336,
            "input_gradient_l2_distance": -127.51475524902344,
            "input_gradient_dot_product": -79.37175750732422
          }
        },
        {
          "fold": 14,
          "held_out_task": "CIFAR10",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": -0.004693390373420724,
          "val_r": 0.010406806917417728,
          "n_iterations": 51,
          "coefficients": {
            "effective_rank": 4.511791229248047,
            "effective_rank_mergeability_score": 3.8159019947052,
            "stable_rank": -1.6044986248016357,
            "spectral_gap": -2.5327956676483154,
            "singular_value_ratio": -6.9497971534729,
            "layerwise_effective_rank": 2.4426581859588623,
            "layerwise_effective_rank_mergeability_score": 5.23329496383667,
            "task_vector_cosine_similarity": -1.5423955917358398,
            "task_vector_l2_distance": 7.563510894775391,
            "task_vector_dot_product": -2.087329864501953,
            "weight_space_angle": 6.2532429695129395,
            "task_vector_magnitude_ratio": -4.305060386657715,
            "activation_l2_distance": -4.050480842590332,
            "activation_cosine_similarity": -0.8174546957015991,
            "activation_magnitude_ratio": -3.6251256465911865,
            "activation_dot_product": -3.7430260181427,
            "encoder_gradient_cosine_similarity": 1.2743607759475708,
            "encoder_gradient_l2_distance": 6.372336387634277,
            "encoder_gradient_dot_product": -3.97990083694458,
            "input_gradient_cosine_similarity": -2.496690273284912,
            "input_gradient_l2_distance": 9.4553861618042,
            "input_gradient_dot_product": -8.204654693603516
          }
        },
        {
          "fold": 15,
          "held_out_task": "Food101",
          "n_train_pairs": 162,
          "n_val_pairs": 17,
          "train_r": 0.41569896931591377,
          "val_r": 0.27365173391746855,
          "n_iterations": 858,
          "coefficients": {
            "effective_rank": -39.84418869018555,
            "effective_rank_mergeability_score": 41.2624626159668,
            "stable_rank": 21.624631881713867,
            "spectral_gap": 10.468597412109375,
            "singular_value_ratio": 14.446237564086914,
            "layerwise_effective_rank": 36.09855651855469,
            "layerwise_effective_rank_mergeability_score": -38.53248977661133,
            "task_vector_cosine_similarity": 80.08833312988281,
            "task_vector_l2_distance": -102.29661560058594,
            "task_vector_dot_product": 102.36444091796875,
            "weight_space_angle": 37.89522933959961,
            "task_vector_magnitude_ratio": -39.362884521484375,
            "activation_l2_distance": 17.524290084838867,
            "activation_cosine_similarity": 50.127960205078125,
            "activation_magnitude_ratio": -12.264843940734863,
            "activation_dot_product": -110.61964416503906,
            "encoder_gradient_cosine_similarity": -10.90197467803955,
            "encoder_gradient_l2_distance": -42.73036575317383,
            "encoder_gradient_dot_product": 54.701934814453125,
            "input_gradient_cosine_similarity": 11.276738166809082,
            "input_gradient_l2_distance": -55.93640899658203,
            "input_gradient_dot_product": -24.39179801940918
          }
        },
        {
          "fold": 16,
          "held_out_task": "FashionMNIST",
          "n_train_pairs": 160,
          "n_val_pairs": 19,
          "train_r": 0.3200294817368204,
          "val_r": 0.17328606763108167,
          "n_iterations": 820,
          "coefficients": {
            "effective_rank": -27.825143814086914,
            "effective_rank_mergeability_score": 28.371234893798828,
            "stable_rank": 32.53577423095703,
            "spectral_gap": 10.32785701751709,
            "singular_value_ratio": 20.62294578552246,
            "layerwise_effective_rank": 15.691804885864258,
            "layerwise_effective_rank_mergeability_score": 27.490625381469727,
            "task_vector_cosine_similarity": 50.29215621948242,
            "task_vector_l2_distance": -27.438148498535156,
            "task_vector_dot_product": 25.832990646362305,
            "weight_space_angle": -40.1937370300293,
            "task_vector_magnitude_ratio": -0.19319815933704376,
            "activation_l2_distance": -10.519682884216309,
            "activation_cosine_similarity": 72.9981918334961,
            "activation_magnitude_ratio": -18.378686904907227,
            "activation_dot_product": -101.4349594116211,
            "encoder_gradient_cosine_similarity": 24.24278450012207,
            "encoder_gradient_l2_distance": -41.47803497314453,
            "encoder_gradient_dot_product": 43.1351432800293,
            "input_gradient_cosine_similarity": 25.55318260192871,
            "input_gradient_l2_distance": -54.95563507080078,
            "input_gradient_dot_product": -53.679351806640625
          }
        },
        {
          "fold": 17,
          "held_out_task": "EMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.37859523892155955,
          "val_r": 0.24821875236560292,
          "n_iterations": 648,
          "coefficients": {
            "effective_rank": -3.6004478931427,
            "effective_rank_mergeability_score": -13.894882202148438,
            "stable_rank": -0.1687500774860382,
            "spectral_gap": 20.701202392578125,
            "singular_value_ratio": -8.647724151611328,
            "layerwise_effective_rank": 20.166980743408203,
            "layerwise_effective_rank_mergeability_score": 22.893138885498047,
            "task_vector_cosine_similarity": -5.568740367889404,
            "task_vector_l2_distance": -7.29757833480835,
            "task_vector_dot_product": 35.94725036621094,
            "weight_space_angle": -0.9030632376670837,
            "task_vector_magnitude_ratio": 6.254164218902588,
            "activation_l2_distance": -22.158916473388672,
            "activation_cosine_similarity": 20.879972457885742,
            "activation_magnitude_ratio": 8.05013656616211,
            "activation_dot_product": -44.48179244995117,
            "encoder_gradient_cosine_similarity": 6.113077163696289,
            "encoder_gradient_l2_distance": -17.33171272277832,
            "encoder_gradient_dot_product": 28.36349868774414,
            "input_gradient_cosine_similarity": 19.926755905151367,
            "input_gradient_l2_distance": -30.541868209838867,
            "input_gradient_dot_product": -33.70298767089844
          }
        },
        {
          "fold": 18,
          "held_out_task": "KMNIST",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.5843177380683563,
          "val_r": 0.56547749234015,
          "n_iterations": 848,
          "coefficients": {
            "effective_rank": -53.605403900146484,
            "effective_rank_mergeability_score": -31.29422378540039,
            "stable_rank": -33.97666549682617,
            "spectral_gap": 28.605361938476562,
            "singular_value_ratio": 14.914342880249023,
            "layerwise_effective_rank": 30.296066284179688,
            "layerwise_effective_rank_mergeability_score": 11.561715126037598,
            "task_vector_cosine_similarity": 15.511406898498535,
            "task_vector_l2_distance": 58.90272903442383,
            "task_vector_dot_product": 35.909461975097656,
            "weight_space_angle": -46.180747985839844,
            "task_vector_magnitude_ratio": 15.984819412231445,
            "activation_l2_distance": 16.112770080566406,
            "activation_cosine_similarity": 86.98771667480469,
            "activation_magnitude_ratio": -25.295717239379883,
            "activation_dot_product": -8.749300956726074,
            "encoder_gradient_cosine_similarity": 3.667642593383789,
            "encoder_gradient_l2_distance": -48.96818923950195,
            "encoder_gradient_dot_product": 18.052900314331055,
            "input_gradient_cosine_similarity": 8.099178314208984,
            "input_gradient_l2_distance": -50.549072265625,
            "input_gradient_dot_product": -44.988685607910156
          }
        },
        {
          "fold": 19,
          "held_out_task": "RenderedSST2",
          "n_train_pairs": 161,
          "n_val_pairs": 18,
          "train_r": 0.26491278572894705,
          "val_r": 0.1050075547948946,
          "n_iterations": 704,
          "coefficients": {
            "effective_rank": -49.043739318847656,
            "effective_rank_mergeability_score": 117.04937744140625,
            "stable_rank": 90.05286407470703,
            "spectral_gap": -23.49470329284668,
            "singular_value_ratio": 65.49968719482422,
            "layerwise_effective_rank": 11.552010536193848,
            "layerwise_effective_rank_mergeability_score": 75.73809051513672,
            "task_vector_cosine_similarity": 8.799942016601562,
            "task_vector_l2_distance": -25.30438232421875,
            "task_vector_dot_product": 27.835893630981445,
            "weight_space_angle": -83.55245208740234,
            "task_vector_magnitude_ratio": -17.851238250732422,
            "activation_l2_distance": -97.44840240478516,
            "activation_cosine_similarity": 51.735862731933594,
            "activation_magnitude_ratio": 0.265252023935318,
            "activation_dot_product": -103.7675552368164,
            "encoder_gradient_cosine_similarity": 35.399879455566406,
            "encoder_gradient_l2_distance": -91.31675720214844,
            "encoder_gradient_dot_product": 80.03263854980469,
            "input_gradient_cosine_similarity": 18.201465606689453,
            "input_gradient_l2_distance": -31.04338836669922,
            "input_gradient_dot_product": -58.34267807006836
          }
        }
      ],
      "optimization_params": {
        "n_iterations": 1000,
        "learning_rate": 0.01,
        "patience": 50,
        "convergence_threshold": 0.0001
      }
    }
  }
}