{
  "aggregate_metrics": {
    "train_r": 0.11989877115907766,
    "train_p": 8.624129626892462e-12,
    "val_r": 0.03167337870997225,
    "val_p": 0.5502787458501001
  },
  "per_fold_stats": {
    "train_r_mean": 0.39984438152613216,
    "train_r_std": 0.14591528928086744,
    "val_r_mean": 0.348391256903991,
    "val_r_std": 0.24639741274160554
  },
  "average_coefficients": {
    "effective_rank": 36.58692932128906,
    "effective_rank_mergeability_score": 49.86984634399414,
    "stable_rank": -47.9909782409668,
    "spectral_gap": -1.8941634893417358,
    "singular_value_ratio": 2.690798282623291,
    "layerwise_effective_rank": 39.98095703125,
    "layerwise_effective_rank_mergeability_score": 33.17683029174805,
    "task_vector_cosine_similarity": 62.764320373535156,
    "task_vector_l2_distance": -156.59698486328125,
    "task_vector_dot_product": 78.24459838867188,
    "weight_space_angle": -75.9563217163086,
    "task_vector_magnitude_ratio": 70.54661560058594,
    "activation_l2_distance": 48.70585632324219,
    "activation_cosine_similarity": 38.83490753173828,
    "activation_magnitude_ratio": -3.5970263481140137,
    "activation_dot_product": 62.0295295715332,
    "encoder_gradient_cosine_similarity": 70.27272033691406,
    "encoder_gradient_l2_distance": -76.24400329589844,
    "encoder_gradient_dot_product": 14.345242500305176,
    "input_gradient_cosine_similarity": 28.78887939453125,
    "input_gradient_l2_distance": -140.75328063964844,
    "input_gradient_dot_product": -132.80809020996094
  },
  "coefficient_std": {
    "effective_rank": 128.8020782470703,
    "effective_rank_mergeability_score": 111.16791534423828,
    "stable_rank": 220.61192321777344,
    "spectral_gap": 111.37564086914062,
    "singular_value_ratio": 55.24403762817383,
    "layerwise_effective_rank": 160.09373474121094,
    "layerwise_effective_rank_mergeability_score": 125.38443756103516,
    "task_vector_cosine_similarity": 152.69479370117188,
    "task_vector_l2_distance": 522.4150390625,
    "task_vector_dot_product": 235.315185546875,
    "weight_space_angle": 235.9313507080078,
    "task_vector_magnitude_ratio": 311.0113220214844,
    "activation_l2_distance": 356.7044982910156,
    "activation_cosine_similarity": 115.6213607788086,
    "activation_magnitude_ratio": 37.12839126586914,
    "activation_dot_product": 116.90392303466797,
    "encoder_gradient_cosine_similarity": 254.7305145263672,
    "encoder_gradient_l2_distance": 127.1515121459961,
    "encoder_gradient_dot_product": 198.50059509277344,
    "input_gradient_cosine_similarity": 73.70551300048828,
    "input_gradient_l2_distance": 425.0874328613281,
    "input_gradient_dot_product": 394.3180236816406
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4438611153698801,
      "val_r": 0.42726140131801427,
      "n_iterations": 664,
      "coefficients": {
        "effective_rank": 11.522387504577637,
        "effective_rank_mergeability_score": 1.877713680267334,
        "stable_rank": -63.525394439697266,
        "spectral_gap": 20.77401351928711,
        "singular_value_ratio": 53.676822662353516,
        "layerwise_effective_rank": 40.02324295043945,
        "layerwise_effective_rank_mergeability_score": -5.998660564422607,
        "task_vector_cosine_similarity": 45.03112030029297,
        "task_vector_l2_distance": -8.10644245147705,
        "task_vector_dot_product": -14.899109840393066,
        "weight_space_angle": -19.235204696655273,
        "task_vector_magnitude_ratio": -38.80952072143555,
        "activation_l2_distance": 9.549771308898926,
        "activation_cosine_similarity": 42.58867263793945,
        "activation_magnitude_ratio": 0.2462863028049469,
        "activation_dot_product": 31.067115783691406,
        "encoder_gradient_cosine_similarity": 31.91367530822754,
        "encoder_gradient_l2_distance": -14.720356941223145,
        "encoder_gradient_dot_product": 21.651647567749023,
        "input_gradient_cosine_similarity": 15.257891654968262,
        "input_gradient_l2_distance": -89.0084457397461,
        "input_gradient_dot_product": -69.87953186035156
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.46893534122299874,
      "val_r": 0.2943846439895879,
      "n_iterations": 929,
      "coefficients": {
        "effective_rank": 94.54259490966797,
        "effective_rank_mergeability_score": 93.60623168945312,
        "stable_rank": -30.248332977294922,
        "spectral_gap": 8.985761642456055,
        "singular_value_ratio": -59.70964813232422,
        "layerwise_effective_rank": -5.116936683654785,
        "layerwise_effective_rank_mergeability_score": -57.65451431274414,
        "task_vector_cosine_similarity": 22.18362045288086,
        "task_vector_l2_distance": -47.33681869506836,
        "task_vector_dot_product": 77.1306381225586,
        "weight_space_angle": 45.05107879638672,
        "task_vector_magnitude_ratio": 31.2720890045166,
        "activation_l2_distance": -13.134604454040527,
        "activation_cosine_similarity": 60.89194869995117,
        "activation_magnitude_ratio": -44.00535583496094,
        "activation_dot_product": -30.856502532958984,
        "encoder_gradient_cosine_similarity": 0.6652258038520813,
        "encoder_gradient_l2_distance": -42.33258819580078,
        "encoder_gradient_dot_product": 49.2602653503418,
        "input_gradient_cosine_similarity": -43.450740814208984,
        "input_gradient_l2_distance": -98.39612579345703,
        "input_gradient_dot_product": -10.348896980285645
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3465829905602539,
      "val_r": 0.41241579402927947,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 570.3150024414062,
        "effective_rank_mergeability_score": 419.3130798339844,
        "stable_rank": -971.017822265625,
        "spectral_gap": 351.4214172363281,
        "singular_value_ratio": 31.529081344604492,
        "layerwise_effective_rank": 712.2073974609375,
        "layerwise_effective_rank_mergeability_score": 521.8646850585938,
        "task_vector_cosine_similarity": 706.1134643554688,
        "task_vector_l2_distance": -2373.045166015625,
        "task_vector_dot_product": 1091.702392578125,
        "weight_space_angle": -1080.5303955078125,
        "task_vector_magnitude_ratio": 1418.97607421875,
        "activation_l2_distance": 1571.2705078125,
        "activation_cosine_similarity": 523.877685546875,
        "activation_magnitude_ratio": 106.41976165771484,
        "activation_dot_product": 548.6272583007812,
        "encoder_gradient_cosine_similarity": 1165.515869140625,
        "encoder_gradient_l2_distance": -603.9276123046875,
        "encoder_gradient_dot_product": -775.4651489257812,
        "input_gradient_cosine_similarity": -147.00355529785156,
        "input_gradient_l2_distance": -1989.133544921875,
        "input_gradient_dot_product": -1798.0302734375
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.44167097641528974,
      "val_r": 0.3094787440449513,
      "n_iterations": 645,
      "coefficients": {
        "effective_rank": 13.110542297363281,
        "effective_rank_mergeability_score": 13.154526710510254,
        "stable_rank": -27.801420211791992,
        "spectral_gap": 42.79903030395508,
        "singular_value_ratio": 12.714822769165039,
        "layerwise_effective_rank": -26.213098526000977,
        "layerwise_effective_rank_mergeability_score": -42.61034393310547,
        "task_vector_cosine_similarity": 47.50958251953125,
        "task_vector_l2_distance": -26.41152572631836,
        "task_vector_dot_product": 3.464379072189331,
        "weight_space_angle": -3.7230358123779297,
        "task_vector_magnitude_ratio": 16.94635581970215,
        "activation_l2_distance": 7.163827896118164,
        "activation_cosine_similarity": -5.784586429595947,
        "activation_magnitude_ratio": 11.066012382507324,
        "activation_dot_product": 59.96067428588867,
        "encoder_gradient_cosine_similarity": 14.070479393005371,
        "encoder_gradient_l2_distance": -65.07678985595703,
        "encoder_gradient_dot_product": 28.12376594543457,
        "input_gradient_cosine_similarity": 26.1127986907959,
        "input_gradient_l2_distance": -34.41925811767578,
        "input_gradient_dot_product": -63.15913772583008
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3171835310227603,
      "val_r": 0.40717349630863436,
      "n_iterations": 759,
      "coefficients": {
        "effective_rank": -20.001880645751953,
        "effective_rank_mergeability_score": 51.547420501708984,
        "stable_rank": 62.24293518066406,
        "spectral_gap": 27.11090850830078,
        "singular_value_ratio": -37.93608856201172,
        "layerwise_effective_rank": -20.20271873474121,
        "layerwise_effective_rank_mergeability_score": -8.312212944030762,
        "task_vector_cosine_similarity": 23.36859703063965,
        "task_vector_l2_distance": -19.544944763183594,
        "task_vector_dot_product": 32.74728775024414,
        "weight_space_angle": -151.11373901367188,
        "task_vector_magnitude_ratio": 50.10537338256836,
        "activation_l2_distance": -67.9867935180664,
        "activation_cosine_similarity": -1.9953041076660156,
        "activation_magnitude_ratio": -17.032054901123047,
        "activation_dot_product": 73.05899810791016,
        "encoder_gradient_cosine_similarity": 36.95292282104492,
        "encoder_gradient_l2_distance": -54.261878967285156,
        "encoder_gradient_dot_product": 38.00862121582031,
        "input_gradient_cosine_similarity": 70.24324035644531,
        "input_gradient_l2_distance": -19.814626693725586,
        "input_gradient_dot_product": -46.18621063232422
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5005322545881656,
      "val_r": 0.6932907653856077,
      "n_iterations": 831,
      "coefficients": {
        "effective_rank": -12.21310806274414,
        "effective_rank_mergeability_score": 2.8198211193084717,
        "stable_rank": 0.5987972617149353,
        "spectral_gap": 14.875252723693848,
        "singular_value_ratio": 5.097167015075684,
        "layerwise_effective_rank": 2.0063822269439697,
        "layerwise_effective_rank_mergeability_score": -9.985251426696777,
        "task_vector_cosine_similarity": -0.8864018321037292,
        "task_vector_l2_distance": -22.070877075195312,
        "task_vector_dot_product": 25.19261932373047,
        "weight_space_angle": 7.838959217071533,
        "task_vector_magnitude_ratio": 2.3208072185516357,
        "activation_l2_distance": 2.247128486633301,
        "activation_cosine_similarity": 10.570873260498047,
        "activation_magnitude_ratio": 1.5092041492462158,
        "activation_dot_product": 3.9521420001983643,
        "encoder_gradient_cosine_similarity": 8.34498405456543,
        "encoder_gradient_l2_distance": -14.247291564941406,
        "encoder_gradient_dot_product": 15.963883399963379,
        "input_gradient_cosine_similarity": 6.135110378265381,
        "input_gradient_l2_distance": -27.012256622314453,
        "input_gradient_dot_product": -22.059688568115234
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.05569506230738391,
      "val_r": 0.09792043263638915,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 0.5903240442276001,
        "effective_rank_mergeability_score": -1.7493128776550293,
        "stable_rank": -0.7755810022354126,
        "spectral_gap": -0.8314911723136902,
        "singular_value_ratio": -1.5841809511184692,
        "layerwise_effective_rank": -2.016813039779663,
        "layerwise_effective_rank_mergeability_score": -2.247765302658081,
        "task_vector_cosine_similarity": 0.14108771085739136,
        "task_vector_l2_distance": -2.4977827072143555,
        "task_vector_dot_product": 0.18863685429096222,
        "weight_space_angle": 2.4207794666290283,
        "task_vector_magnitude_ratio": 0.6661447286605835,
        "activation_l2_distance": -7.948389053344727,
        "activation_cosine_similarity": 0.8555179238319397,
        "activation_magnitude_ratio": 1.7959336042404175,
        "activation_dot_product": 4.125377655029297,
        "encoder_gradient_cosine_similarity": -8.766348838806152,
        "encoder_gradient_l2_distance": 0.8416219353675842,
        "encoder_gradient_dot_product": 3.032325267791748,
        "input_gradient_cosine_similarity": 11.668514251708984,
        "input_gradient_l2_distance": 3.116330146789551,
        "input_gradient_dot_product": -0.04001419618725777
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.29051012177103125,
      "val_r": -0.5304582150887321,
      "n_iterations": 405,
      "coefficients": {
        "effective_rank": 76.83485412597656,
        "effective_rank_mergeability_score": -31.386690139770508,
        "stable_rank": -86.94820404052734,
        "spectral_gap": -58.95900344848633,
        "singular_value_ratio": -16.149564743041992,
        "layerwise_effective_rank": -39.816444396972656,
        "layerwise_effective_rank_mergeability_score": 69.23486328125,
        "task_vector_cosine_similarity": -5.652651786804199,
        "task_vector_l2_distance": 31.35320281982422,
        "task_vector_dot_product": 38.92640686035156,
        "weight_space_angle": -145.8230743408203,
        "task_vector_magnitude_ratio": -2.921239137649536,
        "activation_l2_distance": -51.45842742919922,
        "activation_cosine_similarity": 81.33026885986328,
        "activation_magnitude_ratio": 10.755301475524902,
        "activation_dot_product": 34.07033920288086,
        "encoder_gradient_cosine_similarity": 105.10743713378906,
        "encoder_gradient_l2_distance": -172.917724609375,
        "encoder_gradient_dot_product": 50.466217041015625,
        "input_gradient_cosine_similarity": 6.982125282287598,
        "input_gradient_l2_distance": -0.9318314790725708,
        "input_gradient_dot_product": 108.90028381347656
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.12742071581117764,
      "val_r": 0.45325255520416646,
      "n_iterations": 713,
      "coefficients": {
        "effective_rank": 53.96982955932617,
        "effective_rank_mergeability_score": 288.89404296875,
        "stable_rank": 196.3185577392578,
        "spectral_gap": -304.2197265625,
        "singular_value_ratio": 178.17308044433594,
        "layerwise_effective_rank": 124.07943725585938,
        "layerwise_effective_rank_mergeability_score": 177.45843505859375,
        "task_vector_cosine_similarity": 133.8064727783203,
        "task_vector_l2_distance": -539.8726806640625,
        "task_vector_dot_product": 111.38871765136719,
        "weight_space_angle": -3.110382556915283,
        "task_vector_magnitude_ratio": -17.504573822021484,
        "activation_l2_distance": -323.7209167480469,
        "activation_cosine_similarity": -46.603492736816406,
        "activation_magnitude_ratio": -56.564361572265625,
        "activation_dot_product": 102.45729064941406,
        "encoder_gradient_cosine_similarity": -139.01345825195312,
        "encoder_gradient_l2_distance": -29.908493041992188,
        "encoder_gradient_dot_product": 391.57464599609375,
        "input_gradient_cosine_similarity": 220.6424560546875,
        "input_gradient_l2_distance": -83.12076568603516,
        "input_gradient_dot_product": -434.1262512207031
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.2256165951237116,
      "val_r": 0.23400230368873354,
      "n_iterations": 819,
      "coefficients": {
        "effective_rank": 43.74525451660156,
        "effective_rank_mergeability_score": 126.18656921386719,
        "stable_rank": -103.92466735839844,
        "spectral_gap": -141.79595947265625,
        "singular_value_ratio": 90.884033203125,
        "layerwise_effective_rank": -82.99783325195312,
        "layerwise_effective_rank_mergeability_score": 85.21517181396484,
        "task_vector_cosine_similarity": -17.33927345275879,
        "task_vector_l2_distance": 91.95073699951172,
        "task_vector_dot_product": -53.23705291748047,
        "weight_space_angle": -78.48451232910156,
        "task_vector_magnitude_ratio": 26.835529327392578,
        "activation_l2_distance": -89.86837768554688,
        "activation_cosine_similarity": 26.795068740844727,
        "activation_magnitude_ratio": -89.08637237548828,
        "activation_dot_product": 87.09565734863281,
        "encoder_gradient_cosine_similarity": 47.85027313232422,
        "encoder_gradient_l2_distance": -77.07657623291016,
        "encoder_gradient_dot_product": 75.46017456054688,
        "input_gradient_cosine_similarity": 195.6053009033203,
        "input_gradient_l2_distance": -91.89893341064453,
        "input_gradient_dot_product": -70.91619873046875
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4989752766026555,
      "val_r": 0.22233011270769393,
      "n_iterations": 844,
      "coefficients": {
        "effective_rank": 0.3194844722747803,
        "effective_rank_mergeability_score": 13.568696975708008,
        "stable_rank": 9.754338264465332,
        "spectral_gap": 7.487887859344482,
        "singular_value_ratio": 3.9786665439605713,
        "layerwise_effective_rank": 4.452559947967529,
        "layerwise_effective_rank_mergeability_score": -2.657721757888794,
        "task_vector_cosine_similarity": 0.4392014443874359,
        "task_vector_l2_distance": -19.388851165771484,
        "task_vector_dot_product": 21.149328231811523,
        "weight_space_angle": 8.612858772277832,
        "task_vector_magnitude_ratio": -11.074357032775879,
        "activation_l2_distance": -7.888173580169678,
        "activation_cosine_similarity": 16.06208038330078,
        "activation_magnitude_ratio": -0.053869038820266724,
        "activation_dot_product": 0.4520449936389923,
        "encoder_gradient_cosine_similarity": 1.770403265953064,
        "encoder_gradient_l2_distance": -31.82434844970703,
        "encoder_gradient_dot_product": 15.217584609985352,
        "input_gradient_cosine_similarity": 13.765948295593262,
        "input_gradient_l2_distance": -21.592084884643555,
        "input_gradient_dot_product": -21.553438186645508
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.48303612786295147,
      "val_r": 0.39284292730195225,
      "n_iterations": 643,
      "coefficients": {
        "effective_rank": -47.423702239990234,
        "effective_rank_mergeability_score": -4.977130889892578,
        "stable_rank": 35.52070617675781,
        "spectral_gap": 21.407268524169922,
        "singular_value_ratio": -23.760244369506836,
        "layerwise_effective_rank": 29.823341369628906,
        "layerwise_effective_rank_mergeability_score": 3.999809741973877,
        "task_vector_cosine_similarity": -2.398223638534546,
        "task_vector_l2_distance": -28.68212890625,
        "task_vector_dot_product": 36.13691329956055,
        "weight_space_angle": -8.62051773071289,
        "task_vector_magnitude_ratio": 13.484651565551758,
        "activation_l2_distance": 8.134636878967285,
        "activation_cosine_similarity": 18.841625213623047,
        "activation_magnitude_ratio": -0.43072977662086487,
        "activation_dot_product": 14.68933391571045,
        "encoder_gradient_cosine_similarity": 15.547368049621582,
        "encoder_gradient_l2_distance": -43.329959869384766,
        "encoder_gradient_dot_product": 25.550201416015625,
        "input_gradient_cosine_similarity": 17.76214599609375,
        "input_gradient_l2_distance": -36.842960357666016,
        "input_gradient_dot_product": -43.434730529785156
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.46831402439110137,
      "val_r": 0.30211218604648254,
      "n_iterations": 794,
      "coefficients": {
        "effective_rank": -1.469751000404358,
        "effective_rank_mergeability_score": 18.181066513061523,
        "stable_rank": 21.50086212158203,
        "spectral_gap": 15.301765441894531,
        "singular_value_ratio": -7.238900661468506,
        "layerwise_effective_rank": -3.047292470932007,
        "layerwise_effective_rank_mergeability_score": -12.989472389221191,
        "task_vector_cosine_similarity": 18.031442642211914,
        "task_vector_l2_distance": -6.340893268585205,
        "task_vector_dot_product": -7.105930805206299,
        "weight_space_angle": -26.25352668762207,
        "task_vector_magnitude_ratio": 7.712460517883301,
        "activation_l2_distance": 2.497655153274536,
        "activation_cosine_similarity": 2.7601020336151123,
        "activation_magnitude_ratio": 2.800525426864624,
        "activation_dot_product": 15.073871612548828,
        "encoder_gradient_cosine_similarity": 11.942789077758789,
        "encoder_gradient_l2_distance": -20.21106719970703,
        "encoder_gradient_dot_product": 17.383317947387695,
        "input_gradient_cosine_similarity": 6.923612117767334,
        "input_gradient_l2_distance": -20.778987884521484,
        "input_gradient_dot_product": -33.675575256347656
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.49655281357208,
      "val_r": 0.5462681643631968,
      "n_iterations": 702,
      "coefficients": {
        "effective_rank": 8.36268424987793,
        "effective_rank_mergeability_score": 16.441072463989258,
        "stable_rank": -6.453282356262207,
        "spectral_gap": 0.794687032699585,
        "singular_value_ratio": -10.014398574829102,
        "layerwise_effective_rank": 28.433942794799805,
        "layerwise_effective_rank_mergeability_score": 9.445757865905762,
        "task_vector_cosine_similarity": 18.17560386657715,
        "task_vector_l2_distance": -23.91951560974121,
        "task_vector_dot_product": 11.076075553894043,
        "weight_space_angle": 3.378910779953003,
        "task_vector_magnitude_ratio": -3.032137393951416,
        "activation_l2_distance": -12.439441680908203,
        "activation_cosine_similarity": -4.897181510925293,
        "activation_magnitude_ratio": 3.3624677658081055,
        "activation_dot_product": 17.63648796081543,
        "encoder_gradient_cosine_similarity": 6.267938137054443,
        "encoder_gradient_l2_distance": -47.52074432373047,
        "encoder_gradient_dot_product": 33.74204635620117,
        "input_gradient_cosine_similarity": 5.900745868682861,
        "input_gradient_l2_distance": -25.878734588623047,
        "input_gradient_dot_product": -27.865123748779297
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3977930815768109,
      "val_r": 0.5751242235768522,
      "n_iterations": 711,
      "coefficients": {
        "effective_rank": 1.6542221307754517,
        "effective_rank_mergeability_score": 19.363590240478516,
        "stable_rank": -11.617297172546387,
        "spectral_gap": 30.42929458618164,
        "singular_value_ratio": 5.558468818664551,
        "layerwise_effective_rank": 37.40480422973633,
        "layerwise_effective_rank_mergeability_score": -49.939178466796875,
        "task_vector_cosine_similarity": 65.03766632080078,
        "task_vector_l2_distance": -30.978296279907227,
        "task_vector_dot_product": 13.720391273498535,
        "weight_space_angle": -39.93062210083008,
        "task_vector_magnitude_ratio": -56.80855178833008,
        "activation_l2_distance": 3.633378505706787,
        "activation_cosine_similarity": 3.7756054401397705,
        "activation_magnitude_ratio": -9.216941833496094,
        "activation_dot_product": 61.49060821533203,
        "encoder_gradient_cosine_similarity": 27.983619689941406,
        "encoder_gradient_l2_distance": -64.75077819824219,
        "encoder_gradient_dot_product": 62.3950080871582,
        "input_gradient_cosine_similarity": 16.403438568115234,
        "input_gradient_l2_distance": -24.508386611938477,
        "input_gradient_dot_product": -60.10230255126953
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.49952778189992814,
      "val_r": 0.5604858615723668,
      "n_iterations": 639,
      "coefficients": {
        "effective_rank": -46.10905838012695,
        "effective_rank_mergeability_score": 38.749244689941406,
        "stable_rank": 24.186315536499023,
        "spectral_gap": -2.7594470977783203,
        "singular_value_ratio": -16.185941696166992,
        "layerwise_effective_rank": 57.761295318603516,
        "layerwise_effective_rank_mergeability_score": -32.9878044128418,
        "task_vector_cosine_similarity": 51.082969665527344,
        "task_vector_l2_distance": -72.98905944824219,
        "task_vector_dot_product": 42.72322082519531,
        "weight_space_angle": 21.795551300048828,
        "task_vector_magnitude_ratio": -34.51123809814453,
        "activation_l2_distance": -6.580506324768066,
        "activation_cosine_similarity": -5.934782981872559,
        "activation_magnitude_ratio": -9.285561561584473,
        "activation_dot_product": 42.252418518066406,
        "encoder_gradient_cosine_similarity": 7.324460506439209,
        "encoder_gradient_l2_distance": -116.82479858398438,
        "encoder_gradient_dot_product": 26.511388778686523,
        "input_gradient_cosine_similarity": 31.1885986328125,
        "input_gradient_l2_distance": -31.5720272064209,
        "input_gradient_dot_product": 33.162391662597656
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3548142707957168,
      "val_r": 0.35332169888066045,
      "n_iterations": 572,
      "coefficients": {
        "effective_rank": -59.94084167480469,
        "effective_rank_mergeability_score": -10.572295188903809,
        "stable_rank": 37.0619010925293,
        "spectral_gap": -13.77512264251709,
        "singular_value_ratio": -90.91879272460938,
        "layerwise_effective_rank": 0.11634908616542816,
        "layerwise_effective_rank_mergeability_score": -53.54697799682617,
        "task_vector_cosine_similarity": 102.2153549194336,
        "task_vector_l2_distance": 11.870901107788086,
        "task_vector_dot_product": 51.81676483154297,
        "weight_space_angle": -30.182939529418945,
        "task_vector_magnitude_ratio": 11.320893287658691,
        "activation_l2_distance": -46.2264518737793,
        "activation_cosine_similarity": 35.54795837402344,
        "activation_magnitude_ratio": -20.0711612701416,
        "activation_dot_product": 22.047863006591797,
        "encoder_gradient_cosine_similarity": 26.890605926513672,
        "encoder_gradient_l2_distance": -21.060222625732422,
        "encoder_gradient_dot_product": 84.59445190429688,
        "input_gradient_cosine_similarity": 36.608909606933594,
        "input_gradient_l2_distance": -58.75551223754883,
        "input_gradient_dot_product": -14.04434871673584
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3276541995756133,
      "val_r": 0.25268024178001336,
      "n_iterations": 487,
      "coefficients": {
        "effective_rank": -29.5704345703125,
        "effective_rank_mergeability_score": -75.5811767578125,
        "stable_rank": 27.503028869628906,
        "spectral_gap": -56.50215148925781,
        "singular_value_ratio": -31.55864715576172,
        "layerwise_effective_rank": 2.063833475112915,
        "layerwise_effective_rank_mergeability_score": 90.74849700927734,
        "task_vector_cosine_similarity": -27.580350875854492,
        "task_vector_l2_distance": -47.96099090576172,
        "task_vector_dot_product": 79.71768188476562,
        "weight_space_angle": -55.57450485229492,
        "task_vector_magnitude_ratio": -65.78694915771484,
        "activation_l2_distance": -15.021506309509277,
        "activation_cosine_similarity": -53.7012825012207,
        "activation_magnitude_ratio": 46.547523498535156,
        "activation_dot_product": 104.15943908691406,
        "encoder_gradient_cosine_similarity": 19.851804733276367,
        "encoder_gradient_l2_distance": -7.1219282150268555,
        "encoder_gradient_dot_product": 94.74552917480469,
        "input_gradient_cosine_similarity": 72.24774932861328,
        "input_gradient_l2_distance": -41.851253509521484,
        "input_gradient_dot_product": -28.776994705200195
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7043287693935265,
      "val_r": 0.5753823871850702,
      "n_iterations": 652,
      "coefficients": {
        "effective_rank": 60.95164489746094,
        "effective_rank_mergeability_score": -5.786910057067871,
        "stable_rank": -73.265380859375,
        "spectral_gap": -9.36495304107666,
        "singular_value_ratio": -38.982051849365234,
        "layerwise_effective_rank": -65.03795623779297,
        "layerwise_effective_rank_mergeability_score": -15.315803527832031,
        "task_vector_cosine_similarity": 63.94851303100586,
        "task_vector_l2_distance": 33.69394302368164,
        "task_vector_dot_product": -13.703190803527832,
        "weight_space_angle": 37.85324478149414,
        "task_vector_magnitude_ratio": 70.4179916381836,
        "activation_l2_distance": 8.374897003173828,
        "activation_cosine_similarity": 51.541038513183594,
        "activation_magnitude_ratio": -11.694485664367676,
        "activation_dot_product": 36.80942153930664,
        "encoder_gradient_cosine_similarity": 12.205265998840332,
        "encoder_gradient_l2_distance": -50.55784606933594,
        "encoder_gradient_dot_product": 0.4357925057411194,
        "input_gradient_cosine_similarity": -4.584902286529541,
        "input_gradient_l2_distance": -84.11106872558594,
        "input_gradient_dot_product": -2.829526424407959
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5478825806596075,
      "val_r": 0.3885554131488997,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 12.548609733581543,
        "effective_rank_mergeability_score": 23.747203826904297,
        "stable_rank": 1.0704610347747803,
        "spectral_gap": 8.937307357788086,
        "singular_value_ratio": 6.242284774780273,
        "layerwise_effective_rank": 5.695487022399902,
        "layerwise_effective_rank_mergeability_score": -0.18472668528556824,
        "task_vector_cosine_similarity": 12.05854606628418,
        "task_vector_l2_distance": -31.662307739257812,
        "task_vector_dot_product": 16.755937576293945,
        "weight_space_angle": -3.495429039001465,
        "task_vector_magnitude_ratio": -8.67730712890625,
        "activation_l2_distance": 3.5189006328582764,
        "activation_cosine_similarity": 20.176368713378906,
        "activation_magnitude_ratio": 0.9973644018173218,
        "activation_dot_product": 12.42073917388916,
        "encoder_gradient_cosine_similarity": 13.02911376953125,
        "encoder_gradient_l2_distance": -48.0506477355957,
        "encoder_gradient_dot_product": 28.25307273864746,
        "input_gradient_cosine_similarity": 17.36819076538086,
        "input_gradient_l2_distance": -38.55495071411133,
        "input_gradient_dot_product": -51.19572830200195
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}