{
  "aggregate_metrics": {
    "train_r": 0.1877017706451737,
    "train_p": 6.191276262081849e-27,
    "val_r": 0.20103644198545956,
    "val_p": 0.000128322958206954
  },
  "per_fold_stats": {
    "train_r_mean": 0.5736383681723893,
    "train_r_std": 0.2504042175751728,
    "val_r_mean": 0.42438359588747876,
    "val_r_std": 0.30383915831625213
  },
  "average_coefficients": {
    "effective_rank": -3.758315324783325,
    "effective_rank_mergeability_score": 10.188277244567871,
    "stable_rank": 12.04945182800293,
    "spectral_gap": -0.4523714482784271,
    "singular_value_ratio": -7.618811130523682,
    "layerwise_effective_rank": 0.8052960634231567,
    "layerwise_effective_rank_mergeability_score": -3.4298012256622314,
    "task_vector_cosine_similarity": 2.7382891178131104,
    "task_vector_l2_distance": 8.70966911315918,
    "task_vector_dot_product": 6.554912567138672,
    "weight_space_angle": -5.9695234298706055,
    "task_vector_magnitude_ratio": -3.175868511199951,
    "activation_l2_distance": -18.18015480041504,
    "activation_cosine_similarity": 18.22173500061035,
    "activation_magnitude_ratio": -8.906698226928711,
    "activation_dot_product": 21.860380172729492,
    "encoder_gradient_cosine_similarity": 16.869836807250977,
    "encoder_gradient_l2_distance": -34.13471221923828,
    "encoder_gradient_dot_product": 13.468910217285156,
    "input_gradient_cosine_similarity": 16.162302017211914,
    "input_gradient_l2_distance": -27.80255699157715,
    "input_gradient_dot_product": -13.201458930969238
  },
  "coefficient_std": {
    "effective_rank": 28.364273071289062,
    "effective_rank_mergeability_score": 25.32481575012207,
    "stable_rank": 36.753089904785156,
    "spectral_gap": 31.437013626098633,
    "singular_value_ratio": 33.98372268676758,
    "layerwise_effective_rank": 26.955015182495117,
    "layerwise_effective_rank_mergeability_score": 25.97682762145996,
    "task_vector_cosine_similarity": 24.003971099853516,
    "task_vector_l2_distance": 35.304710388183594,
    "task_vector_dot_product": 18.406095504760742,
    "weight_space_angle": 33.33672332763672,
    "task_vector_magnitude_ratio": 44.85594940185547,
    "activation_l2_distance": 49.084022521972656,
    "activation_cosine_similarity": 36.91358184814453,
    "activation_magnitude_ratio": 15.024666786193848,
    "activation_dot_product": 28.548110961914062,
    "encoder_gradient_cosine_similarity": 26.470966339111328,
    "encoder_gradient_l2_distance": 46.92348098754883,
    "encoder_gradient_dot_product": 28.15730857849121,
    "input_gradient_cosine_similarity": 26.776174545288086,
    "input_gradient_l2_distance": 33.43470764160156,
    "input_gradient_dot_product": 24.107622146606445
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": -0.04570349493905039,
      "val_r": -0.2655955553301436,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": -6.949795722961426,
        "effective_rank_mergeability_score": -1.0722306966781616,
        "stable_rank": -0.3663243353366852,
        "spectral_gap": 7.193935394287109,
        "singular_value_ratio": 2.2558093070983887,
        "layerwise_effective_rank": 11.354029655456543,
        "layerwise_effective_rank_mergeability_score": -4.5637006759643555,
        "task_vector_cosine_similarity": 5.827106475830078,
        "task_vector_l2_distance": 1.9217569828033447,
        "task_vector_dot_product": -3.097933530807495,
        "weight_space_angle": -5.164436340332031,
        "task_vector_magnitude_ratio": 2.2463619709014893,
        "activation_l2_distance": -7.017400741577148,
        "activation_cosine_similarity": -2.840245246887207,
        "activation_magnitude_ratio": -3.1762888431549072,
        "activation_dot_product": 2.335317611694336,
        "encoder_gradient_cosine_similarity": -7.037820816040039,
        "encoder_gradient_l2_distance": 2.635085105895996,
        "encoder_gradient_dot_product": 2.0204784870147705,
        "input_gradient_cosine_similarity": -3.161983013153076,
        "input_gradient_l2_distance": 2.919093370437622,
        "input_gradient_dot_product": 4.744661331176758
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5665840230496599,
      "val_r": 0.5365080894438957,
      "n_iterations": 567,
      "coefficients": {
        "effective_rank": -12.735401153564453,
        "effective_rank_mergeability_score": 15.218719482421875,
        "stable_rank": 59.3719482421875,
        "spectral_gap": -28.869367599487305,
        "singular_value_ratio": -8.715813636779785,
        "layerwise_effective_rank": -65.8265609741211,
        "layerwise_effective_rank_mergeability_score": -26.35480499267578,
        "task_vector_cosine_similarity": 13.026275634765625,
        "task_vector_l2_distance": 37.4151496887207,
        "task_vector_dot_product": 11.764007568359375,
        "weight_space_angle": -32.50175476074219,
        "task_vector_magnitude_ratio": -47.713401794433594,
        "activation_l2_distance": 23.41571807861328,
        "activation_cosine_similarity": 67.39183044433594,
        "activation_magnitude_ratio": -10.120556831359863,
        "activation_dot_product": 84.1650619506836,
        "encoder_gradient_cosine_similarity": 13.738377571105957,
        "encoder_gradient_l2_distance": -50.75181198120117,
        "encoder_gradient_dot_product": 8.385309219360352,
        "input_gradient_cosine_similarity": 43.25615692138672,
        "input_gradient_l2_distance": -59.33909225463867,
        "input_gradient_dot_product": -33.222633361816406
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7413273336041792,
      "val_r": 0.7877816588842264,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -0.3649028539657593,
        "effective_rank_mergeability_score": -0.22556251287460327,
        "stable_rank": 0.2013067901134491,
        "spectral_gap": 0.03234105929732323,
        "singular_value_ratio": -0.08523250371217728,
        "layerwise_effective_rank": 0.08781342208385468,
        "layerwise_effective_rank_mergeability_score": 0.37714946269989014,
        "task_vector_cosine_similarity": 0.35829538106918335,
        "task_vector_l2_distance": -0.3388618528842926,
        "task_vector_dot_product": 0.27355778217315674,
        "weight_space_angle": 0.39137348532676697,
        "task_vector_magnitude_ratio": 0.11453243345022202,
        "activation_l2_distance": 0.7842167615890503,
        "activation_cosine_similarity": 1.2099906206130981,
        "activation_magnitude_ratio": -0.06738349795341492,
        "activation_dot_product": -0.045404329895973206,
        "encoder_gradient_cosine_similarity": 0.07473544031381607,
        "encoder_gradient_l2_distance": -1.006628155708313,
        "encoder_gradient_dot_product": -0.0015703901881352067,
        "input_gradient_cosine_similarity": 0.10164427757263184,
        "input_gradient_l2_distance": -0.6312002539634705,
        "input_gradient_dot_product": -0.24112094938755035
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7075922234420882,
      "val_r": 0.7160018846534751,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -0.23121590912342072,
        "effective_rank_mergeability_score": 2.474454879760742,
        "stable_rank": -3.4062139987945557,
        "spectral_gap": -0.42015790939331055,
        "singular_value_ratio": -2.3911094665527344,
        "layerwise_effective_rank": 5.2779693603515625,
        "layerwise_effective_rank_mergeability_score": 4.700900077819824,
        "task_vector_cosine_similarity": 2.631774425506592,
        "task_vector_l2_distance": -4.677471160888672,
        "task_vector_dot_product": -0.14680632948875427,
        "weight_space_angle": 1.092189908027649,
        "task_vector_magnitude_ratio": 5.185915946960449,
        "activation_l2_distance": 0.3761330544948578,
        "activation_cosine_similarity": 1.6574604511260986,
        "activation_magnitude_ratio": -0.8073009848594666,
        "activation_dot_product": 8.348931312561035,
        "encoder_gradient_cosine_similarity": 2.1305737495422363,
        "encoder_gradient_l2_distance": -11.978658676147461,
        "encoder_gradient_dot_product": 1.0248342752456665,
        "input_gradient_cosine_similarity": 1.7160557508468628,
        "input_gradient_l2_distance": -8.407828330993652,
        "input_gradient_dot_product": -3.1515562534332275
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.10022738710244423,
      "val_r": -0.07701753833697958,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": -0.9401532411575317,
        "effective_rank_mergeability_score": -1.3012603521347046,
        "stable_rank": -0.15514208376407623,
        "spectral_gap": 1.2369917631149292,
        "singular_value_ratio": -0.6772366166114807,
        "layerwise_effective_rank": -0.4603213667869568,
        "layerwise_effective_rank_mergeability_score": -0.13396714627742767,
        "task_vector_cosine_similarity": -0.5090071558952332,
        "task_vector_l2_distance": 0.16105154156684875,
        "task_vector_dot_product": 0.8895413279533386,
        "weight_space_angle": -0.09055211395025253,
        "task_vector_magnitude_ratio": -0.35916754603385925,
        "activation_l2_distance": -0.8851715922355652,
        "activation_cosine_similarity": 1.3389396667480469,
        "activation_magnitude_ratio": -1.0900251865386963,
        "activation_dot_product": 0.8791757822036743,
        "encoder_gradient_cosine_similarity": 0.7938652038574219,
        "encoder_gradient_l2_distance": 0.4734978675842285,
        "encoder_gradient_dot_product": -0.2634439468383789,
        "input_gradient_cosine_similarity": 1.5306851863861084,
        "input_gradient_l2_distance": 0.8481109142303467,
        "input_gradient_dot_product": -0.2755057215690613
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7522254105869997,
      "val_r": 0.6821063637247817,
      "n_iterations": 648,
      "coefficients": {
        "effective_rank": 1.575722575187683,
        "effective_rank_mergeability_score": 1.9396976232528687,
        "stable_rank": -1.1992484331130981,
        "spectral_gap": 1.5045520067214966,
        "singular_value_ratio": 0.9300130605697632,
        "layerwise_effective_rank": 2.0287182331085205,
        "layerwise_effective_rank_mergeability_score": 1.7616239786148071,
        "task_vector_cosine_similarity": -1.458923578262329,
        "task_vector_l2_distance": -1.7877644300460815,
        "task_vector_dot_product": -0.0005375179462134838,
        "weight_space_angle": -2.1197142601013184,
        "task_vector_magnitude_ratio": 0.8031673431396484,
        "activation_l2_distance": 0.5405551195144653,
        "activation_cosine_similarity": 2.817683458328247,
        "activation_magnitude_ratio": -0.5600684285163879,
        "activation_dot_product": 1.13280189037323,
        "encoder_gradient_cosine_similarity": 1.1609570980072021,
        "encoder_gradient_l2_distance": -5.058168411254883,
        "encoder_gradient_dot_product": 0.1939309686422348,
        "input_gradient_cosine_similarity": 0.32158660888671875,
        "input_gradient_l2_distance": -1.8817228078842163,
        "input_gradient_dot_product": -1.6453171968460083
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.6945833569333495,
      "val_r": 0.44039274093916303,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 2.7429468631744385,
        "effective_rank_mergeability_score": 4.487942695617676,
        "stable_rank": 1.8231000900268555,
        "spectral_gap": -4.431467056274414,
        "singular_value_ratio": -12.218056678771973,
        "layerwise_effective_rank": -0.1968882828950882,
        "layerwise_effective_rank_mergeability_score": 9.729141235351562,
        "task_vector_cosine_similarity": 1.0256016254425049,
        "task_vector_l2_distance": -18.214839935302734,
        "task_vector_dot_product": 11.541658401489258,
        "weight_space_angle": 4.619645118713379,
        "task_vector_magnitude_ratio": 7.916584491729736,
        "activation_l2_distance": 7.922162055969238,
        "activation_cosine_similarity": 9.785309791564941,
        "activation_magnitude_ratio": 2.330739974975586,
        "activation_dot_product": 18.155248641967773,
        "encoder_gradient_cosine_similarity": 6.9235944747924805,
        "encoder_gradient_l2_distance": -23.18515968322754,
        "encoder_gradient_dot_product": 10.362251281738281,
        "input_gradient_cosine_similarity": 2.6389403343200684,
        "input_gradient_l2_distance": -22.903993606567383,
        "input_gradient_dot_product": -19.85575294494629
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6753603263933059,
      "val_r": 0.3166362502700752,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -4.504055500030518,
        "effective_rank_mergeability_score": 2.7466118335723877,
        "stable_rank": -0.3147001266479492,
        "spectral_gap": 1.2045644521713257,
        "singular_value_ratio": 8.103690147399902,
        "layerwise_effective_rank": 0.16506701707839966,
        "layerwise_effective_rank_mergeability_score": 0.32962408661842346,
        "task_vector_cosine_similarity": 3.1390833854675293,
        "task_vector_l2_distance": -9.991339683532715,
        "task_vector_dot_product": 3.884503126144409,
        "weight_space_angle": 0.1785837560892105,
        "task_vector_magnitude_ratio": -3.201083183288574,
        "activation_l2_distance": 0.9438455104827881,
        "activation_cosine_similarity": 6.2935967445373535,
        "activation_magnitude_ratio": -1.1573708057403564,
        "activation_dot_product": 8.038196563720703,
        "encoder_gradient_cosine_similarity": 3.9913787841796875,
        "encoder_gradient_l2_distance": -17.140262603759766,
        "encoder_gradient_dot_product": 1.5664867162704468,
        "input_gradient_cosine_similarity": 5.140308856964111,
        "input_gradient_l2_distance": -9.323247909545898,
        "input_gradient_dot_product": 0.9051271677017212
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5913383378101329,
      "val_r": 0.13267521279605204,
      "n_iterations": 597,
      "coefficients": {
        "effective_rank": -81.54327392578125,
        "effective_rank_mergeability_score": 8.344572067260742,
        "stable_rank": 142.29393005371094,
        "spectral_gap": 60.94699478149414,
        "singular_value_ratio": -111.27411651611328,
        "layerwise_effective_rank": 30.585689544677734,
        "layerwise_effective_rank_mergeability_score": 67.91785430908203,
        "task_vector_cosine_similarity": 1.5191971063613892,
        "task_vector_l2_distance": 52.79710388183594,
        "task_vector_dot_product": -42.286415100097656,
        "weight_space_angle": -119.47195434570312,
        "task_vector_magnitude_ratio": 114.42793273925781,
        "activation_l2_distance": -133.89114379882812,
        "activation_cosine_similarity": -32.87437057495117,
        "activation_magnitude_ratio": -27.159887313842773,
        "activation_dot_product": 34.72404098510742,
        "encoder_gradient_cosine_similarity": 58.23405075073242,
        "encoder_gradient_l2_distance": -86.10266876220703,
        "encoder_gradient_dot_product": 88.7999267578125,
        "input_gradient_cosine_similarity": 47.94587707519531,
        "input_gradient_l2_distance": -120.04664611816406,
        "input_gradient_dot_product": 47.11080551147461
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6976095816175445,
      "val_r": 0.6612809177523373,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -0.030795244500041008,
        "effective_rank_mergeability_score": -4.232767581939697,
        "stable_rank": 3.9849536418914795,
        "spectral_gap": 5.6027421951293945,
        "singular_value_ratio": 8.616925239562988,
        "layerwise_effective_rank": -1.860262155532837,
        "layerwise_effective_rank_mergeability_score": 9.56264877319336,
        "task_vector_cosine_similarity": 3.670053005218506,
        "task_vector_l2_distance": -3.8961966037750244,
        "task_vector_dot_product": 0.8722373843193054,
        "weight_space_angle": -0.20459435880184174,
        "task_vector_magnitude_ratio": -3.2421088218688965,
        "activation_l2_distance": 2.2164204120635986,
        "activation_cosine_similarity": 0.7599062323570251,
        "activation_magnitude_ratio": -0.795062780380249,
        "activation_dot_product": -1.9859087467193604,
        "encoder_gradient_cosine_similarity": 2.431565284729004,
        "encoder_gradient_l2_distance": -7.66160774230957,
        "encoder_gradient_dot_product": 2.865762233734131,
        "input_gradient_cosine_similarity": 1.0382747650146484,
        "input_gradient_l2_distance": -12.71165657043457,
        "input_gradient_dot_product": -4.0013203620910645
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5634000240488231,
      "val_r": 0.18843624410595536,
      "n_iterations": 595,
      "coefficients": {
        "effective_rank": 47.31863784790039,
        "effective_rank_mergeability_score": 76.16912841796875,
        "stable_rank": 68.15062713623047,
        "spectral_gap": -98.12654113769531,
        "singular_value_ratio": -85.1376953125,
        "layerwise_effective_rank": -19.52223777770996,
        "layerwise_effective_rank_mergeability_score": -71.71187591552734,
        "task_vector_cosine_similarity": 75.66146087646484,
        "task_vector_l2_distance": 72.3773193359375,
        "task_vector_dot_product": -0.5964272618293762,
        "weight_space_angle": 49.12101745605469,
        "task_vector_magnitude_ratio": -110.31140899658203,
        "activation_l2_distance": -156.07664489746094,
        "activation_cosine_similarity": 61.7389030456543,
        "activation_magnitude_ratio": -30.626718521118164,
        "activation_dot_product": 66.25082397460938,
        "encoder_gradient_cosine_similarity": 46.5970344543457,
        "encoder_gradient_l2_distance": -66.67843627929688,
        "encoder_gradient_dot_product": 101.19176483154297,
        "input_gradient_cosine_similarity": 109.85391998291016,
        "input_gradient_l2_distance": -76.24470520019531,
        "input_gradient_dot_product": -58.400550842285156
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.511798372788252,
      "val_r": 0.38668013176381283,
      "n_iterations": 825,
      "coefficients": {
        "effective_rank": 42.571998596191406,
        "effective_rank_mergeability_score": 82.29194641113281,
        "stable_rank": -20.95009422302246,
        "spectral_gap": -22.969633102416992,
        "singular_value_ratio": 2.5435657501220703,
        "layerwise_effective_rank": 83.7514419555664,
        "layerwise_effective_rank_mergeability_score": -43.73118209838867,
        "task_vector_cosine_similarity": -61.075496673583984,
        "task_vector_l2_distance": 122.17794799804688,
        "task_vector_dot_product": 56.89876937866211,
        "weight_space_angle": 6.170718669891357,
        "task_vector_magnitude_ratio": -99.17805480957031,
        "activation_l2_distance": -96.24658966064453,
        "activation_cosine_similarity": 148.08656311035156,
        "activation_magnitude_ratio": -52.848854064941406,
        "activation_dot_product": 1.3877410888671875,
        "encoder_gradient_cosine_similarity": 100.23208618164062,
        "encoder_gradient_l2_distance": -197.03726196289062,
        "encoder_gradient_dot_product": 6.9785943031311035,
        "input_gradient_cosine_similarity": 46.36387252807617,
        "input_gradient_l2_distance": -52.99732208251953,
        "input_gradient_dot_product": -51.42272186279297
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6690102945587899,
      "val_r": 0.6859282297554661,
      "n_iterations": 946,
      "coefficients": {
        "effective_rank": -72.79582214355469,
        "effective_rank_mergeability_score": -27.16938018798828,
        "stable_rank": 16.297893524169922,
        "spectral_gap": 67.76978302001953,
        "singular_value_ratio": 51.72367477416992,
        "layerwise_effective_rank": -36.8642578125,
        "layerwise_effective_rank_mergeability_score": -30.19085693359375,
        "task_vector_cosine_similarity": -22.196128845214844,
        "task_vector_l2_distance": -22.596548080444336,
        "task_vector_dot_product": 20.96973991394043,
        "weight_space_angle": 38.75796127319336,
        "task_vector_magnitude_ratio": 35.5713996887207,
        "activation_l2_distance": 11.644025802612305,
        "activation_cosine_similarity": 31.06305694580078,
        "activation_magnitude_ratio": -5.548069953918457,
        "activation_dot_product": 91.24530029296875,
        "encoder_gradient_cosine_similarity": 35.39712905883789,
        "encoder_gradient_l2_distance": -68.7265396118164,
        "encoder_gradient_dot_product": 3.9178781509399414,
        "input_gradient_cosine_similarity": 16.988983154296875,
        "input_gradient_l2_distance": -76.63126373291016,
        "input_gradient_dot_product": -57.62953567504883
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6137718421764532,
      "val_r": 0.7026975873426619,
      "n_iterations": 708,
      "coefficients": {
        "effective_rank": 3.6961402893066406,
        "effective_rank_mergeability_score": 33.45564270019531,
        "stable_rank": -15.029562950134277,
        "spectral_gap": -1.8778594732284546,
        "singular_value_ratio": -20.813060760498047,
        "layerwise_effective_rank": 6.8393425941467285,
        "layerwise_effective_rank_mergeability_score": -5.426224708557129,
        "task_vector_cosine_similarity": 34.584781646728516,
        "task_vector_l2_distance": 3.360539436340332,
        "task_vector_dot_product": 35.675174713134766,
        "weight_space_angle": -59.53836441040039,
        "task_vector_magnitude_ratio": 30.146320343017578,
        "activation_l2_distance": -43.17163848876953,
        "activation_cosine_similarity": 30.492406845092773,
        "activation_magnitude_ratio": -37.39933395385742,
        "activation_dot_product": 45.0956916809082,
        "encoder_gradient_cosine_similarity": 48.318939208984375,
        "encoder_gradient_l2_distance": -66.04785919189453,
        "encoder_gradient_dot_product": 30.89417266845703,
        "input_gradient_cosine_similarity": 24.642187118530273,
        "input_gradient_l2_distance": -49.0650749206543,
        "input_gradient_dot_product": -27.8346004486084
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": -0.03970473271585378,
      "val_r": -0.1511793277544313,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 0.830409049987793,
        "effective_rank_mergeability_score": -2.661609649658203,
        "stable_rank": 3.0075395107269287,
        "spectral_gap": -1.5491690635681152,
        "singular_value_ratio": 0.7800021171569824,
        "layerwise_effective_rank": 1.6299763917922974,
        "layerwise_effective_rank_mergeability_score": -0.9022207260131836,
        "task_vector_cosine_similarity": -1.2814470529556274,
        "task_vector_l2_distance": -2.004441499710083,
        "task_vector_dot_product": -0.4576821029186249,
        "weight_space_angle": -3.245635509490967,
        "task_vector_magnitude_ratio": 0.795712947845459,
        "activation_l2_distance": 0.30780407786369324,
        "activation_cosine_similarity": -0.05037865787744522,
        "activation_magnitude_ratio": -0.4225356876850128,
        "activation_dot_product": 1.6404343843460083,
        "encoder_gradient_cosine_similarity": 1.2621870040893555,
        "encoder_gradient_l2_distance": 0.5777586102485657,
        "encoder_gradient_dot_product": 1.7120712995529175,
        "input_gradient_cosine_similarity": -0.8866254091262817,
        "input_gradient_l2_distance": 1.7024327516555786,
        "input_gradient_dot_product": 0.20060384273529053
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6894583706806239,
      "val_r": 0.4858532638027599,
      "n_iterations": 986,
      "coefficients": {
        "effective_rank": -3.1518750190734863,
        "effective_rank_mergeability_score": 9.670104026794434,
        "stable_rank": -20.075687408447266,
        "spectral_gap": -11.33110237121582,
        "singular_value_ratio": -17.646406173706055,
        "layerwise_effective_rank": 13.213006973266602,
        "layerwise_effective_rank_mergeability_score": 4.452528476715088,
        "task_vector_cosine_similarity": -13.836134910583496,
        "task_vector_l2_distance": -26.892019271850586,
        "task_vector_dot_product": 22.05367088317871,
        "weight_space_angle": -4.032810211181641,
        "task_vector_magnitude_ratio": 21.28520393371582,
        "activation_l2_distance": 22.37901496887207,
        "activation_cosine_similarity": 11.697956085205078,
        "activation_magnitude_ratio": 1.0518873929977417,
        "activation_dot_product": 36.405296325683594,
        "encoder_gradient_cosine_similarity": 11.164202690124512,
        "encoder_gradient_l2_distance": -16.08236312866211,
        "encoder_gradient_dot_product": 3.695988416671753,
        "input_gradient_cosine_similarity": 10.16010570526123,
        "input_gradient_l2_distance": -28.882610321044922,
        "input_gradient_dot_product": -24.299467086791992
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7390691608469998,
      "val_r": 0.6752293526568118,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 0.3897587060928345,
        "effective_rank_mergeability_score": 0.29904016852378845,
        "stable_rank": -0.3840450644493103,
        "spectral_gap": -0.3466546833515167,
        "singular_value_ratio": 0.13420459628105164,
        "layerwise_effective_rank": -0.09884587675333023,
        "layerwise_effective_rank_mergeability_score": -0.03964102268218994,
        "task_vector_cosine_similarity": 0.3904103636741638,
        "task_vector_l2_distance": -0.4015405774116516,
        "task_vector_dot_product": 0.25419238209724426,
        "weight_space_angle": 0.29612788558006287,
        "task_vector_magnitude_ratio": -0.2870313227176666,
        "activation_l2_distance": 1.083980679512024,
        "activation_cosine_similarity": 1.4938150644302368,
        "activation_magnitude_ratio": -0.050917524844408035,
        "activation_dot_product": -0.11348061263561249,
        "encoder_gradient_cosine_similarity": 0.16159731149673462,
        "encoder_gradient_l2_distance": -0.9700100421905518,
        "encoder_gradient_dot_product": 0.04685400053858757,
        "input_gradient_cosine_similarity": 0.0983530655503273,
        "input_gradient_l2_distance": -0.6857722997665405,
        "input_gradient_dot_product": -0.2714727520942688
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6931023119062545,
      "val_r": 0.5529627667132346,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -2.3305320739746094,
        "effective_rank_mergeability_score": 3.3806779384613037,
        "stable_rank": 11.036053657531738,
        "spectral_gap": 0.1119564101099968,
        "singular_value_ratio": 1.8640007972717285,
        "layerwise_effective_rank": -2.532717227935791,
        "layerwise_effective_rank_mergeability_score": 12.932897567749023,
        "task_vector_cosine_similarity": 8.716341018676758,
        "task_vector_l2_distance": -7.15388298034668,
        "task_vector_dot_product": 1.9672504663467407,
        "weight_space_angle": 0.9765522480010986,
        "task_vector_magnitude_ratio": 0.723284900188446,
        "activation_l2_distance": -5.489625453948975,
        "activation_cosine_similarity": 5.9504618644714355,
        "activation_magnitude_ratio": -0.8027223944664001,
        "activation_dot_product": 8.984910011291504,
        "encoder_gradient_cosine_similarity": 5.575728416442871,
        "encoder_gradient_l2_distance": -7.123638153076172,
        "encoder_gradient_dot_product": 10.508809089660645,
        "input_gradient_cosine_similarity": 5.841558933258057,
        "input_gradient_l2_distance": -35.408382415771484,
        "input_gradient_dot_product": -16.730314254760742
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7731158680527156,
      "val_r": 0.3813973449483575,
      "n_iterations": 925,
      "coefficients": {
        "effective_rank": 1.297696590423584,
        "effective_rank_mergeability_score": 0.1372118890285492,
        "stable_rank": -1.4690734148025513,
        "spectral_gap": 0.10496644675731659,
        "singular_value_ratio": 1.0013130903244019,
        "layerwise_effective_rank": -0.22739651799201965,
        "layerwise_effective_rank_mergeability_score": -0.04985108971595764,
        "task_vector_cosine_similarity": -0.026922084391117096,
        "task_vector_l2_distance": -0.28480350971221924,
        "task_vector_dot_product": 0.24237589538097382,
        "weight_space_angle": -0.08423373103141785,
        "task_vector_magnitude_ratio": -0.4741450548171997,
        "activation_l2_distance": 0.8731260895729065,
        "activation_cosine_similarity": 1.0758699178695679,
        "activation_magnitude_ratio": 0.018250644207000732,
        "activation_dot_product": 0.013223580084741116,
        "encoder_gradient_cosine_similarity": 0.12333594262599945,
        "encoder_gradient_l2_distance": -0.6911313533782959,
        "encoder_gradient_dot_product": 0.015363299287855625,
        "input_gradient_cosine_similarity": 0.04365519806742668,
        "input_gradient_l2_distance": -0.47013726830482483,
        "input_gradient_dot_product": -0.1697412133216858
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7786013655040758,
      "val_r": 0.6488962996180625,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 9.988219261169434,
        "effective_rank_mergeability_score": -0.18740002810955048,
        "stable_rank": -1.8282643556594849,
        "spectral_gap": 15.165698051452637,
        "singular_value_ratio": 28.629323959350586,
        "layerwise_effective_rank": -11.237648010253906,
        "layerwise_effective_rank_mergeability_score": 2.743936777114868,
        "task_vector_cosine_similarity": 4.599456310272217,
        "task_vector_l2_distance": -17.777786254882812,
        "task_vector_dot_product": 10.397370338439941,
        "weight_space_angle": 5.459417343139648,
        "task_vector_magnitude_ratio": -17.96738052368164,
        "activation_l2_distance": 6.688107967376709,
        "activation_cosine_similarity": 17.34593391418457,
        "activation_magnitude_ratio": -8.901750564575195,
        "activation_dot_product": 30.55018424987793,
        "encoder_gradient_cosine_similarity": 6.123223781585693,
        "encoder_gradient_l2_distance": -60.138423919677734,
        "encoder_gradient_dot_product": -4.537242412567139,
        "input_gradient_cosine_similarity": 9.612516403198242,
        "input_gradient_l2_distance": -5.890133380889893,
        "input_gradient_dot_product": -17.83876609802246
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}