{
  "aggregate_metrics": {
    "train_r": 0.10512498175792483,
    "train_p": 2.211759828377331e-09,
    "val_r": -0.20795638683990952,
    "val_p": 7.358594285931861e-05
  },
  "per_fold_stats": {
    "train_r_mean": 0.51176696134267,
    "train_r_std": 0.29008324648464356,
    "val_r_mean": 0.3678835402333416,
    "val_r_std": 0.29355196368293435
  },
  "average_coefficients": {
    "effective_rank": -6.7596845626831055,
    "effective_rank_mergeability_score": 25.623905181884766,
    "stable_rank": -34.09730911254883,
    "spectral_gap": -18.90238380432129,
    "singular_value_ratio": 31.581707000732422,
    "layerwise_effective_rank": -8.113748550415039,
    "layerwise_effective_rank_mergeability_score": -4.397496700286865,
    "task_vector_cosine_similarity": 18.963287353515625,
    "task_vector_l2_distance": -27.08485984802246,
    "task_vector_dot_product": 38.52593231201172,
    "weight_space_angle": -17.436185836791992,
    "task_vector_magnitude_ratio": 44.63688278198242,
    "activation_l2_distance": 11.489348411560059,
    "activation_cosine_similarity": 1.7216180562973022,
    "activation_magnitude_ratio": -15.763181686401367,
    "activation_dot_product": 8.83303165435791,
    "encoder_gradient_cosine_similarity": 31.801311492919922,
    "encoder_gradient_l2_distance": -3.2287392616271973,
    "encoder_gradient_dot_product": -21.128162384033203,
    "input_gradient_cosine_similarity": 20.456689834594727,
    "input_gradient_l2_distance": -59.281646728515625,
    "input_gradient_dot_product": -16.442514419555664
  },
  "coefficient_std": {
    "effective_rank": 134.74508666992188,
    "effective_rank_mergeability_score": 164.36509704589844,
    "stable_rank": 68.34293365478516,
    "spectral_gap": 103.76392364501953,
    "singular_value_ratio": 80.11180877685547,
    "layerwise_effective_rank": 79.97417449951172,
    "layerwise_effective_rank_mergeability_score": 127.98417663574219,
    "task_vector_cosine_similarity": 88.9659423828125,
    "task_vector_l2_distance": 97.79913330078125,
    "task_vector_dot_product": 85.00641632080078,
    "weight_space_angle": 68.32349395751953,
    "task_vector_magnitude_ratio": 168.19471740722656,
    "activation_l2_distance": 71.74549102783203,
    "activation_cosine_similarity": 55.12752151489258,
    "activation_magnitude_ratio": 82.23844909667969,
    "activation_dot_product": 69.12869262695312,
    "encoder_gradient_cosine_similarity": 107.16895294189453,
    "encoder_gradient_l2_distance": 114.82402801513672,
    "encoder_gradient_dot_product": 153.18353271484375,
    "input_gradient_cosine_similarity": 95.20022583007812,
    "input_gradient_l2_distance": 121.63509368896484,
    "input_gradient_dot_product": 60.941898345947266
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7481721488399978,
      "val_r": 0.6018898403943618,
      "n_iterations": 645,
      "coefficients": {
        "effective_rank": 0.11993422359228134,
        "effective_rank_mergeability_score": -0.017164992168545723,
        "stable_rank": -0.2841717004776001,
        "spectral_gap": 0.0032211607322096825,
        "singular_value_ratio": 0.2787041962146759,
        "layerwise_effective_rank": 0.14321628212928772,
        "layerwise_effective_rank_mergeability_score": 0.05329161137342453,
        "task_vector_cosine_similarity": 0.398360937833786,
        "task_vector_l2_distance": -0.060205794870853424,
        "task_vector_dot_product": 0.02139865979552269,
        "weight_space_angle": 0.3027231693267822,
        "task_vector_magnitude_ratio": -0.2137582153081894,
        "activation_l2_distance": 0.25280508399009705,
        "activation_cosine_similarity": 0.3491460680961609,
        "activation_magnitude_ratio": -0.020172931253910065,
        "activation_dot_product": -0.07224773615598679,
        "encoder_gradient_cosine_similarity": 0.017629852518439293,
        "encoder_gradient_l2_distance": -0.1505742073059082,
        "encoder_gradient_dot_product": -0.009000930935144424,
        "input_gradient_cosine_similarity": 0.015327959321439266,
        "input_gradient_l2_distance": -0.08844441920518875,
        "input_gradient_dot_product": -0.03951291739940643
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6408355309294762,
      "val_r": 0.38917456020486474,
      "n_iterations": 880,
      "coefficients": {
        "effective_rank": 8.272721290588379,
        "effective_rank_mergeability_score": -3.1155734062194824,
        "stable_rank": 44.69996643066406,
        "spectral_gap": 40.560672760009766,
        "singular_value_ratio": -0.134681835770607,
        "layerwise_effective_rank": -43.39711380004883,
        "layerwise_effective_rank_mergeability_score": -10.99774169921875,
        "task_vector_cosine_similarity": 57.1016731262207,
        "task_vector_l2_distance": 3.3561532497406006,
        "task_vector_dot_product": -6.6539692878723145,
        "weight_space_angle": 8.717500686645508,
        "task_vector_magnitude_ratio": 6.858828067779541,
        "activation_l2_distance": -38.89628219604492,
        "activation_cosine_similarity": 10.133366584777832,
        "activation_magnitude_ratio": -15.109967231750488,
        "activation_dot_product": 5.654765605926514,
        "encoder_gradient_cosine_similarity": 4.011516571044922,
        "encoder_gradient_l2_distance": -66.4718246459961,
        "encoder_gradient_dot_product": 24.29950714111328,
        "input_gradient_cosine_similarity": 2.3976638317108154,
        "input_gradient_l2_distance": -47.683067321777344,
        "input_gradient_dot_product": 17.394136428833008
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7540677384964971,
      "val_r": 0.8149353205223813,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 0.9645697474479675,
        "effective_rank_mergeability_score": -0.4875011146068573,
        "stable_rank": -1.3121994733810425,
        "spectral_gap": -0.12957827746868134,
        "singular_value_ratio": 0.8683691620826721,
        "layerwise_effective_rank": -0.08395214378833771,
        "layerwise_effective_rank_mergeability_score": 0.6048736572265625,
        "task_vector_cosine_similarity": -0.19943250715732574,
        "task_vector_l2_distance": -0.4209572374820709,
        "task_vector_dot_product": 0.5918575525283813,
        "weight_space_angle": -0.08741956204175949,
        "task_vector_magnitude_ratio": -0.6276937127113342,
        "activation_l2_distance": 1.3358632326126099,
        "activation_cosine_similarity": 1.7155100107192993,
        "activation_magnitude_ratio": -0.039914801716804504,
        "activation_dot_product": -0.18930044770240784,
        "encoder_gradient_cosine_similarity": 0.05092654004693031,
        "encoder_gradient_l2_distance": -0.8668689727783203,
        "encoder_gradient_dot_product": -0.12619958817958832,
        "input_gradient_cosine_similarity": 0.07721798121929169,
        "input_gradient_l2_distance": -0.5255029201507568,
        "input_gradient_dot_product": -0.1140933558344841
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6916077702110865,
      "val_r": 0.6981613449355816,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 1.214691400527954,
        "effective_rank_mergeability_score": 0.058426085859537125,
        "stable_rank": -9.45583724975586,
        "spectral_gap": 3.971817970275879,
        "singular_value_ratio": -1.5932486057281494,
        "layerwise_effective_rank": 3.3467016220092773,
        "layerwise_effective_rank_mergeability_score": 4.83644962310791,
        "task_vector_cosine_similarity": 9.51919174194336,
        "task_vector_l2_distance": -6.574027061462402,
        "task_vector_dot_product": 0.8171913623809814,
        "weight_space_angle": 0.12524648010730743,
        "task_vector_magnitude_ratio": 12.480134963989258,
        "activation_l2_distance": -0.322563499212265,
        "activation_cosine_similarity": 3.6677989959716797,
        "activation_magnitude_ratio": -3.0699093341827393,
        "activation_dot_product": 10.60316276550293,
        "encoder_gradient_cosine_similarity": 4.848352909088135,
        "encoder_gradient_l2_distance": -17.00718879699707,
        "encoder_gradient_dot_product": -0.5588138103485107,
        "input_gradient_cosine_similarity": 2.8724069595336914,
        "input_gradient_l2_distance": -9.826242446899414,
        "input_gradient_dot_product": -8.954766273498535
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6805225528225028,
      "val_r": 0.641595200822922,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -1.4520230293273926,
        "effective_rank_mergeability_score": -0.26598110795021057,
        "stable_rank": -5.1679253578186035,
        "spectral_gap": 3.488807201385498,
        "singular_value_ratio": 8.008700370788574,
        "layerwise_effective_rank": -3.1059470176696777,
        "layerwise_effective_rank_mergeability_score": 0.6405285596847534,
        "task_vector_cosine_similarity": 6.40254545211792,
        "task_vector_l2_distance": -11.626130104064941,
        "task_vector_dot_product": 9.118964195251465,
        "weight_space_angle": 4.498887538909912,
        "task_vector_magnitude_ratio": 1.3584519624710083,
        "activation_l2_distance": 0.7339187860488892,
        "activation_cosine_similarity": 1.2133890390396118,
        "activation_magnitude_ratio": -1.6491811275482178,
        "activation_dot_product": 17.069087982177734,
        "encoder_gradient_cosine_similarity": 4.470393180847168,
        "encoder_gradient_l2_distance": -12.322340965270996,
        "encoder_gradient_dot_product": -0.13672377169132233,
        "input_gradient_cosine_similarity": 4.96412992477417,
        "input_gradient_l2_distance": -14.318805694580078,
        "input_gradient_dot_product": -10.923911094665527
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5297484094928,
      "val_r": 0.5073161782653899,
      "n_iterations": 721,
      "coefficients": {
        "effective_rank": -162.93545532226562,
        "effective_rank_mergeability_score": -82.37456512451172,
        "stable_rank": -70.89096069335938,
        "spectral_gap": -75.96859741210938,
        "singular_value_ratio": 55.321571350097656,
        "layerwise_effective_rank": 264.1982727050781,
        "layerwise_effective_rank_mergeability_score": 156.35797119140625,
        "task_vector_cosine_similarity": 100.38443756103516,
        "task_vector_l2_distance": -21.06255340576172,
        "task_vector_dot_product": 213.5886993408203,
        "weight_space_angle": -83.89837646484375,
        "task_vector_magnitude_ratio": 4.382890224456787,
        "activation_l2_distance": -211.02577209472656,
        "activation_cosine_similarity": -2.1474545001983643,
        "activation_magnitude_ratio": -210.45419311523438,
        "activation_dot_product": 151.1349639892578,
        "encoder_gradient_cosine_similarity": 187.39608764648438,
        "encoder_gradient_l2_distance": -161.18675231933594,
        "encoder_gradient_dot_product": 157.78189086914062,
        "input_gradient_cosine_similarity": 50.71920394897461,
        "input_gradient_l2_distance": -37.20635986328125,
        "input_gradient_dot_product": -221.1171417236328
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.003931856678251495,
      "val_r": 0.09127026063280433,
      "n_iterations": 414,
      "coefficients": {
        "effective_rank": 460.442626953125,
        "effective_rank_mergeability_score": 712.1309814453125,
        "stable_rank": -243.30633544921875,
        "spectral_gap": -429.93133544921875,
        "singular_value_ratio": 293.56317138671875,
        "layerwise_effective_rank": -146.95289611816406,
        "layerwise_effective_rank_mergeability_score": 396.09423828125,
        "task_vector_cosine_similarity": 87.87913513183594,
        "task_vector_l2_distance": -351.7728271484375,
        "task_vector_dot_product": -45.89754867553711,
        "weight_space_angle": -40.94861602783203,
        "task_vector_magnitude_ratio": 738.4496459960938,
        "activation_l2_distance": 113.7435073852539,
        "activation_cosine_similarity": -25.376527786254883,
        "activation_magnitude_ratio": 46.33535385131836,
        "activation_dot_product": -196.68186950683594,
        "encoder_gradient_cosine_similarity": -289.23876953125,
        "encoder_gradient_l2_distance": 443.3898620605469,
        "encoder_gradient_dot_product": -644.1069946289062,
        "input_gradient_cosine_similarity": -306.2356872558594,
        "input_gradient_l2_distance": -444.0614013671875,
        "input_gradient_dot_product": -126.52117156982422
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5966765546063836,
      "val_r": 0.030085053410448787,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": -5.773185729980469,
        "effective_rank_mergeability_score": -13.762384414672852,
        "stable_rank": -92.1949234008789,
        "spectral_gap": -40.641048431396484,
        "singular_value_ratio": 16.54241943359375,
        "layerwise_effective_rank": 35.27704620361328,
        "layerwise_effective_rank_mergeability_score": 20.95935821533203,
        "task_vector_cosine_similarity": 53.92375946044922,
        "task_vector_l2_distance": -37.201290130615234,
        "task_vector_dot_product": -19.52410316467285,
        "weight_space_angle": -53.668975830078125,
        "task_vector_magnitude_ratio": 7.1351423263549805,
        "activation_l2_distance": 28.592666625976562,
        "activation_cosine_similarity": 32.80476379394531,
        "activation_magnitude_ratio": -30.34326171875,
        "activation_dot_product": 94.25540924072266,
        "encoder_gradient_cosine_similarity": 38.556800842285156,
        "encoder_gradient_l2_distance": -44.77205276489258,
        "encoder_gradient_dot_product": -48.1733512878418,
        "input_gradient_cosine_similarity": 41.01254653930664,
        "input_gradient_l2_distance": -19.22270965576172,
        "input_gradient_dot_product": 37.21578598022461
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7542069227946022,
      "val_r": 0.24350064661915213,
      "n_iterations": 461,
      "coefficients": {
        "effective_rank": -0.12426590919494629,
        "effective_rank_mergeability_score": 0.15055862069129944,
        "stable_rank": 0.20181038975715637,
        "spectral_gap": -0.0335465632379055,
        "singular_value_ratio": 0.279875248670578,
        "layerwise_effective_rank": -0.10520857572555542,
        "layerwise_effective_rank_mergeability_score": -0.008172321133315563,
        "task_vector_cosine_similarity": 0.0707727000117302,
        "task_vector_l2_distance": -0.16496849060058594,
        "task_vector_dot_product": 0.20432499051094055,
        "weight_space_angle": 0.10335812717676163,
        "task_vector_magnitude_ratio": -0.25611796975135803,
        "activation_l2_distance": 0.5480182766914368,
        "activation_cosine_similarity": 0.6584582924842834,
        "activation_magnitude_ratio": 0.006974932737648487,
        "activation_dot_product": -0.06777205318212509,
        "encoder_gradient_cosine_similarity": 0.056088224053382874,
        "encoder_gradient_l2_distance": -0.27543899416923523,
        "encoder_gradient_dot_product": -0.026051292195916176,
        "input_gradient_cosine_similarity": 0.04165274649858475,
        "input_gradient_l2_distance": -0.21444399654865265,
        "input_gradient_dot_product": -0.0464903824031353
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.2943119588054739,
      "val_r": -0.20261207626554667,
      "n_iterations": 595,
      "coefficients": {
        "effective_rank": -21.779916763305664,
        "effective_rank_mergeability_score": -13.159993171691895,
        "stable_rank": -188.0994110107422,
        "spectral_gap": 129.45858764648438,
        "singular_value_ratio": 60.03900146484375,
        "layerwise_effective_rank": -138.46697998046875,
        "layerwise_effective_rank_mergeability_score": -227.4042510986328,
        "task_vector_cosine_similarity": -250.73326110839844,
        "task_vector_l2_distance": 45.25629806518555,
        "task_vector_dot_product": 116.31920623779297,
        "weight_space_angle": 164.7511749267578,
        "task_vector_magnitude_ratio": 110.08290100097656,
        "activation_l2_distance": 76.90904235839844,
        "activation_cosine_similarity": -198.67640686035156,
        "activation_magnitude_ratio": 110.74219512939453,
        "activation_dot_product": -34.729862213134766,
        "encoder_gradient_cosine_similarity": 130.0487060546875,
        "encoder_gradient_l2_distance": 91.38394927978516,
        "encoder_gradient_dot_product": 130.9420623779297,
        "input_gradient_cosine_similarity": 148.53652954101562,
        "input_gradient_l2_distance": -325.1041564941406,
        "input_gradient_dot_product": 84.68199920654297
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.2915619559982968,
      "val_r": 0.31991432736322767,
      "n_iterations": 496,
      "coefficients": {
        "effective_rank": -122.46147918701172,
        "effective_rank_mergeability_score": 50.72157669067383,
        "stable_rank": -63.10405349731445,
        "spectral_gap": -73.95372772216797,
        "singular_value_ratio": -56.18706130981445,
        "layerwise_effective_rank": 45.55643844604492,
        "layerwise_effective_rank_mergeability_score": -283.2310485839844,
        "task_vector_cosine_similarity": -40.75299072265625,
        "task_vector_l2_distance": 141.0513916015625,
        "task_vector_dot_product": 147.26930236816406,
        "weight_space_angle": -143.14657592773438,
        "task_vector_magnitude_ratio": -100.16131591796875,
        "activation_l2_distance": 174.2706756591797,
        "activation_cosine_similarity": 117.26646423339844,
        "activation_magnitude_ratio": 140.72442626953125,
        "activation_dot_product": -68.5719985961914,
        "encoder_gradient_cosine_similarity": 275.6909484863281,
        "encoder_gradient_l2_distance": -79.78544616699219,
        "encoder_gradient_dot_product": 48.738773345947266,
        "input_gradient_cosine_similarity": 97.25777435302734,
        "input_gradient_l2_distance": -219.60926818847656,
        "input_gradient_dot_product": 13.414176940917969
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3124545273894275,
      "val_r": 0.18542335761656137,
      "n_iterations": 861,
      "coefficients": {
        "effective_rank": -327.1493835449219,
        "effective_rank_mergeability_score": -188.57044982910156,
        "stable_rank": -44.98722839355469,
        "spectral_gap": 77.7498550415039,
        "singular_value_ratio": 224.79971313476562,
        "layerwise_effective_rank": -92.7832260131836,
        "layerwise_effective_rank_mergeability_score": -111.82417297363281,
        "task_vector_cosine_similarity": 263.79754638671875,
        "task_vector_l2_distance": -237.79684448242188,
        "task_vector_dot_product": 271.4932861328125,
        "weight_space_angle": -183.5919189453125,
        "task_vector_magnitude_ratio": 181.87094116210938,
        "activation_l2_distance": 87.08587646484375,
        "activation_cosine_similarity": -41.59576416015625,
        "activation_magnitude_ratio": -238.3144073486328,
        "activation_dot_product": 101.65911102294922,
        "encoder_gradient_cosine_similarity": 185.50209045410156,
        "encoder_gradient_l2_distance": -87.02581024169922,
        "encoder_gradient_dot_product": -123.58011627197266,
        "input_gradient_cosine_similarity": 234.96934509277344,
        "input_gradient_l2_distance": 53.43426513671875,
        "input_gradient_dot_product": -4.1445207595825195
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7479483218564886,
      "val_r": 0.5981065524536718,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 0.2371327131986618,
        "effective_rank_mergeability_score": 0.0242390725761652,
        "stable_rank": -0.12237421423196793,
        "spectral_gap": -0.0400029718875885,
        "singular_value_ratio": 0.3462737500667572,
        "layerwise_effective_rank": -0.04213166609406471,
        "layerwise_effective_rank_mergeability_score": 0.11886557191610336,
        "task_vector_cosine_similarity": 0.14832639694213867,
        "task_vector_l2_distance": -0.05506758764386177,
        "task_vector_dot_product": -0.07881398499011993,
        "weight_space_angle": -0.19861534237861633,
        "task_vector_magnitude_ratio": -0.33420178294181824,
        "activation_l2_distance": 0.6890080571174622,
        "activation_cosine_similarity": 0.7797138690948486,
        "activation_magnitude_ratio": 0.008410442620515823,
        "activation_dot_product": -0.09591100364923477,
        "encoder_gradient_cosine_similarity": 0.05840502679347992,
        "encoder_gradient_l2_distance": -0.22534023225307465,
        "encoder_gradient_dot_product": -0.027957117184996605,
        "input_gradient_cosine_similarity": 0.0381387397646904,
        "input_gradient_l2_distance": -0.1708085834980011,
        "input_gradient_dot_product": -0.06232370808720589
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7355025981748119,
      "val_r": 0.788144461569927,
      "n_iterations": 524,
      "coefficients": {
        "effective_rank": 0.6055701375007629,
        "effective_rank_mergeability_score": -0.15882427990436554,
        "stable_rank": -0.8840710520744324,
        "spectral_gap": -0.1479475200176239,
        "singular_value_ratio": 0.33525872230529785,
        "layerwise_effective_rank": 0.2505667507648468,
        "layerwise_effective_rank_mergeability_score": 0.39523452520370483,
        "task_vector_cosine_similarity": 0.24942485988140106,
        "task_vector_l2_distance": -0.14528891444206238,
        "task_vector_dot_product": 0.16178685426712036,
        "weight_space_angle": 0.24782101809978485,
        "task_vector_magnitude_ratio": -0.2532159984111786,
        "activation_l2_distance": 0.4015260338783264,
        "activation_cosine_similarity": 0.5484245419502258,
        "activation_magnitude_ratio": -0.010640530847012997,
        "activation_dot_product": -0.02820897102355957,
        "encoder_gradient_cosine_similarity": 0.048840124160051346,
        "encoder_gradient_l2_distance": -0.33320266008377075,
        "encoder_gradient_dot_product": -0.0350823849439621,
        "input_gradient_cosine_similarity": 0.018144497647881508,
        "input_gradient_l2_distance": -0.20479674637317657,
        "input_gradient_dot_product": -0.07146249711513519
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.14297509930968721,
      "val_r": 0.057574929742201714,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": -0.31477299332618713,
        "effective_rank_mergeability_score": 0.8208369612693787,
        "stable_rank": -0.7623541951179504,
        "spectral_gap": 0.437674343585968,
        "singular_value_ratio": 0.046748679131269455,
        "layerwise_effective_rank": 0.31609711050987244,
        "layerwise_effective_rank_mergeability_score": 0.4520571231842041,
        "task_vector_cosine_similarity": 1.0107792615890503,
        "task_vector_l2_distance": -0.4226069152355194,
        "task_vector_dot_product": 1.1185022592544556,
        "weight_space_angle": 0.07086968421936035,
        "task_vector_magnitude_ratio": -0.41757386922836304,
        "activation_l2_distance": -0.6784181594848633,
        "activation_cosine_similarity": 0.1138995885848999,
        "activation_magnitude_ratio": -0.34349626302719116,
        "activation_dot_product": 0.11872871220111847,
        "encoder_gradient_cosine_similarity": 0.05411722883582115,
        "encoder_gradient_l2_distance": 0.18688692152500153,
        "encoder_gradient_dot_product": 0.7240839600563049,
        "input_gradient_cosine_similarity": -1.2398725748062134,
        "input_gradient_l2_distance": 0.07660845667123795,
        "input_gradient_dot_product": -0.36346352100372314
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6421093027127428,
      "val_r": 0.307580642063504,
      "n_iterations": 961,
      "coefficients": {
        "effective_rank": -27.220674514770508,
        "effective_rank_mergeability_score": 16.324604034423828,
        "stable_rank": 7.979809761047363,
        "spectral_gap": -4.927052974700928,
        "singular_value_ratio": 20.795141220092773,
        "layerwise_effective_rank": -9.472759246826172,
        "layerwise_effective_rank_mergeability_score": 9.297720909118652,
        "task_vector_cosine_similarity": 42.4770622253418,
        "task_vector_l2_distance": -31.867816925048828,
        "task_vector_dot_product": 39.63405990600586,
        "weight_space_angle": -30.27631950378418,
        "task_vector_magnitude_ratio": 8.325090408325195,
        "activation_l2_distance": -2.0526039600372314,
        "activation_cosine_similarity": 31.044069290161133,
        "activation_magnitude_ratio": -28.267515182495117,
        "activation_dot_product": 40.176876068115234,
        "encoder_gradient_cosine_similarity": 28.898149490356445,
        "encoder_gradient_l2_distance": -41.48698043823242,
        "encoder_gradient_dot_product": 4.322728633880615,
        "input_gradient_cosine_similarity": 23.999507904052734,
        "input_gradient_l2_distance": -39.72296905517578,
        "input_gradient_dot_product": -56.981746673583984
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": -0.31913276631971144,
      "val_r": -0.1955568131523215,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 38.576988220214844,
        "effective_rank_mergeability_score": -2.525904417037964,
        "stable_rank": -2.5189151763916016,
        "spectral_gap": 6.717258453369141,
        "singular_value_ratio": -4.930355548858643,
        "layerwise_effective_rank": -39.7415771484375,
        "layerwise_effective_rank_mergeability_score": -30.402835845947266,
        "task_vector_cosine_similarity": -46.41017532348633,
        "task_vector_l2_distance": -3.2263662815093994,
        "task_vector_dot_product": -46.26909255981445,
        "weight_space_angle": 63.73862838745117,
        "task_vector_magnitude_ratio": -45.989341735839844,
        "activation_l2_distance": 30.7739315032959,
        "activation_cosine_similarity": 31.86696434020996,
        "activation_magnitude_ratio": -44.924991607666016,
        "activation_dot_product": -44.105125427246094,
        "encoder_gradient_cosine_similarity": 28.55419921875,
        "encoder_gradient_l2_distance": 23.5854434967041,
        "encoder_gradient_dot_product": 21.652788162231445,
        "input_gradient_cosine_similarity": 28.37063980102539,
        "input_gradient_l2_distance": 23.905303955078125,
        "input_gradient_dot_product": 14.295334815979004
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5730087970460933,
      "val_r": 0.5050268241239677,
      "n_iterations": 656,
      "coefficients": {
        "effective_rank": -6.13053035736084,
        "effective_rank_mergeability_score": 4.0025224685668945,
        "stable_rank": 9.684576988220215,
        "spectral_gap": -7.388463020324707,
        "singular_value_ratio": 27.057693481445312,
        "layerwise_effective_rank": -51.81120681762695,
        "layerwise_effective_rank_mergeability_score": -20.373668670654297,
        "task_vector_cosine_similarity": 28.696434020996094,
        "task_vector_l2_distance": -0.6787588596343994,
        "task_vector_dot_product": 113.9786148071289,
        "weight_space_angle": -29.64109992980957,
        "task_vector_magnitude_ratio": -49.495182037353516,
        "activation_l2_distance": -30.726268768310547,
        "activation_cosine_similarity": 30.455106735229492,
        "activation_magnitude_ratio": -10.077750205993652,
        "activation_dot_product": 79.07794189453125,
        "encoder_gradient_cosine_similarity": 20.39826774597168,
        "encoder_gradient_l2_distance": -99.04806518554688,
        "encoder_gradient_dot_product": -8.77365493774414,
        "input_gradient_cosine_similarity": 53.791568756103516,
        "input_gradient_l2_distance": -14.37897777557373,
        "input_gradient_dot_product": -37.62146759033203
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6787545040585448,
      "val_r": 0.5273134110997005,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 5.627866268157959,
        "effective_rank_mergeability_score": 6.205799102783203,
        "stable_rank": -5.9042792320251465,
        "spectral_gap": 4.225013256072998,
        "singular_value_ratio": 1.5865910053253174,
        "layerwise_effective_rank": -6.338498115539551,
        "layerwise_effective_rank_mergeability_score": -6.204732894897461,
        "task_vector_cosine_similarity": 19.255653381347656,
        "task_vector_l2_distance": -2.184088706970215,
        "task_vector_dot_product": -15.629992485046387,
        "weight_space_angle": -2.453291654586792,
        "task_vector_magnitude_ratio": 8.718740463256836,
        "activation_l2_distance": 2.10265851020813,
        "activation_cosine_similarity": 6.611632823944092,
        "activation_magnitude_ratio": -1.2638654708862305,
        "activation_dot_product": 9.181187629699707,
        "encoder_gradient_cosine_similarity": 2.21889591217041,
        "encoder_gradient_l2_distance": -7.888227939605713,
        "encoder_gradient_dot_product": 0.6486199498176575,
        "input_gradient_cosine_similarity": 4.539358139038086,
        "input_gradient_l2_distance": -18.694395065307617,
        "input_gradient_dot_product": -3.361841917037964
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7360754429499452,
      "val_r": 0.44882678224403294,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 24.08588218688965,
        "effective_rank_mergeability_score": 26.476839065551758,
        "stable_rank": -15.517219543457031,
        "spectral_gap": -11.499252319335938,
        "singular_value_ratio": -15.389694213867188,
        "layerwise_effective_rank": 20.938182830810547,
        "layerwise_effective_rank_mergeability_score": 12.686118125915527,
        "task_vector_cosine_similarity": 46.04654312133789,
        "task_vector_l2_distance": -26.101184844970703,
        "task_vector_dot_product": -9.745064735412598,
        "weight_space_angle": -23.368749618530273,
        "task_vector_magnitude_ratio": 10.823453903198242,
        "activation_l2_distance": -3.9506189823150635,
        "activation_cosine_similarity": 32.99980926513672,
        "activation_magnitude_ratio": -29.191734313964844,
        "activation_dot_product": 12.271684646606445,
        "encoder_gradient_cosine_similarity": 14.384653091430664,
        "encoder_gradient_l2_distance": -4.2748026847839355,
        "encoder_gradient_dot_product": 13.880173683166504,
        "input_gradient_cosine_similarity": 22.988168716430664,
        "input_gradient_l2_distance": -72.01683807373047,
        "input_gradient_dot_product": -25.527856826782227
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}