{
  "aggregate_metrics": {
    "train_r": 0.08872492019430087,
    "train_p": 4.552822674513971e-07,
    "val_r": 0.024868989864025123,
    "val_p": 0.6390908612707774
  },
  "per_fold_stats": {
    "train_r_mean": 0.25677858233075146,
    "train_r_std": 0.15588662091747357,
    "val_r_mean": 0.16483813788403423,
    "val_r_std": 0.2302128065569296
  },
  "average_coefficients": {
    "effective_rank": -10.80048942565918,
    "effective_rank_mergeability_score": -6.478586673736572,
    "stable_rank": 1.3593772649765015,
    "spectral_gap": 4.041551113128662,
    "singular_value_ratio": 9.968103408813477,
    "layerwise_effective_rank": 3.6772568225860596,
    "layerwise_effective_rank_mergeability_score": 26.155597686767578,
    "task_vector_cosine_similarity": 25.824661254882812,
    "task_vector_l2_distance": -9.518388748168945,
    "task_vector_dot_product": 20.27986717224121,
    "weight_space_angle": -33.73535919189453,
    "task_vector_magnitude_ratio": 3.848508358001709,
    "activation_l2_distance": -3.6844191551208496,
    "activation_cosine_similarity": 32.29011535644531,
    "activation_magnitude_ratio": 37.90198516845703,
    "activation_dot_product": -48.47354507446289,
    "encoder_gradient_cosine_similarity": 21.530977249145508,
    "encoder_gradient_l2_distance": -32.021461486816406,
    "encoder_gradient_dot_product": 32.019954681396484,
    "input_gradient_cosine_similarity": 7.986054420471191,
    "input_gradient_l2_distance": -69.92407989501953,
    "input_gradient_dot_product": -11.251485824584961
  },
  "coefficient_std": {
    "effective_rank": 20.556961059570312,
    "effective_rank_mergeability_score": 71.43891143798828,
    "stable_rank": 37.77174377441406,
    "spectral_gap": 48.42186737060547,
    "singular_value_ratio": 50.678585052490234,
    "layerwise_effective_rank": 53.10415267944336,
    "layerwise_effective_rank_mergeability_score": 51.12163162231445,
    "task_vector_cosine_similarity": 33.73120880126953,
    "task_vector_l2_distance": 37.87248611450195,
    "task_vector_dot_product": 32.0881233215332,
    "weight_space_angle": 48.09120559692383,
    "task_vector_magnitude_ratio": 33.026302337646484,
    "activation_l2_distance": 55.54478454589844,
    "activation_cosine_similarity": 56.498836517333984,
    "activation_magnitude_ratio": 128.53671264648438,
    "activation_dot_product": 56.62746047973633,
    "encoder_gradient_cosine_similarity": 38.40305709838867,
    "encoder_gradient_l2_distance": 33.630165100097656,
    "encoder_gradient_dot_product": 40.79428482055664,
    "input_gradient_cosine_similarity": 34.76774215698242,
    "input_gradient_l2_distance": 115.29247283935547,
    "input_gradient_dot_product": 61.867576599121094
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.26035486434525507,
      "val_r": 0.3837354747480434,
      "n_iterations": 691,
      "coefficients": {
        "effective_rank": -9.379380226135254,
        "effective_rank_mergeability_score": 33.258975982666016,
        "stable_rank": -42.218753814697266,
        "spectral_gap": -18.423826217651367,
        "singular_value_ratio": -93.44426727294922,
        "layerwise_effective_rank": 166.7705078125,
        "layerwise_effective_rank_mergeability_score": 117.4383544921875,
        "task_vector_cosine_similarity": -5.997125148773193,
        "task_vector_l2_distance": -60.20436096191406,
        "task_vector_dot_product": 82.88141632080078,
        "weight_space_angle": -81.17196655273438,
        "task_vector_magnitude_ratio": 63.56058883666992,
        "activation_l2_distance": -75.66233825683594,
        "activation_cosine_similarity": 55.14962387084961,
        "activation_magnitude_ratio": -71.43194580078125,
        "activation_dot_product": -102.56514739990234,
        "encoder_gradient_cosine_similarity": 74.87606048583984,
        "encoder_gradient_l2_distance": -37.05782699584961,
        "encoder_gradient_dot_product": 75.28214263916016,
        "input_gradient_cosine_similarity": 67.98141479492188,
        "input_gradient_l2_distance": -52.65443801879883,
        "input_gradient_dot_product": -85.99004364013672
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3956059949189469,
      "val_r": 0.19655810365561469,
      "n_iterations": 716,
      "coefficients": {
        "effective_rank": 3.5524613857269287,
        "effective_rank_mergeability_score": 8.307768821716309,
        "stable_rank": 4.002786159515381,
        "spectral_gap": 2.576845169067383,
        "singular_value_ratio": -4.766049861907959,
        "layerwise_effective_rank": 7.755194187164307,
        "layerwise_effective_rank_mergeability_score": 3.5147924423217773,
        "task_vector_cosine_similarity": 1.2830075025558472,
        "task_vector_l2_distance": -0.8977473974227905,
        "task_vector_dot_product": 1.5666910409927368,
        "weight_space_angle": -0.8586974740028381,
        "task_vector_magnitude_ratio": 2.2377586364746094,
        "activation_l2_distance": -7.590982437133789,
        "activation_cosine_similarity": 1.2974430322647095,
        "activation_magnitude_ratio": -1.3527358770370483,
        "activation_dot_product": -8.309470176696777,
        "encoder_gradient_cosine_similarity": -0.5103645920753479,
        "encoder_gradient_l2_distance": -6.594935894012451,
        "encoder_gradient_dot_product": 4.190763473510742,
        "input_gradient_cosine_similarity": 0.8515767455101013,
        "input_gradient_l2_distance": -6.887408256530762,
        "input_gradient_dot_product": -2.370262622833252
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.36080676654172655,
      "val_r": 0.39868655080121806,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 12.32761001586914,
        "effective_rank_mergeability_score": -0.4845329821109772,
        "stable_rank": -7.716809272766113,
        "spectral_gap": 10.672194480895996,
        "singular_value_ratio": -3.2863049507141113,
        "layerwise_effective_rank": 10.836698532104492,
        "layerwise_effective_rank_mergeability_score": 6.700889587402344,
        "task_vector_cosine_similarity": 6.884379863739014,
        "task_vector_l2_distance": -11.308721542358398,
        "task_vector_dot_product": 16.416400909423828,
        "weight_space_angle": 6.403611660003662,
        "task_vector_magnitude_ratio": -5.233791351318359,
        "activation_l2_distance": 4.385684490203857,
        "activation_cosine_similarity": 26.27412986755371,
        "activation_magnitude_ratio": 0.2369871288537979,
        "activation_dot_product": -25.702423095703125,
        "encoder_gradient_cosine_similarity": -0.4003746509552002,
        "encoder_gradient_l2_distance": -25.871788024902344,
        "encoder_gradient_dot_product": 13.81275749206543,
        "input_gradient_cosine_similarity": 3.666515350341797,
        "input_gradient_l2_distance": -25.97797393798828,
        "input_gradient_dot_product": -11.636483192443848
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.15432945497111938,
      "val_r": 0.37115587221327456,
      "n_iterations": 603,
      "coefficients": {
        "effective_rank": -42.01506423950195,
        "effective_rank_mergeability_score": -156.0621337890625,
        "stable_rank": 61.52558517456055,
        "spectral_gap": 143.9169921875,
        "singular_value_ratio": -22.097110748291016,
        "layerwise_effective_rank": 34.240882873535156,
        "layerwise_effective_rank_mergeability_score": 70.55458068847656,
        "task_vector_cosine_similarity": 53.730777740478516,
        "task_vector_l2_distance": -29.733558654785156,
        "task_vector_dot_product": -11.954333305358887,
        "weight_space_angle": -112.3812026977539,
        "task_vector_magnitude_ratio": -37.08302688598633,
        "activation_l2_distance": -23.109939575195312,
        "activation_cosine_similarity": 111.98150634765625,
        "activation_magnitude_ratio": 184.51222229003906,
        "activation_dot_product": -19.680185317993164,
        "encoder_gradient_cosine_similarity": 56.0048828125,
        "encoder_gradient_l2_distance": -54.12747573852539,
        "encoder_gradient_dot_product": -70.21294403076172,
        "input_gradient_cosine_similarity": -35.178016662597656,
        "input_gradient_l2_distance": -198.51068115234375,
        "input_gradient_dot_product": 96.6758041381836
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.257010269101957,
      "val_r": 0.21973852412243672,
      "n_iterations": 501,
      "coefficients": {
        "effective_rank": -2.304438829421997,
        "effective_rank_mergeability_score": 36.34036636352539,
        "stable_rank": 31.53438949584961,
        "spectral_gap": 5.685209274291992,
        "singular_value_ratio": -17.679048538208008,
        "layerwise_effective_rank": 17.120925903320312,
        "layerwise_effective_rank_mergeability_score": -13.319721221923828,
        "task_vector_cosine_similarity": 20.295503616333008,
        "task_vector_l2_distance": 52.26874542236328,
        "task_vector_dot_product": 26.30342674255371,
        "weight_space_angle": -22.345388412475586,
        "task_vector_magnitude_ratio": -56.122371673583984,
        "activation_l2_distance": -65.13882446289062,
        "activation_cosine_similarity": 46.18889236450195,
        "activation_magnitude_ratio": 44.01821517944336,
        "activation_dot_product": -31.037628173828125,
        "encoder_gradient_cosine_similarity": 2.8889362812042236,
        "encoder_gradient_l2_distance": -43.88055419921875,
        "encoder_gradient_dot_product": 29.312654495239258,
        "input_gradient_cosine_similarity": 42.02341842651367,
        "input_gradient_l2_distance": -80.9242172241211,
        "input_gradient_dot_product": -20.231597900390625
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.2572694119313133,
      "val_r": 0.31923322227178963,
      "n_iterations": 588,
      "coefficients": {
        "effective_rank": -19.795656204223633,
        "effective_rank_mergeability_score": 50.803104400634766,
        "stable_rank": 1.0877180099487305,
        "spectral_gap": 1.9959293603897095,
        "singular_value_ratio": 21.425302505493164,
        "layerwise_effective_rank": -54.41064453125,
        "layerwise_effective_rank_mergeability_score": -18.775615692138672,
        "task_vector_cosine_similarity": 16.634977340698242,
        "task_vector_l2_distance": -18.609264373779297,
        "task_vector_dot_product": 17.466373443603516,
        "weight_space_angle": -2.457412004470825,
        "task_vector_magnitude_ratio": 29.201616287231445,
        "activation_l2_distance": -29.976205825805664,
        "activation_cosine_similarity": 37.813697814941406,
        "activation_magnitude_ratio": 13.071243286132812,
        "activation_dot_product": 12.121170043945312,
        "encoder_gradient_cosine_similarity": 40.876468658447266,
        "encoder_gradient_l2_distance": -6.451660633087158,
        "encoder_gradient_dot_product": 33.16566848754883,
        "input_gradient_cosine_similarity": 10.29902172088623,
        "input_gradient_l2_distance": -101.67066192626953,
        "input_gradient_dot_product": -32.81783676147461
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.461250594533448,
      "val_r": -0.2035103088196885,
      "n_iterations": 1000,
      "coefficients": {
        "effective_rank": 13.735724449157715,
        "effective_rank_mergeability_score": -12.735374450683594,
        "stable_rank": -33.18803787231445,
        "spectral_gap": 34.506370544433594,
        "singular_value_ratio": 10.161706924438477,
        "layerwise_effective_rank": 12.053010940551758,
        "layerwise_effective_rank_mergeability_score": 13.864381790161133,
        "task_vector_cosine_similarity": -9.723039627075195,
        "task_vector_l2_distance": -16.663713455200195,
        "task_vector_dot_product": 12.861859321594238,
        "weight_space_angle": 6.3721160888671875,
        "task_vector_magnitude_ratio": 21.643253326416016,
        "activation_l2_distance": -11.467597007751465,
        "activation_cosine_similarity": 22.657970428466797,
        "activation_magnitude_ratio": 17.87261390686035,
        "activation_dot_product": -35.135921478271484,
        "encoder_gradient_cosine_similarity": 10.208192825317383,
        "encoder_gradient_l2_distance": -33.18538284301758,
        "encoder_gradient_dot_product": 31.134485244750977,
        "input_gradient_cosine_similarity": -3.235677719116211,
        "input_gradient_l2_distance": -26.91900634765625,
        "input_gradient_dot_product": -23.81943130493164
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.2672464289518627,
      "val_r": -0.22635007759635523,
      "n_iterations": 493,
      "coefficients": {
        "effective_rank": -19.438758850097656,
        "effective_rank_mergeability_score": 14.83936882019043,
        "stable_rank": -40.31891632080078,
        "spectral_gap": -5.01287841796875,
        "singular_value_ratio": 23.008607864379883,
        "layerwise_effective_rank": 32.21460723876953,
        "layerwise_effective_rank_mergeability_score": 22.898473739624023,
        "task_vector_cosine_similarity": 28.95951271057129,
        "task_vector_l2_distance": -45.87144088745117,
        "task_vector_dot_product": 43.585845947265625,
        "weight_space_angle": -23.830524444580078,
        "task_vector_magnitude_ratio": -0.2853022515773773,
        "activation_l2_distance": -32.168670654296875,
        "activation_cosine_similarity": 32.1949462890625,
        "activation_magnitude_ratio": -1.0812760591506958,
        "activation_dot_product": -40.17976379394531,
        "encoder_gradient_cosine_similarity": 23.270877838134766,
        "encoder_gradient_l2_distance": -66.94290161132812,
        "encoder_gradient_dot_product": 5.470191478729248,
        "input_gradient_cosine_similarity": 43.38280487060547,
        "input_gradient_l2_distance": -11.150717735290527,
        "input_gradient_dot_product": 17.45275115966797
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.24380436494383645,
      "val_r": -0.394515548301132,
      "n_iterations": 885,
      "coefficients": {
        "effective_rank": 9.771594047546387,
        "effective_rank_mergeability_score": -5.036811351776123,
        "stable_rank": -69.5433120727539,
        "spectral_gap": -18.335763931274414,
        "singular_value_ratio": 13.579228401184082,
        "layerwise_effective_rank": -79.7848892211914,
        "layerwise_effective_rank_mergeability_score": 13.139817237854004,
        "task_vector_cosine_similarity": 44.586997985839844,
        "task_vector_l2_distance": -26.655609130859375,
        "task_vector_dot_product": 7.02794885635376,
        "weight_space_angle": -54.945003509521484,
        "task_vector_magnitude_ratio": 1.7581331729888916,
        "activation_l2_distance": 53.58051681518555,
        "activation_cosine_similarity": 90.36537170410156,
        "activation_magnitude_ratio": -1.7269307374954224,
        "activation_dot_product": -53.93113327026367,
        "encoder_gradient_cosine_similarity": 135.5409698486328,
        "encoder_gradient_l2_distance": -97.95687103271484,
        "encoder_gradient_dot_product": 39.07370376586914,
        "input_gradient_cosine_similarity": 13.467183113098145,
        "input_gradient_l2_distance": -10.429537773132324,
        "input_gradient_dot_product": -2.5475971698760986
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.03817246519827602,
      "val_r": 0.08118719798434594,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 0.5738957524299622,
        "effective_rank_mergeability_score": 2.8444552421569824,
        "stable_rank": -2.074944257736206,
        "spectral_gap": 3.054564952850342,
        "singular_value_ratio": 1.55677330493927,
        "layerwise_effective_rank": -1.0399295091629028,
        "layerwise_effective_rank_mergeability_score": -0.47284403443336487,
        "task_vector_cosine_similarity": 4.958956241607666,
        "task_vector_l2_distance": 0.05471362918615341,
        "task_vector_dot_product": -0.6067521572113037,
        "weight_space_angle": -6.674012184143066,
        "task_vector_magnitude_ratio": 1.9768409729003906,
        "activation_l2_distance": -1.0860674381256104,
        "activation_cosine_similarity": -0.6448934674263,
        "activation_magnitude_ratio": -0.020432135090231895,
        "activation_dot_product": -1.6259827613830566,
        "encoder_gradient_cosine_similarity": -4.736143112182617,
        "encoder_gradient_l2_distance": -1.5387176275253296,
        "encoder_gradient_dot_product": 1.6308043003082275,
        "input_gradient_cosine_similarity": 1.1442235708236694,
        "input_gradient_l2_distance": 4.518240928649902,
        "input_gradient_dot_product": -0.7995033264160156
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.019260567128470622,
      "val_r": 0.11538517624300004,
      "n_iterations": 410,
      "coefficients": {
        "effective_rank": -1.7426605224609375,
        "effective_rank_mergeability_score": -235.68560791015625,
        "stable_rank": 48.961158752441406,
        "spectral_gap": -128.84185791015625,
        "singular_value_ratio": 191.7373809814453,
        "layerwise_effective_rank": -99.08219146728516,
        "layerwise_effective_rank_mergeability_score": 187.78640747070312,
        "task_vector_cosine_similarity": 124.40535736083984,
        "task_vector_l2_distance": 25.891637802124023,
        "task_vector_dot_product": -54.96097946166992,
        "weight_space_angle": -169.13143920898438,
        "task_vector_magnitude_ratio": 90.24247741699219,
        "activation_l2_distance": 179.7671661376953,
        "activation_cosine_similarity": -165.52894592285156,
        "activation_magnitude_ratio": 559.1296997070312,
        "activation_dot_product": -233.97032165527344,
        "encoder_gradient_cosine_similarity": -62.88045120239258,
        "encoder_gradient_l2_distance": 39.54617691040039,
        "encoder_gradient_dot_product": 139.5505828857422,
        "input_gradient_cosine_similarity": -109.69853210449219,
        "input_gradient_l2_distance": -523.9965209960938,
        "input_gradient_dot_product": 199.4980926513672
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.27245061762696,
      "val_r": 0.2637488589642212,
      "n_iterations": 438,
      "coefficients": {
        "effective_rank": 3.833472728729248,
        "effective_rank_mergeability_score": -6.022435665130615,
        "stable_rank": 1.2280066013336182,
        "spectral_gap": 59.012996673583984,
        "singular_value_ratio": -17.539398193359375,
        "layerwise_effective_rank": -13.08182144165039,
        "layerwise_effective_rank_mergeability_score": -18.612701416015625,
        "task_vector_cosine_similarity": -3.025402784347534,
        "task_vector_l2_distance": -11.572588920593262,
        "task_vector_dot_product": 21.56768798828125,
        "weight_space_angle": -15.273694038391113,
        "task_vector_magnitude_ratio": 30.94744300842285,
        "activation_l2_distance": -17.463722229003906,
        "activation_cosine_similarity": 6.067774772644043,
        "activation_magnitude_ratio": 33.494056701660156,
        "activation_dot_product": -9.244593620300293,
        "encoder_gradient_cosine_similarity": 40.08864974975586,
        "encoder_gradient_l2_distance": -69.0750961303711,
        "encoder_gradient_dot_product": 56.95918655395508,
        "input_gradient_cosine_similarity": 23.515073776245117,
        "input_gradient_l2_distance": -34.71204376220703,
        "input_gradient_dot_product": -60.09419250488281
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": -0.020407105194264308,
      "val_r": 0.02880541506430536,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 3.9555532932281494,
        "effective_rank_mergeability_score": 3.240473747253418,
        "stable_rank": -0.30727148056030273,
        "spectral_gap": -5.984139442443848,
        "singular_value_ratio": 7.445952415466309,
        "layerwise_effective_rank": -18.229938507080078,
        "layerwise_effective_rank_mergeability_score": -3.658081531524658,
        "task_vector_cosine_similarity": 20.420270919799805,
        "task_vector_l2_distance": -9.194098472595215,
        "task_vector_dot_product": -2.8897695541381836,
        "weight_space_angle": -4.54027795791626,
        "task_vector_magnitude_ratio": 3.447073221206665,
        "activation_l2_distance": -3.3152966499328613,
        "activation_cosine_similarity": 4.336251735687256,
        "activation_magnitude_ratio": -16.116147994995117,
        "activation_dot_product": 1.8457907438278198,
        "encoder_gradient_cosine_similarity": 18.13555908203125,
        "encoder_gradient_l2_distance": -2.094114065170288,
        "encoder_gradient_dot_product": 2.7138280868530273,
        "input_gradient_cosine_similarity": -14.476668357849121,
        "input_gradient_l2_distance": 11.919195175170898,
        "input_gradient_dot_product": 4.332502365112305
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.20955612821794461,
      "val_r": 0.36685588836299526,
      "n_iterations": 704,
      "coefficients": {
        "effective_rank": 0.32297399640083313,
        "effective_rank_mergeability_score": -8.489228248596191,
        "stable_rank": -34.247413635253906,
        "spectral_gap": -48.067138671875,
        "singular_value_ratio": -10.626395225524902,
        "layerwise_effective_rank": -58.06534957885742,
        "layerwise_effective_rank_mergeability_score": 37.668827056884766,
        "task_vector_cosine_similarity": 65.498291015625,
        "task_vector_l2_distance": 57.998714447021484,
        "task_vector_dot_product": 20.528844833374023,
        "weight_space_angle": -67.1917953491211,
        "task_vector_magnitude_ratio": -29.847131729125977,
        "activation_l2_distance": 56.098304748535156,
        "activation_cosine_similarity": 95.7363052368164,
        "activation_magnitude_ratio": 48.683021545410156,
        "activation_dot_product": -49.25899887084961,
        "encoder_gradient_cosine_similarity": 37.460575103759766,
        "encoder_gradient_l2_distance": 0.2547230124473572,
        "encoder_gradient_dot_product": 58.00896072387695,
        "input_gradient_cosine_similarity": 35.41811752319336,
        "input_gradient_l2_distance": -127.51475524902344,
        "input_gradient_dot_product": -79.37175750732422
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": -0.004693390373420724,
      "val_r": 0.010406806917417728,
      "n_iterations": 51,
      "coefficients": {
        "effective_rank": 4.511791229248047,
        "effective_rank_mergeability_score": 3.8159019947052,
        "stable_rank": -1.6044986248016357,
        "spectral_gap": -2.5327956676483154,
        "singular_value_ratio": -6.9497971534729,
        "layerwise_effective_rank": 2.4426581859588623,
        "layerwise_effective_rank_mergeability_score": 5.23329496383667,
        "task_vector_cosine_similarity": -1.5423955917358398,
        "task_vector_l2_distance": 7.563510894775391,
        "task_vector_dot_product": -2.087329864501953,
        "weight_space_angle": 6.2532429695129395,
        "task_vector_magnitude_ratio": -4.305060386657715,
        "activation_l2_distance": -4.050480842590332,
        "activation_cosine_similarity": -0.8174546957015991,
        "activation_magnitude_ratio": -3.6251256465911865,
        "activation_dot_product": -3.7430260181427,
        "encoder_gradient_cosine_similarity": 1.2743607759475708,
        "encoder_gradient_l2_distance": 6.372336387634277,
        "encoder_gradient_dot_product": -3.97990083694458,
        "input_gradient_cosine_similarity": -2.496690273284912,
        "input_gradient_l2_distance": 9.4553861618042,
        "input_gradient_dot_product": -8.204654693603516
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.41569896931591377,
      "val_r": 0.27365173391746855,
      "n_iterations": 858,
      "coefficients": {
        "effective_rank": -39.84418869018555,
        "effective_rank_mergeability_score": 41.2624626159668,
        "stable_rank": 21.624631881713867,
        "spectral_gap": 10.468597412109375,
        "singular_value_ratio": 14.446237564086914,
        "layerwise_effective_rank": 36.09855651855469,
        "layerwise_effective_rank_mergeability_score": -38.53248977661133,
        "task_vector_cosine_similarity": 80.08833312988281,
        "task_vector_l2_distance": -102.29661560058594,
        "task_vector_dot_product": 102.36444091796875,
        "weight_space_angle": 37.89522933959961,
        "task_vector_magnitude_ratio": -39.362884521484375,
        "activation_l2_distance": 17.524290084838867,
        "activation_cosine_similarity": 50.127960205078125,
        "activation_magnitude_ratio": -12.264843940734863,
        "activation_dot_product": -110.61964416503906,
        "encoder_gradient_cosine_similarity": -10.90197467803955,
        "encoder_gradient_l2_distance": -42.73036575317383,
        "encoder_gradient_dot_product": 54.701934814453125,
        "input_gradient_cosine_similarity": 11.276738166809082,
        "input_gradient_l2_distance": -55.93640899658203,
        "input_gradient_dot_product": -24.39179801940918
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3200294817368204,
      "val_r": 0.17328606763108167,
      "n_iterations": 820,
      "coefficients": {
        "effective_rank": -27.825143814086914,
        "effective_rank_mergeability_score": 28.371234893798828,
        "stable_rank": 32.53577423095703,
        "spectral_gap": 10.32785701751709,
        "singular_value_ratio": 20.62294578552246,
        "layerwise_effective_rank": 15.691804885864258,
        "layerwise_effective_rank_mergeability_score": 27.490625381469727,
        "task_vector_cosine_similarity": 50.29215621948242,
        "task_vector_l2_distance": -27.438148498535156,
        "task_vector_dot_product": 25.832990646362305,
        "weight_space_angle": -40.1937370300293,
        "task_vector_magnitude_ratio": -0.19319815933704376,
        "activation_l2_distance": -10.519682884216309,
        "activation_cosine_similarity": 72.9981918334961,
        "activation_magnitude_ratio": -18.378686904907227,
        "activation_dot_product": -101.4349594116211,
        "encoder_gradient_cosine_similarity": 24.24278450012207,
        "encoder_gradient_l2_distance": -41.47803497314453,
        "encoder_gradient_dot_product": 43.1351432800293,
        "input_gradient_cosine_similarity": 25.55318260192871,
        "input_gradient_l2_distance": -54.95563507080078,
        "input_gradient_dot_product": -53.679351806640625
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.37859523892155955,
      "val_r": 0.24821875236560292,
      "n_iterations": 648,
      "coefficients": {
        "effective_rank": -3.6004478931427,
        "effective_rank_mergeability_score": -13.894882202148438,
        "stable_rank": -0.1687500774860382,
        "spectral_gap": 20.701202392578125,
        "singular_value_ratio": -8.647724151611328,
        "layerwise_effective_rank": 20.166980743408203,
        "layerwise_effective_rank_mergeability_score": 22.893138885498047,
        "task_vector_cosine_similarity": -5.568740367889404,
        "task_vector_l2_distance": -7.29757833480835,
        "task_vector_dot_product": 35.94725036621094,
        "weight_space_angle": -0.9030632376670837,
        "task_vector_magnitude_ratio": 6.254164218902588,
        "activation_l2_distance": -22.158916473388672,
        "activation_cosine_similarity": 20.879972457885742,
        "activation_magnitude_ratio": 8.05013656616211,
        "activation_dot_product": -44.48179244995117,
        "encoder_gradient_cosine_similarity": 6.113077163696289,
        "encoder_gradient_l2_distance": -17.33171272277832,
        "encoder_gradient_dot_product": 28.36349868774414,
        "input_gradient_cosine_similarity": 19.926755905151367,
        "input_gradient_l2_distance": -30.541868209838867,
        "input_gradient_dot_product": -33.70298767089844
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5843177380683563,
      "val_r": 0.56547749234015,
      "n_iterations": 848,
      "coefficients": {
        "effective_rank": -53.605403900146484,
        "effective_rank_mergeability_score": -31.29422378540039,
        "stable_rank": -33.97666549682617,
        "spectral_gap": 28.605361938476562,
        "singular_value_ratio": 14.914342880249023,
        "layerwise_effective_rank": 30.296066284179688,
        "layerwise_effective_rank_mergeability_score": 11.561715126037598,
        "task_vector_cosine_similarity": 15.511406898498535,
        "task_vector_l2_distance": 58.90272903442383,
        "task_vector_dot_product": 35.909461975097656,
        "weight_space_angle": -46.180747985839844,
        "task_vector_magnitude_ratio": 15.984819412231445,
        "activation_l2_distance": 16.112770080566406,
        "activation_cosine_similarity": 86.98771667480469,
        "activation_magnitude_ratio": -25.295717239379883,
        "activation_dot_product": -8.749300956726074,
        "encoder_gradient_cosine_similarity": 3.667642593383789,
        "encoder_gradient_l2_distance": -48.96818923950195,
        "encoder_gradient_dot_product": 18.052900314331055,
        "input_gradient_cosine_similarity": 8.099178314208984,
        "input_gradient_l2_distance": -50.549072265625,
        "input_gradient_dot_product": -44.988685607910156
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.26491278572894705,
      "val_r": 0.1050075547948946,
      "n_iterations": 704,
      "coefficients": {
        "effective_rank": -49.043739318847656,
        "effective_rank_mergeability_score": 117.04937744140625,
        "stable_rank": 90.05286407470703,
        "spectral_gap": -23.49470329284668,
        "singular_value_ratio": 65.49968719482422,
        "layerwise_effective_rank": 11.552010536193848,
        "layerwise_effective_rank_mergeability_score": 75.73809051513672,
        "task_vector_cosine_similarity": 8.799942016601562,
        "task_vector_l2_distance": -25.30438232421875,
        "task_vector_dot_product": 27.835893630981445,
        "weight_space_angle": -83.55245208740234,
        "task_vector_magnitude_ratio": -17.851238250732422,
        "activation_l2_distance": -97.44840240478516,
        "activation_cosine_similarity": 51.735862731933594,
        "activation_magnitude_ratio": 0.265252023935318,
        "activation_dot_product": -103.7675552368164,
        "encoder_gradient_cosine_similarity": 35.399879455566406,
        "encoder_gradient_l2_distance": -91.31675720214844,
        "encoder_gradient_dot_product": 80.03263854980469,
        "input_gradient_cosine_similarity": 18.201465606689453,
        "input_gradient_l2_distance": -31.04338836669922,
        "input_gradient_dot_product": -58.34267807006836
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}