{
  "aggregate_metrics": {
    "train_mse": 203.33887427833918,
    "train_r2": -14826.024764467677,
    "train_pearson_r": 0.014196215290816992,
    "train_pearson_p": 0.42050645684764265,
    "val_mse": 214.887141243676,
    "val_r2": -15668.09903639886,
    "val_pearson_r": -0.06217753611763909,
    "val_pearson_p": 0.2406051480558673
  },
  "per_fold_stats": {
    "train_mse_mean": 202.21669989124206,
    "train_mse_std": 876.0751191951183,
    "val_mse_mean": 226.17567054949623,
    "val_mse_std": 979.146216814534,
    "train_r_mean": 0.07625783065008787,
    "train_r_std": 0.1323439898779083,
    "val_r_mean": 0.08190730434074647,
    "val_r_std": 0.197799498826537
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.19084852933883667,
    "right_subspace_overlap_bottom_k": -0.7688701748847961,
    "interaction_matrix_overlap_top_k": 0.499372661113739,
    "interaction_matrix_overlap_bottom_k": 0.33530324697494507,
    "effective_rank": -1.8433221578598022,
    "effective_rank_mergeability_score": -0.07229985296726227,
    "stable_rank": -0.17211191356182098,
    "spectral_gap": 1.5110061168670654,
    "singular_value_ratio": 1.2150951623916626,
    "layerwise_effective_rank": 1.17367684841156,
    "layerwise_effective_rank_mergeability_score": 2.855938673019409,
    "task_vector_cosine_similarity": -1.145220160484314,
    "task_vector_l2_distance": -0.6551850438117981,
    "task_vector_dot_product": 0.8074405789375305,
    "weight_space_angle": -0.7864280939102173,
    "task_vector_magnitude_ratio": -0.04690765216946602,
    "singular_value_overlap": -0.14943332970142365,
    "subspace_overlap": -1.166695475578308,
    "right_subspace_overlap": -0.571045994758606,
    "activation_l2_distance": -0.7451198697090149,
    "activation_cosine_similarity": 0.14132744073867798,
    "activation_magnitude_ratio": 0.28263646364212036,
    "activation_dot_product": 0.4128771424293518,
    "encoder_gradient_cosine_similarity": -0.21290525794029236,
    "encoder_gradient_l2_distance": 1.264595866203308,
    "encoder_gradient_dot_product": -0.2422790229320526,
    "input_gradient_cosine_similarity": -0.35566583275794983,
    "input_gradient_l2_distance": 0.21039243042469025,
    "input_gradient_dot_product": -0.9745997190475464
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.5706644654273987,
    "right_subspace_overlap_bottom_k": 2.2825136184692383,
    "interaction_matrix_overlap_top_k": 1.5748592615127563,
    "interaction_matrix_overlap_bottom_k": 1.659278154373169,
    "effective_rank": 6.9234089851379395,
    "effective_rank_mergeability_score": 1.0580519437789917,
    "stable_rank": 1.3540372848510742,
    "spectral_gap": 5.309899806976318,
    "singular_value_ratio": 4.043066024780273,
    "layerwise_effective_rank": 3.838733434677124,
    "layerwise_effective_rank_mergeability_score": 10.955427169799805,
    "task_vector_cosine_similarity": 3.846855401992798,
    "task_vector_l2_distance": 2.9753777980804443,
    "task_vector_dot_product": 3.1980838775634766,
    "weight_space_angle": 3.7270522117614746,
    "task_vector_magnitude_ratio": 1.1358726024627686,
    "singular_value_overlap": 2.348289728164673,
    "subspace_overlap": 4.057639122009277,
    "right_subspace_overlap": 3.2014787197113037,
    "activation_l2_distance": 2.1147308349609375,
    "activation_cosine_similarity": 0.765545129776001,
    "activation_magnitude_ratio": 0.4787321388721466,
    "activation_dot_product": 1.704944372177124,
    "encoder_gradient_cosine_similarity": 2.0359046459198,
    "encoder_gradient_l2_distance": 4.928892612457275,
    "encoder_gradient_dot_product": 2.7708916664123535,
    "input_gradient_cosine_similarity": 1.5144866704940796,
    "input_gradient_l2_distance": 3.4977834224700928,
    "input_gradient_dot_product": 3.626002550125122
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.17302778998278573,
      "train_r2": -11.033790720318438,
      "train_pearson_r": 0.0762345294837552,
      "val_mse": 0.21587778517171965,
      "val_r2": -28.414728537106015,
      "val_pearson_r": 0.3729196769656553,
      "n_iterations": 57,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.2939257323741913,
        "right_subspace_overlap_bottom_k": 0.5545640587806702,
        "interaction_matrix_overlap_top_k": 0.6688445210456848,
        "interaction_matrix_overlap_bottom_k": -0.3108638525009155,
        "effective_rank": 0.10320203006267548,
        "effective_rank_mergeability_score": -0.14188231527805328,
        "stable_rank": -0.9131637811660767,
        "spectral_gap": 0.4181327223777771,
        "singular_value_ratio": 1.358400583267212,
        "layerwise_effective_rank": -0.8420835733413696,
        "layerwise_effective_rank_mergeability_score": -0.30885422229766846,
        "task_vector_cosine_similarity": -0.29910025000572205,
        "task_vector_l2_distance": -0.48896774649620056,
        "task_vector_dot_product": 0.4685319662094116,
        "weight_space_angle": 0.3687526285648346,
        "task_vector_magnitude_ratio": 0.07096366584300995,
        "singular_value_overlap": 0.1078319400548935,
        "subspace_overlap": -1.837984323501587,
        "right_subspace_overlap": 0.9204232692718506,
        "activation_l2_distance": -0.01808871515095234,
        "activation_cosine_similarity": -0.043995533138513565,
        "activation_magnitude_ratio": 0.1367330253124237,
        "activation_dot_product": 0.05976630747318268,
        "encoder_gradient_cosine_similarity": 0.3072780668735504,
        "encoder_gradient_l2_distance": -0.38045379519462585,
        "encoder_gradient_dot_product": 0.9230774641036987,
        "input_gradient_cosine_similarity": 0.07720524817705154,
        "input_gradient_l2_distance": -0.3204299211502075,
        "input_gradient_dot_product": 0.6411697268486023
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 16.48768180647519,
      "train_r2": -1147.1145076834505,
      "train_pearson_r": 0.012147786593088997,
      "val_mse": 22.52061417970381,
      "val_r2": -2890.974232796764,
      "val_pearson_r": 0.228192319295458,
      "n_iterations": 91,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.8906164169311523,
        "right_subspace_overlap_bottom_k": -3.4812355041503906,
        "interaction_matrix_overlap_top_k": 4.8431172370910645,
        "interaction_matrix_overlap_bottom_k": 0.33135494589805603,
        "effective_rank": -4.470944404602051,
        "effective_rank_mergeability_score": -2.4655048847198486,
        "stable_rank": 2.8188796043395996,
        "spectral_gap": 1.7053773403167725,
        "singular_value_ratio": 6.271564483642578,
        "layerwise_effective_rank": 2.7966551780700684,
        "layerwise_effective_rank_mergeability_score": 2.102994441986084,
        "task_vector_cosine_similarity": -1.3490220308303833,
        "task_vector_l2_distance": 0.33005666732788086,
        "task_vector_dot_product": -1.6851727962493896,
        "weight_space_angle": -2.2087483406066895,
        "task_vector_magnitude_ratio": -4.205746173858643,
        "singular_value_overlap": 2.849130630493164,
        "subspace_overlap": -1.2633581161499023,
        "right_subspace_overlap": 1.3914917707443237,
        "activation_l2_distance": -5.836390495300293,
        "activation_cosine_similarity": -1.0099098682403564,
        "activation_magnitude_ratio": 1.1258758306503296,
        "activation_dot_product": 0.41804009675979614,
        "encoder_gradient_cosine_similarity": 1.6536598205566406,
        "encoder_gradient_l2_distance": 8.954771041870117,
        "encoder_gradient_dot_product": 3.2400524616241455,
        "input_gradient_cosine_similarity": -3.7272541522979736,
        "input_gradient_l2_distance": -3.2628724575042725,
        "input_gradient_dot_product": -6.785585403442383
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.9011013882321851,
      "train_r2": -62.0671097409711,
      "train_pearson_r": 0.017415952129969464,
      "val_mse": 0.39788553156669554,
      "val_r2": -51.64392067079144,
      "val_pearson_r": 0.23080680462585268,
      "n_iterations": 85,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.5240185260772705,
        "right_subspace_overlap_bottom_k": -0.08513104170560837,
        "interaction_matrix_overlap_top_k": -1.3955399990081787,
        "interaction_matrix_overlap_bottom_k": -0.7694824934005737,
        "effective_rank": -1.0496501922607422,
        "effective_rank_mergeability_score": -0.41877973079681396,
        "stable_rank": -0.7304440140724182,
        "spectral_gap": -0.9774077534675598,
        "singular_value_ratio": 0.3529066741466522,
        "layerwise_effective_rank": 0.6195008754730225,
        "layerwise_effective_rank_mergeability_score": 1.5947614908218384,
        "task_vector_cosine_similarity": -2.1547181606292725,
        "task_vector_l2_distance": 0.681984007358551,
        "task_vector_dot_product": 0.07943529635667801,
        "weight_space_angle": -0.5609956383705139,
        "task_vector_magnitude_ratio": 0.7067607641220093,
        "singular_value_overlap": 0.5171496272087097,
        "subspace_overlap": 1.8623924255371094,
        "right_subspace_overlap": 1.3910428285598755,
        "activation_l2_distance": 0.6226107478141785,
        "activation_cosine_similarity": 1.4306029081344604,
        "activation_magnitude_ratio": 1.413681983947754,
        "activation_dot_product": -0.20380599796772003,
        "encoder_gradient_cosine_similarity": -0.2554261088371277,
        "encoder_gradient_l2_distance": -0.18495692312717438,
        "encoder_gradient_dot_product": -1.3168702125549316,
        "input_gradient_cosine_similarity": 0.2894432246685028,
        "input_gradient_l2_distance": -0.9730249047279358,
        "input_gradient_dot_product": 1.0243483781814575
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.07776640646730022,
      "train_r2": -4.524027173140446,
      "train_pearson_r": 0.021666049261349934,
      "val_mse": 0.035272618443588755,
      "val_r2": -3.698216331791283,
      "val_pearson_r": -0.20493223660706147,
      "n_iterations": 93,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.04052373766899109,
        "right_subspace_overlap_bottom_k": 0.044705867767333984,
        "interaction_matrix_overlap_top_k": -0.791556715965271,
        "interaction_matrix_overlap_bottom_k": 0.1394132822751999,
        "effective_rank": -0.15931841731071472,
        "effective_rank_mergeability_score": 0.24318835139274597,
        "stable_rank": 0.4027305543422699,
        "spectral_gap": -0.4312356412410736,
        "singular_value_ratio": 0.16221918165683746,
        "layerwise_effective_rank": -0.0882672369480133,
        "layerwise_effective_rank_mergeability_score": -0.14505328238010406,
        "task_vector_cosine_similarity": 0.01231206301599741,
        "task_vector_l2_distance": -0.1264183521270752,
        "task_vector_dot_product": 0.267981618642807,
        "weight_space_angle": 0.38865476846694946,
        "task_vector_magnitude_ratio": -0.7352321743965149,
        "singular_value_overlap": 0.24837738275527954,
        "subspace_overlap": -0.14864054322242737,
        "right_subspace_overlap": 0.23653343319892883,
        "activation_l2_distance": 0.1681593656539917,
        "activation_cosine_similarity": 0.12256532907485962,
        "activation_magnitude_ratio": 0.18066371977329254,
        "activation_dot_product": 0.17003029584884644,
        "encoder_gradient_cosine_similarity": 0.25297102332115173,
        "encoder_gradient_l2_distance": 0.25820547342300415,
        "encoder_gradient_dot_product": 0.29318609833717346,
        "input_gradient_cosine_similarity": 0.34268683195114136,
        "input_gradient_l2_distance": -0.5038148760795593,
        "input_gradient_dot_product": 0.22924640774726868
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.022007930506065386,
      "train_r2": -0.5347321888455399,
      "train_pearson_r": 0.16212267041583137,
      "val_mse": 0.02101953949657413,
      "val_r2": -1.708401933624193,
      "val_pearson_r": 0.07580421530086985,
      "n_iterations": 273,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.2010032832622528,
        "right_subspace_overlap_bottom_k": 0.21644149720668793,
        "interaction_matrix_overlap_top_k": -0.20289652049541473,
        "interaction_matrix_overlap_bottom_k": -0.16857990622520447,
        "effective_rank": 0.25186455249786377,
        "effective_rank_mergeability_score": -0.769839346408844,
        "stable_rank": -0.387478768825531,
        "spectral_gap": 0.7485547661781311,
        "singular_value_ratio": -0.5752421021461487,
        "layerwise_effective_rank": 0.051385197788476944,
        "layerwise_effective_rank_mergeability_score": 0.6748127341270447,
        "task_vector_cosine_similarity": -0.7937504053115845,
        "task_vector_l2_distance": -0.15732939541339874,
        "task_vector_dot_product": 0.5753923654556274,
        "weight_space_angle": 0.44830232858657837,
        "task_vector_magnitude_ratio": 1.2598754167556763,
        "singular_value_overlap": 0.06649716198444366,
        "subspace_overlap": 0.13846705853939056,
        "right_subspace_overlap": -0.0748104527592659,
        "activation_l2_distance": -0.216685950756073,
        "activation_cosine_similarity": -0.10149048268795013,
        "activation_magnitude_ratio": -0.02198087051510811,
        "activation_dot_product": 0.018865231424570084,
        "encoder_gradient_cosine_similarity": 0.03154822438955307,
        "encoder_gradient_l2_distance": 0.019539568573236465,
        "encoder_gradient_dot_product": 0.13049036264419556,
        "input_gradient_cosine_similarity": -0.0896737277507782,
        "input_gradient_l2_distance": -0.17866277694702148,
        "input_gradient_dot_product": -0.09715614467859268
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_mse": 0.07566599856537536,
      "train_r2": -4.129556784182318,
      "train_pearson_r": -0.08582047151559989,
      "val_mse": 0.08372529546886703,
      "val_r2": -25.688724585069064,
      "val_pearson_r": -0.4233888720585314,
      "n_iterations": 129,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.2709823250770569,
        "right_subspace_overlap_bottom_k": -0.11834828555583954,
        "interaction_matrix_overlap_top_k": 0.3342590034008026,
        "interaction_matrix_overlap_bottom_k": -0.20566080510616302,
        "effective_rank": -0.4248369336128235,
        "effective_rank_mergeability_score": -0.5747389197349548,
        "stable_rank": 0.4327804744243622,
        "spectral_gap": 0.6802686452865601,
        "singular_value_ratio": -0.151575967669487,
        "layerwise_effective_rank": 0.21569392085075378,
        "layerwise_effective_rank_mergeability_score": 0.15005946159362793,
        "task_vector_cosine_similarity": -0.029348358511924744,
        "task_vector_l2_distance": 0.28623276948928833,
        "task_vector_dot_product": 0.047459255903959274,
        "weight_space_angle": 0.027144838124513626,
        "task_vector_magnitude_ratio": 0.2623170018196106,
        "singular_value_overlap": 0.18974068760871887,
        "subspace_overlap": 0.02200273983180523,
        "right_subspace_overlap": -0.1700102984905243,
        "activation_l2_distance": -0.30003538727760315,
        "activation_cosine_similarity": 0.009352131746709347,
        "activation_magnitude_ratio": 0.14064809679985046,
        "activation_dot_product": -0.32661381363868713,
        "encoder_gradient_cosine_similarity": 0.4007464647293091,
        "encoder_gradient_l2_distance": 0.5473209619522095,
        "encoder_gradient_dot_product": 0.5584323406219482,
        "input_gradient_cosine_similarity": -0.29397088289260864,
        "input_gradient_l2_distance": -0.3661019504070282,
        "input_gradient_dot_product": -0.07928495109081268
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_mse": 0.05732439203951912,
      "train_r2": -3.242368949649726,
      "train_pearson_r": -0.08071871614525698,
      "val_mse": 0.04803586844570328,
      "val_r2": -4.500231258181488,
      "val_pearson_r": -0.10452900722106641,
      "n_iterations": 53,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.36678817868232727,
        "right_subspace_overlap_bottom_k": -0.10240638256072998,
        "interaction_matrix_overlap_top_k": -0.005736851133406162,
        "interaction_matrix_overlap_bottom_k": -0.253375381231308,
        "effective_rank": 0.09633847326040268,
        "effective_rank_mergeability_score": -0.3706459701061249,
        "stable_rank": -0.04588766396045685,
        "spectral_gap": 0.16882406175136566,
        "singular_value_ratio": -0.07623786479234695,
        "layerwise_effective_rank": 0.19505266845226288,
        "layerwise_effective_rank_mergeability_score": 0.3162865936756134,
        "task_vector_cosine_similarity": -0.2525257170200348,
        "task_vector_l2_distance": 0.1552565097808838,
        "task_vector_dot_product": 0.21713915467262268,
        "weight_space_angle": 0.3243441879749298,
        "task_vector_magnitude_ratio": -0.0702962651848793,
        "singular_value_overlap": 0.17593492567539215,
        "subspace_overlap": 0.10246460139751434,
        "right_subspace_overlap": -0.1321127563714981,
        "activation_l2_distance": 0.11989389359951019,
        "activation_cosine_similarity": 0.3046671450138092,
        "activation_magnitude_ratio": -0.0806131586432457,
        "activation_dot_product": 0.08444967120885849,
        "encoder_gradient_cosine_similarity": 0.16440218687057495,
        "encoder_gradient_l2_distance": -0.3414521813392639,
        "encoder_gradient_dot_product": -0.10264937579631805,
        "input_gradient_cosine_similarity": 0.14797484874725342,
        "input_gradient_l2_distance": -0.04715326055884361,
        "input_gradient_dot_product": -0.05475600063800812
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.6171973214986177,
      "train_r2": -45.222475993450466,
      "train_pearson_r": 0.24063188054785734,
      "val_mse": 2.475624301000171,
      "val_r2": -355.18543286337444,
      "val_pearson_r": 0.043371043863279765,
      "n_iterations": 68,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.8156259655952454,
        "right_subspace_overlap_bottom_k": 0.5783103704452515,
        "interaction_matrix_overlap_top_k": -0.04246046766638756,
        "interaction_matrix_overlap_bottom_k": 0.940304160118103,
        "effective_rank": -0.1158786341547966,
        "effective_rank_mergeability_score": 1.0872894525527954,
        "stable_rank": 0.4768866300582886,
        "spectral_gap": -0.3715202808380127,
        "singular_value_ratio": 0.9001718163490295,
        "layerwise_effective_rank": 0.578191339969635,
        "layerwise_effective_rank_mergeability_score": 1.3070114850997925,
        "task_vector_cosine_similarity": 1.5991392135620117,
        "task_vector_l2_distance": -0.25386688113212585,
        "task_vector_dot_product": -1.3137412071228027,
        "weight_space_angle": -0.9332020282745361,
        "task_vector_magnitude_ratio": -0.11599310487508774,
        "singular_value_overlap": -0.4723815619945526,
        "subspace_overlap": -1.681596279144287,
        "right_subspace_overlap": -1.2277145385742188,
        "activation_l2_distance": -0.9375064373016357,
        "activation_cosine_similarity": -0.279215931892395,
        "activation_magnitude_ratio": 0.5944496393203735,
        "activation_dot_product": 0.24791671335697174,
        "encoder_gradient_cosine_similarity": 0.9315415024757385,
        "encoder_gradient_l2_distance": -0.920303225517273,
        "encoder_gradient_dot_product": 0.3550508916378021,
        "input_gradient_cosine_similarity": 0.8104203939437866,
        "input_gradient_l2_distance": -1.8797580003738403,
        "input_gradient_dot_product": 0.3015323579311371
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_mse": 0.01871625914204895,
      "train_r2": -0.3093434369614263,
      "train_pearson_r": 0.27920157957387554,
      "val_mse": 0.021285715760628154,
      "val_r2": -1.7483725510232042,
      "val_pearson_r": 0.27548929689401797,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.06643776595592499,
        "right_subspace_overlap_bottom_k": 0.2323455512523651,
        "interaction_matrix_overlap_top_k": -0.3255864381790161,
        "interaction_matrix_overlap_bottom_k": -0.19660262763500214,
        "effective_rank": 0.6165199279785156,
        "effective_rank_mergeability_score": 0.33310002088546753,
        "stable_rank": 0.19410596787929535,
        "spectral_gap": 0.3054255247116089,
        "singular_value_ratio": -0.0037266691215336323,
        "layerwise_effective_rank": -0.006032327655702829,
        "layerwise_effective_rank_mergeability_score": 0.2340167909860611,
        "task_vector_cosine_similarity": 0.046656910330057144,
        "task_vector_l2_distance": -0.09690306335687637,
        "task_vector_dot_product": 0.3327848017215729,
        "weight_space_angle": 0.49361905455589294,
        "task_vector_magnitude_ratio": 0.022687070071697235,
        "singular_value_overlap": -0.024208806455135345,
        "subspace_overlap": -0.43659162521362305,
        "right_subspace_overlap": 0.4737972915172577,
        "activation_l2_distance": -0.4657137393951416,
        "activation_cosine_similarity": -0.3170008659362793,
        "activation_magnitude_ratio": -0.040928684175014496,
        "activation_dot_product": -0.005997750908136368,
        "encoder_gradient_cosine_similarity": 0.01143110916018486,
        "encoder_gradient_l2_distance": -0.2550084888935089,
        "encoder_gradient_dot_product": 0.2089548408985138,
        "input_gradient_cosine_similarity": -0.13859950006008148,
        "input_gradient_l2_distance": -0.11091472953557968,
        "input_gradient_dot_product": -0.1476345658302307
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.03339524795251623,
      "train_r2": -1.311752446286341,
      "train_pearson_r": -0.07598841825832406,
      "val_mse": 0.15092354830886365,
      "val_r2": -18.99337022550123,
      "val_pearson_r": 0.2423800288798209,
      "n_iterations": 69,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.16700363159179688,
        "right_subspace_overlap_bottom_k": -0.06543021649122238,
        "interaction_matrix_overlap_top_k": -0.05275604873895645,
        "interaction_matrix_overlap_bottom_k": -0.1438804566860199,
        "effective_rank": 0.18223436176776886,
        "effective_rank_mergeability_score": 0.29056480526924133,
        "stable_rank": 0.1692027747631073,
        "spectral_gap": -0.11875621974468231,
        "singular_value_ratio": -0.08984585106372833,
        "layerwise_effective_rank": 0.26404112577438354,
        "layerwise_effective_rank_mergeability_score": 0.04640854522585869,
        "task_vector_cosine_similarity": -0.011000963859260082,
        "task_vector_l2_distance": 0.08656211197376251,
        "task_vector_dot_product": -0.26480233669281006,
        "weight_space_angle": 0.19965898990631104,
        "task_vector_magnitude_ratio": -0.25994378328323364,
        "singular_value_overlap": 0.12307320535182953,
        "subspace_overlap": 0.018332209438085556,
        "right_subspace_overlap": 0.1864997297525406,
        "activation_l2_distance": -0.053501371294260025,
        "activation_cosine_similarity": 0.1524784415960312,
        "activation_magnitude_ratio": -0.04367846995592117,
        "activation_dot_product": 0.060151007026433945,
        "encoder_gradient_cosine_similarity": 0.19461920857429504,
        "encoder_gradient_l2_distance": -0.04324115440249443,
        "encoder_gradient_dot_product": 0.27408209443092346,
        "input_gradient_cosine_similarity": -0.1395675092935562,
        "input_gradient_l2_distance": 0.12733229994773865,
        "input_gradient_dot_product": -0.2544173300266266
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.020655769875513135,
      "train_r2": -0.5138173383543616,
      "train_pearson_r": 0.21881326775680715,
      "val_mse": 0.023187115194873664,
      "val_r2": -2.5942219953725574,
      "val_pearson_r": 0.23623717034598618,
      "n_iterations": 684,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.33562472462654114,
        "right_subspace_overlap_bottom_k": -0.003911852370947599,
        "interaction_matrix_overlap_top_k": 0.21029222011566162,
        "interaction_matrix_overlap_bottom_k": -0.028179533779621124,
        "effective_rank": 0.19199302792549133,
        "effective_rank_mergeability_score": 0.09540669620037079,
        "stable_rank": 0.7631844878196716,
        "spectral_gap": 0.30247727036476135,
        "singular_value_ratio": 0.37575870752334595,
        "layerwise_effective_rank": -0.17946085333824158,
        "layerwise_effective_rank_mergeability_score": 0.48552635312080383,
        "task_vector_cosine_similarity": -0.5758309960365295,
        "task_vector_l2_distance": -0.051148414611816406,
        "task_vector_dot_product": 0.35741519927978516,
        "weight_space_angle": 0.24600638449192047,
        "task_vector_magnitude_ratio": -0.4099389314651489,
        "singular_value_overlap": -0.0181930810213089,
        "subspace_overlap": 0.21531282365322113,
        "right_subspace_overlap": -0.5059317350387573,
        "activation_l2_distance": -0.10997681319713593,
        "activation_cosine_similarity": 0.20472963154315948,
        "activation_magnitude_ratio": -0.02669086493551731,
        "activation_dot_product": -0.2553488314151764,
        "encoder_gradient_cosine_similarity": 0.020084606483578682,
        "encoder_gradient_l2_distance": -0.32940179109573364,
        "encoder_gradient_dot_product": 0.12995518743991852,
        "input_gradient_cosine_similarity": -0.16170059144496918,
        "input_gradient_l2_distance": -0.07728023827075958,
        "input_gradient_dot_product": -0.19977699220180511
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.03121371046677691,
      "train_r2": -1.2228208790714565,
      "train_pearson_r": -0.05760864064165855,
      "val_mse": 0.04158052221190128,
      "val_r2": -4.1535188654614315,
      "val_pearson_r": 0.173490732025642,
      "n_iterations": 88,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.15460322797298431,
        "right_subspace_overlap_bottom_k": 0.007142743095755577,
        "interaction_matrix_overlap_top_k": 0.039927657693624496,
        "interaction_matrix_overlap_bottom_k": -0.2313234508037567,
        "effective_rank": 0.12071073055267334,
        "effective_rank_mergeability_score": -0.04400436207652092,
        "stable_rank": 0.09495391696691513,
        "spectral_gap": 0.028473805636167526,
        "singular_value_ratio": -0.10256113111972809,
        "layerwise_effective_rank": 0.1394275575876236,
        "layerwise_effective_rank_mergeability_score": 0.07845255732536316,
        "task_vector_cosine_similarity": -0.20609503984451294,
        "task_vector_l2_distance": 0.17534027993679047,
        "task_vector_dot_product": 0.03782368078827858,
        "weight_space_angle": 0.20041611790657043,
        "task_vector_magnitude_ratio": -0.14791828393936157,
        "singular_value_overlap": 0.19844083487987518,
        "subspace_overlap": 0.06150832027196884,
        "right_subspace_overlap": -0.11138883978128433,
        "activation_l2_distance": 0.10734984278678894,
        "activation_cosine_similarity": 0.3112514615058899,
        "activation_magnitude_ratio": 0.08714526891708374,
        "activation_dot_product": -0.1637451946735382,
        "encoder_gradient_cosine_similarity": -0.03355364501476288,
        "encoder_gradient_l2_distance": -0.09475056082010269,
        "encoder_gradient_dot_product": 0.2748792767524719,
        "input_gradient_cosine_similarity": 0.030419638380408287,
        "input_gradient_l2_distance": -0.07338276505470276,
        "input_gradient_dot_product": 0.05625540018081665
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.0174633709367742,
      "train_r2": -0.2729599287217308,
      "train_pearson_r": 0.2646041667033699,
      "val_mse": 0.010513649706170265,
      "val_r2": -0.29687930598217815,
      "val_pearson_r": 0.0659451947085101,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.1346723884344101,
        "right_subspace_overlap_bottom_k": 0.1090913787484169,
        "interaction_matrix_overlap_top_k": -0.252265065908432,
        "interaction_matrix_overlap_bottom_k": -0.020532628521323204,
        "effective_rank": 0.07171681523323059,
        "effective_rank_mergeability_score": -0.09120988845825195,
        "stable_rank": 0.11651550233364105,
        "spectral_gap": 0.42119115591049194,
        "singular_value_ratio": -0.26584163308143616,
        "layerwise_effective_rank": 0.09656523168087006,
        "layerwise_effective_rank_mergeability_score": 0.19862698018550873,
        "task_vector_cosine_similarity": -0.028705598786473274,
        "task_vector_l2_distance": 0.005623443517833948,
        "task_vector_dot_product": -0.26417437195777893,
        "weight_space_angle": 0.028597472235560417,
        "task_vector_magnitude_ratio": 0.5168934464454651,
        "singular_value_overlap": -0.023368775844573975,
        "subspace_overlap": -0.02177434228360653,
        "right_subspace_overlap": 0.11406834423542023,
        "activation_l2_distance": 0.33872368931770325,
        "activation_cosine_similarity": 0.4838255047798157,
        "activation_magnitude_ratio": 0.004292149096727371,
        "activation_dot_product": -0.1812146157026291,
        "encoder_gradient_cosine_similarity": 0.022702300921082497,
        "encoder_gradient_l2_distance": -0.21376827359199524,
        "encoder_gradient_dot_product": 0.0880030021071434,
        "input_gradient_cosine_similarity": -0.12476466596126556,
        "input_gradient_l2_distance": -0.13633781671524048,
        "input_gradient_dot_product": -0.12677478790283203
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 4.5222265512025555,
      "train_r2": -313.4317335818656,
      "train_pearson_r": 0.03420793839144419,
      "val_mse": 2.7497627040858363,
      "val_r2": -384.64493594542563,
      "val_pearson_r": 0.068903676741998,
      "n_iterations": 71,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.1167153120040894,
        "right_subspace_overlap_bottom_k": -3.4645447731018066,
        "interaction_matrix_overlap_top_k": 0.6166225671768188,
        "interaction_matrix_overlap_bottom_k": -0.03298034891486168,
        "effective_rank": -1.92387056350708,
        "effective_rank_mergeability_score": -0.9445991516113281,
        "stable_rank": -1.258697748184204,
        "spectral_gap": 1.8363059759140015,
        "singular_value_ratio": -1.3876265287399292,
        "layerwise_effective_rank": 1.3420864343643188,
        "layerwise_effective_rank_mergeability_score": -1.7565510272979736,
        "task_vector_cosine_similarity": -0.37087419629096985,
        "task_vector_l2_distance": -0.40089482069015503,
        "task_vector_dot_product": 2.0431625843048096,
        "weight_space_angle": 0.31637799739837646,
        "task_vector_magnitude_ratio": 2.116156816482544,
        "singular_value_overlap": 1.8940269947052002,
        "subspace_overlap": -1.2902984619140625,
        "right_subspace_overlap": 1.3568426370620728,
        "activation_l2_distance": 0.30084148049354553,
        "activation_cosine_similarity": -1.1440469026565552,
        "activation_magnitude_ratio": 1.2083725929260254,
        "activation_dot_product": 0.15406541526317596,
        "encoder_gradient_cosine_similarity": 0.8183530569076538,
        "encoder_gradient_l2_distance": -1.527817726135254,
        "encoder_gradient_dot_product": 0.7079795598983765,
        "input_gradient_cosine_similarity": 2.059434175491333,
        "input_gradient_l2_distance": -2.5712339878082275,
        "input_gradient_dot_product": 1.1805471181869507
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.018720093649809897,
      "train_r2": -0.3752118280005887,
      "train_pearson_r": 0.2323750168169028,
      "val_mse": 0.011611218029369843,
      "val_r2": -0.5187591532421765,
      "val_pearson_r": 0.30364056797049815,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5654332041740417,
        "right_subspace_overlap_bottom_k": -0.1163962334394455,
        "interaction_matrix_overlap_top_k": -0.14730985462665558,
        "interaction_matrix_overlap_bottom_k": 0.1384912133216858,
        "effective_rank": 0.22015798091888428,
        "effective_rank_mergeability_score": 0.08371734619140625,
        "stable_rank": 0.21987231075763702,
        "spectral_gap": 0.30916550755500793,
        "singular_value_ratio": -0.10473345965147018,
        "layerwise_effective_rank": 0.16965800523757935,
        "layerwise_effective_rank_mergeability_score": 0.31887540221214294,
        "task_vector_cosine_similarity": 0.13927657902240753,
        "task_vector_l2_distance": 0.06328056752681732,
        "task_vector_dot_product": -0.2795405685901642,
        "weight_space_angle": 0.17517401278018951,
        "task_vector_magnitude_ratio": 0.21433496475219727,
        "singular_value_overlap": -0.01681407541036606,
        "subspace_overlap": -0.1382717788219452,
        "right_subspace_overlap": -0.2927826941013336,
        "activation_l2_distance": -0.004481689538806677,
        "activation_cosine_similarity": 0.19722002744674683,
        "activation_magnitude_ratio": -0.008791325613856316,
        "activation_dot_product": -0.16482175886631012,
        "encoder_gradient_cosine_similarity": 0.022260844707489014,
        "encoder_gradient_l2_distance": -0.24199692904949188,
        "encoder_gradient_dot_product": 0.08983836323022842,
        "input_gradient_cosine_similarity": -0.1563229113817215,
        "input_gradient_l2_distance": -0.1390535980463028,
        "input_gradient_dot_product": -0.11516446620225906
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_mse": 4020.9066875446288,
      "train_r2": -289016.23395019106,
      "train_pearson_r": 0.019461331355954372,
      "val_mse": 4494.122129493438,
      "val_r2": -615857.117881244,
      "val_pearson_r": 0.17487932024029185,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.6118670701980591,
        "right_subspace_overlap_bottom_k": -9.542757987976074,
        "interaction_matrix_overlap_top_k": 5.160565376281738,
        "interaction_matrix_overlap_bottom_k": 7.43651819229126,
        "effective_rank": -31.63255500793457,
        "effective_rank_mergeability_score": 3.453791856765747,
        "stable_rank": -4.904798984527588,
        "spectral_gap": 24.491239547729492,
        "singular_value_ratio": 17.654401779174805,
        "layerwise_effective_rank": 17.627653121948242,
        "layerwise_effective_rank_mergeability_score": 50.496578216552734,
        "task_vector_cosine_similarity": -17.643896102905273,
        "task_vector_l2_distance": -13.577522277832031,
        "task_vector_dot_product": 14.393957138061523,
        "weight_space_angle": -16.7708740234375,
        "task_vector_magnitude_ratio": -0.06452257186174393,
        "singular_value_overlap": -9.896339416503906,
        "subspace_overlap": -18.524438858032227,
        "right_subspace_overlap": -14.225059509277344,
        "activation_l2_distance": -7.954945087432861,
        "activation_cosine_similarity": 2.434908628463745,
        "activation_magnitude_ratio": 0.9264131188392639,
        "activation_dot_product": 7.800567150115967,
        "encoder_gradient_cosine_similarity": -8.885515213012695,
        "encoder_gradient_l2_distance": 20.814794540405273,
        "encoder_gradient_dot_product": -11.83228874206543,
        "input_gradient_cosine_similarity": -5.360095977783203,
        "input_gradient_l2_distance": 14.93886947631836,
        "input_gradient_dot_product": -15.241864204406738
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.02471407815340622,
      "train_r2": -0.7336050287777043,
      "train_pearson_r": 0.21636691737231423,
      "val_mse": 0.014389097418093027,
      "val_r2": -0.8524382261943566,
      "val_pearson_r": 0.18292652362773013,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.30641865730285645,
        "right_subspace_overlap_bottom_k": -0.10111521929502487,
        "interaction_matrix_overlap_top_k": 0.1300947666168213,
        "interaction_matrix_overlap_bottom_k": 0.0635281354188919,
        "effective_rank": 0.42717236280441284,
        "effective_rank_mergeability_score": -0.19988735020160675,
        "stable_rank": 0.22691205143928528,
        "spectral_gap": 0.4725838899612427,
        "singular_value_ratio": 0.12132862955331802,
        "layerwise_effective_rank": -0.1615477055311203,
        "layerwise_effective_rank_mergeability_score": 0.5550568103790283,
        "task_vector_cosine_similarity": 0.0552908331155777,
        "task_vector_l2_distance": -0.09239697456359863,
        "task_vector_dot_product": 0.6199172735214233,
        "weight_space_angle": 1.290113925933838,
        "task_vector_magnitude_ratio": 0.1004074364900589,
        "singular_value_overlap": -0.004865450784564018,
        "subspace_overlap": -0.0654321163892746,
        "right_subspace_overlap": -0.2641024887561798,
        "activation_l2_distance": -1.0971685647964478,
        "activation_cosine_similarity": -0.8715413212776184,
        "activation_magnitude_ratio": -0.06257279962301254,
        "activation_dot_product": 0.08808605372905731,
        "encoder_gradient_cosine_similarity": 0.04496210813522339,
        "encoder_gradient_l2_distance": -0.29237955808639526,
        "encoder_gradient_dot_product": 0.13424378633499146,
        "input_gradient_cosine_similarity": -0.1885412037372589,
        "input_gradient_l2_distance": -0.0642007514834404,
        "input_gradient_dot_product": -0.1695239096879959
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.13295347021656248,
      "train_r2": -8.578980533957623,
      "train_pearson_r": 0.08248939939052713,
      "val_mse": 0.2496618714417287,
      "val_r2": -26.101062436098022,
      "val_pearson_r": -0.027126628676181076,
      "n_iterations": 62,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007649797480553389,
        "right_subspace_overlap_bottom_k": -0.015060123056173325,
        "interaction_matrix_overlap_top_k": 0.6745287775993347,
        "interaction_matrix_overlap_bottom_k": 0.056865494698286057,
        "effective_rank": 0.4438819885253906,
        "effective_rank_mergeability_score": -0.012405982241034508,
        "stable_rank": -0.45166805386543274,
        "spectral_gap": 0.2886503338813782,
        "singular_value_ratio": -0.18400925397872925,
        "layerwise_effective_rank": 0.4166649281978607,
        "layerwise_effective_rank_mergeability_score": -0.14303714036941528,
        "task_vector_cosine_similarity": -0.5649294853210449,
        "task_vector_l2_distance": 0.110977403819561,
        "task_vector_dot_product": 0.36880454421043396,
        "weight_space_angle": -0.06492877751588821,
        "task_vector_magnitude_ratio": -0.16148369014263153,
        "singular_value_overlap": 0.35136082768440247,
        "subspace_overlap": 0.07513581961393356,
        "right_subspace_overlap": -0.4374106824398041,
        "activation_l2_distance": 0.17816323041915894,
        "activation_cosine_similarity": 0.442600280046463,
        "activation_magnitude_ratio": 0.041053272783756256,
        "activation_dot_product": 0.21676774322986603,
        "encoder_gradient_cosine_similarity": 0.13722525537014008,
        "encoder_gradient_l2_distance": 0.1315709948539734,
        "encoder_gradient_dot_product": 0.248941108584404,
        "input_gradient_cosine_similarity": -0.6000494956970215,
        "input_gradient_l2_distance": -0.20111620426177979,
        "input_gradient_dot_product": -0.3628319799900055
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.08521092452206942,
      "train_r2": -14.567760458289616,
      "train_pearson_r": 0.12596295622833129,
      "val_mse": 0.25694975656363656,
      "val_r2": -98.53307584079761,
      "val_pearson_r": -0.07720969050116017,
      "n_iterations": 59,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.34099695086479187,
        "right_subspace_overlap_bottom_k": 0.08095736056566238,
        "interaction_matrix_overlap_top_k": 0.04169771447777748,
        "interaction_matrix_overlap_bottom_k": 0.10584711283445358,
        "effective_rank": 0.08844999969005585,
        "effective_rank_mergeability_score": -0.9095003604888916,
        "stable_rank": 0.10266386717557907,
        "spectral_gap": 0.26748964190483093,
        "singular_value_ratio": -0.15510404109954834,
        "layerwise_effective_rank": 0.09228667616844177,
        "layerwise_effective_rank_mergeability_score": 0.3784360885620117,
        "task_vector_cosine_similarity": 0.0011536860838532448,
        "task_vector_l2_distance": 0.08357290178537369,
        "task_vector_dot_product": 0.09140007197856903,
        "weight_space_angle": 0.28769850730895996,
        "task_vector_magnitude_ratio": -0.437042236328125,
        "singular_value_overlap": 0.38371920585632324,
        "subspace_overlap": -0.1383332908153534,
        "right_subspace_overlap": 0.1934049427509308,
        "activation_l2_distance": 0.26540184020996094,
        "activation_cosine_similarity": 0.2857900857925415,
        "activation_magnitude_ratio": -0.22965911030769348,
        "activation_dot_product": 0.19003993272781372,
        "encoder_gradient_cosine_similarity": -0.27438148856163025,
        "encoder_gradient_l2_distance": -0.3008715510368347,
        "encoder_gradient_dot_product": 0.41537711024284363,
        "input_gradient_cosine_similarity": 0.2150467336177826,
        "input_gradient_l2_distance": -0.07454285770654678,
        "input_gradient_dot_product": 0.28864869475364685
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.11026777032683543,
      "train_r2": -6.900536548808766,
      "train_pearson_r": -0.17840858245878205,
      "val_mse": 0.06336117846971595,
      "val_r2": -6.650416829560535,
      "val_pearson_r": -0.19965404960668123,
      "n_iterations": 95,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.22930796444416046,
        "right_subspace_overlap_bottom_k": -0.10462449491024017,
        "interaction_matrix_overlap_top_k": 0.4836118817329407,
        "interaction_matrix_overlap_bottom_k": -0.1447957158088684,
        "effective_rank": 0.0963669940829277,
        "effective_rank_mergeability_score": -0.09005729854106903,
        "stable_rank": -0.7687874436378479,
        "spectral_gap": -0.3251200318336487,
        "singular_value_ratio": 0.20165495574474335,
        "layerwise_effective_rank": 0.1460687667131424,
        "layerwise_effective_rank_mergeability_score": 0.5343624949455261,
        "task_vector_cosine_similarity": -0.4784340560436249,
        "task_vector_l2_distance": 0.16285981237888336,
        "task_vector_dot_product": 0.055038921535015106,
        "weight_space_angle": 0.015324750915169716,
        "task_vector_magnitude_ratio": 0.3995676040649414,
        "singular_value_overlap": 0.3622218668460846,
        "subspace_overlap": -0.2828082740306854,
        "right_subspace_overlap": -0.24369873106479645,
        "activation_l2_distance": -0.009047038853168488,
        "activation_cosine_similarity": 0.21375831961631775,
        "activation_magnitude_ratio": 0.30831584334373474,
        "activation_dot_product": 0.05034558102488518,
        "encoder_gradient_cosine_similarity": 0.1769859790802002,
        "encoder_gradient_l2_distance": -0.30788496136665344,
        "encoder_gradient_dot_product": 0.33368295431137085,
        "input_gradient_cosine_similarity": -0.10540717840194702,
        "input_gradient_l2_distance": 0.1215275451540947,
        "input_gradient_dot_product": 0.4210260510444641
      }
    }
  ],
  "optimization_params": {
    "objective": "MSE",
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 1e-06
  }
}