{
  "aggregate_metrics": {
    "train_r": 0.16745305142733635,
    "train_p": 1.0791130678971927e-21,
    "val_r": 0.03647584855723399,
    "val_p": 0.4914711841320714
  },
  "per_fold_stats": {
    "train_r_mean": 0.513228962810178,
    "train_r_std": 0.098987496299683,
    "val_r_mean": 0.34301506465074305,
    "val_r_std": 0.25026134220250595
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 13.296053886413574,
    "right_subspace_overlap_bottom_k": 0.3819707930088043,
    "interaction_matrix_overlap_top_k": 11.524757385253906,
    "interaction_matrix_overlap_bottom_k": 10.952803611755371,
    "effective_rank": -4.897871017456055,
    "effective_rank_mergeability_score": 7.494375705718994,
    "stable_rank": -6.738584995269775,
    "spectral_gap": 1.649207353591919,
    "singular_value_ratio": -5.166529178619385,
    "layerwise_effective_rank": 5.575184345245361,
    "layerwise_effective_rank_mergeability_score": -7.721571922302246,
    "task_vector_cosine_similarity": 7.331564903259277,
    "task_vector_l2_distance": -15.874887466430664,
    "task_vector_dot_product": 11.606367111206055,
    "weight_space_angle": 5.395224094390869,
    "task_vector_magnitude_ratio": -2.448523998260498,
    "singular_value_overlap": -24.71865463256836,
    "subspace_overlap": 15.3593168258667,
    "activation_l2_distance": -12.398675918579102,
    "activation_cosine_similarity": 0.7132774591445923,
    "activation_magnitude_ratio": -10.82280158996582,
    "activation_dot_product": 17.93488121032715,
    "encoder_gradient_cosine_similarity": 11.417364120483398,
    "encoder_gradient_l2_distance": -20.842166900634766,
    "encoder_gradient_dot_product": 11.989802360534668,
    "input_gradient_cosine_similarity": 13.858589172363281,
    "input_gradient_l2_distance": -23.00103759765625,
    "input_gradient_dot_product": -20.89816665649414
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 27.658754348754883,
    "right_subspace_overlap_bottom_k": 19.054357528686523,
    "interaction_matrix_overlap_top_k": 19.10521125793457,
    "interaction_matrix_overlap_bottom_k": 25.61505126953125,
    "effective_rank": 21.274715423583984,
    "effective_rank_mergeability_score": 31.627084732055664,
    "stable_rank": 23.9805965423584,
    "spectral_gap": 23.217695236206055,
    "singular_value_ratio": 16.135746002197266,
    "layerwise_effective_rank": 11.349695205688477,
    "layerwise_effective_rank_mergeability_score": 17.889965057373047,
    "task_vector_cosine_similarity": 13.524582862854004,
    "task_vector_l2_distance": 28.308582305908203,
    "task_vector_dot_product": 18.536222457885742,
    "weight_space_angle": 22.338916778564453,
    "task_vector_magnitude_ratio": 20.986133575439453,
    "singular_value_overlap": 30.350122451782227,
    "subspace_overlap": 24.808218002319336,
    "activation_l2_distance": 15.513692855834961,
    "activation_cosine_similarity": 14.383776664733887,
    "activation_magnitude_ratio": 12.312728881835938,
    "activation_dot_product": 32.80759811401367,
    "encoder_gradient_cosine_similarity": 17.378984451293945,
    "encoder_gradient_l2_distance": 24.068511962890625,
    "encoder_gradient_dot_product": 19.975566864013672,
    "input_gradient_cosine_similarity": 27.170021057128906,
    "input_gradient_l2_distance": 27.049890518188477,
    "input_gradient_dot_product": 26.54823112487793
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5690103359665781,
      "val_r": 0.6077772834676073,
      "n_iterations": 653,
      "coefficients": {
        "right_subspace_overlap_top_k": 51.03010940551758,
        "right_subspace_overlap_bottom_k": 2.578686475753784,
        "interaction_matrix_overlap_top_k": 13.202207565307617,
        "interaction_matrix_overlap_bottom_k": 16.167341232299805,
        "effective_rank": -0.9634279012680054,
        "effective_rank_mergeability_score": 27.27933120727539,
        "stable_rank": 8.339449882507324,
        "spectral_gap": 31.21343231201172,
        "singular_value_ratio": -1.542934775352478,
        "layerwise_effective_rank": 40.925392150878906,
        "layerwise_effective_rank_mergeability_score": -9.351269721984863,
        "task_vector_cosine_similarity": -3.285290479660034,
        "task_vector_l2_distance": -40.72236633300781,
        "task_vector_dot_product": 18.136962890625,
        "weight_space_angle": 31.2823543548584,
        "task_vector_magnitude_ratio": -8.35678482055664,
        "singular_value_overlap": -56.42145919799805,
        "subspace_overlap": 13.019948959350586,
        "activation_l2_distance": -36.82781219482422,
        "activation_cosine_similarity": -3.5596389770507812,
        "activation_magnitude_ratio": -26.031923294067383,
        "activation_dot_product": -7.7995781898498535,
        "encoder_gradient_cosine_similarity": 22.59792137145996,
        "encoder_gradient_l2_distance": -27.905906677246094,
        "encoder_gradient_dot_product": 23.97896957397461,
        "input_gradient_cosine_similarity": 19.23334312438965,
        "input_gradient_l2_distance": -41.470252990722656,
        "input_gradient_dot_product": -72.76932525634766
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.60326950075928,
      "val_r": 0.5353254166425191,
      "n_iterations": 434,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.27467986941337585,
        "right_subspace_overlap_bottom_k": -0.06921114772558212,
        "interaction_matrix_overlap_top_k": 0.16189953684806824,
        "interaction_matrix_overlap_bottom_k": 1.0983797311782837,
        "effective_rank": 0.5754945278167725,
        "effective_rank_mergeability_score": 1.1482141017913818,
        "stable_rank": 0.06657201796770096,
        "spectral_gap": 0.14443811774253845,
        "singular_value_ratio": 0.2675056457519531,
        "layerwise_effective_rank": -0.07400647550821304,
        "layerwise_effective_rank_mergeability_score": -0.5421178936958313,
        "task_vector_cosine_similarity": 0.8387504816055298,
        "task_vector_l2_distance": -0.9363387823104858,
        "task_vector_dot_product": -0.4302295744419098,
        "weight_space_angle": 0.519457221031189,
        "task_vector_magnitude_ratio": -0.4049391448497772,
        "singular_value_overlap": -0.6477499604225159,
        "subspace_overlap": 0.21326465904712677,
        "activation_l2_distance": 0.546093225479126,
        "activation_cosine_similarity": 0.6427323222160339,
        "activation_magnitude_ratio": -0.19323870539665222,
        "activation_dot_product": 0.054031144827604294,
        "encoder_gradient_cosine_similarity": 0.06654704362154007,
        "encoder_gradient_l2_distance": -1.164494276046753,
        "encoder_gradient_dot_product": 0.24234534800052643,
        "input_gradient_cosine_similarity": 0.14701974391937256,
        "input_gradient_l2_distance": -1.190631628036499,
        "input_gradient_dot_product": -0.2815804183483124
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5123585842021424,
      "val_r": 0.35743426636208053,
      "n_iterations": 566,
      "coefficients": {
        "right_subspace_overlap_top_k": -21.455482482910156,
        "right_subspace_overlap_bottom_k": 10.591191291809082,
        "interaction_matrix_overlap_top_k": 0.26116567850112915,
        "interaction_matrix_overlap_bottom_k": -2.3124351501464844,
        "effective_rank": -8.71925163269043,
        "effective_rank_mergeability_score": 6.982450485229492,
        "stable_rank": 1.5752309560775757,
        "spectral_gap": 27.355510711669922,
        "singular_value_ratio": -16.287118911743164,
        "layerwise_effective_rank": -16.987552642822266,
        "layerwise_effective_rank_mergeability_score": -7.5095696449279785,
        "task_vector_cosine_similarity": -3.6971678733825684,
        "task_vector_l2_distance": -20.569353103637695,
        "task_vector_dot_product": 29.392770767211914,
        "weight_space_angle": 30.430124282836914,
        "task_vector_magnitude_ratio": 41.09474563598633,
        "singular_value_overlap": -40.71236038208008,
        "subspace_overlap": 46.85479736328125,
        "activation_l2_distance": -42.90866470336914,
        "activation_cosine_similarity": -11.62248420715332,
        "activation_magnitude_ratio": -12.838310241699219,
        "activation_dot_product": 17.87136459350586,
        "encoder_gradient_cosine_similarity": 11.628484725952148,
        "encoder_gradient_l2_distance": -38.93916702270508,
        "encoder_gradient_dot_product": 24.223363876342773,
        "input_gradient_cosine_similarity": 14.856185913085938,
        "input_gradient_l2_distance": -29.743854522705078,
        "input_gradient_dot_product": -48.714813232421875
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5204341472096797,
      "val_r": 0.2741956183169245,
      "n_iterations": 58,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.2750799655914307,
        "right_subspace_overlap_bottom_k": 0.8258106112480164,
        "interaction_matrix_overlap_top_k": -0.021013030782341957,
        "interaction_matrix_overlap_bottom_k": -0.47876712679862976,
        "effective_rank": 0.825473964214325,
        "effective_rank_mergeability_score": 1.0576292276382446,
        "stable_rank": -0.09351302683353424,
        "spectral_gap": 0.5342305302619934,
        "singular_value_ratio": 1.6862962245941162,
        "layerwise_effective_rank": -1.1076271533966064,
        "layerwise_effective_rank_mergeability_score": -0.23789112269878387,
        "task_vector_cosine_similarity": 0.011572815477848053,
        "task_vector_l2_distance": -1.5742182731628418,
        "task_vector_dot_product": 0.12261909991502762,
        "weight_space_angle": -1.8482050895690918,
        "task_vector_magnitude_ratio": -1.4650416374206543,
        "singular_value_overlap": -1.8035717010498047,
        "subspace_overlap": 1.7033979892730713,
        "activation_l2_distance": 1.0453368425369263,
        "activation_cosine_similarity": 1.489193320274353,
        "activation_magnitude_ratio": -0.6239452362060547,
        "activation_dot_product": 0.5725274085998535,
        "encoder_gradient_cosine_similarity": 1.0345369577407837,
        "encoder_gradient_l2_distance": -2.381279706954956,
        "encoder_gradient_dot_product": 1.0077006816864014,
        "input_gradient_cosine_similarity": 1.2182689905166626,
        "input_gradient_l2_distance": -1.8113454580307007,
        "input_gradient_dot_product": -1.3621151447296143
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.526889305716344,
      "val_r": 0.46267536522287106,
      "n_iterations": 598,
      "coefficients": {
        "right_subspace_overlap_top_k": 28.694650650024414,
        "right_subspace_overlap_bottom_k": 40.89944839477539,
        "interaction_matrix_overlap_top_k": 26.15945816040039,
        "interaction_matrix_overlap_bottom_k": -0.3178020417690277,
        "effective_rank": 0.671822190284729,
        "effective_rank_mergeability_score": -0.11947738379240036,
        "stable_rank": -2.9442570209503174,
        "spectral_gap": 25.387134552001953,
        "singular_value_ratio": -2.8274190425872803,
        "layerwise_effective_rank": 14.356609344482422,
        "layerwise_effective_rank_mergeability_score": -10.754535675048828,
        "task_vector_cosine_similarity": -2.1870551109313965,
        "task_vector_l2_distance": -64.702880859375,
        "task_vector_dot_product": -3.452604055404663,
        "weight_space_angle": -6.898242950439453,
        "task_vector_magnitude_ratio": -13.30142593383789,
        "singular_value_overlap": -44.584896087646484,
        "subspace_overlap": 35.64731216430664,
        "activation_l2_distance": -5.457095146179199,
        "activation_cosine_similarity": -19.19826316833496,
        "activation_magnitude_ratio": -20.22203826904297,
        "activation_dot_product": 49.70189666748047,
        "encoder_gradient_cosine_similarity": 18.62147331237793,
        "encoder_gradient_l2_distance": -45.244659423828125,
        "encoder_gradient_dot_product": 41.11552810668945,
        "input_gradient_cosine_similarity": 29.727571487426758,
        "input_gradient_l2_distance": -31.477066040039062,
        "input_gradient_dot_product": -56.17942428588867
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.4095843535063962,
      "val_r": 0.6404406959306077,
      "n_iterations": 287,
      "coefficients": {
        "right_subspace_overlap_top_k": 38.251243591308594,
        "right_subspace_overlap_bottom_k": 3.333575487136841,
        "interaction_matrix_overlap_top_k": 11.25088882446289,
        "interaction_matrix_overlap_bottom_k": 13.00234317779541,
        "effective_rank": 0.5836756229400635,
        "effective_rank_mergeability_score": 12.465267181396484,
        "stable_rank": -26.055397033691406,
        "spectral_gap": -40.27873992919922,
        "singular_value_ratio": -27.866172790527344,
        "layerwise_effective_rank": 18.79156494140625,
        "layerwise_effective_rank_mergeability_score": 18.916034698486328,
        "task_vector_cosine_similarity": 12.798273086547852,
        "task_vector_l2_distance": -15.67981243133545,
        "task_vector_dot_product": 40.39371871948242,
        "weight_space_angle": -26.60549545288086,
        "task_vector_magnitude_ratio": -3.5626726150512695,
        "singular_value_overlap": -24.968017578125,
        "subspace_overlap": -13.564486503601074,
        "activation_l2_distance": -23.695743560791016,
        "activation_cosine_similarity": 16.876474380493164,
        "activation_magnitude_ratio": -27.254858016967773,
        "activation_dot_product": 10.619412422180176,
        "encoder_gradient_cosine_similarity": 33.535789489746094,
        "encoder_gradient_l2_distance": -31.22893524169922,
        "encoder_gradient_dot_product": 27.53123664855957,
        "input_gradient_cosine_similarity": 21.071924209594727,
        "input_gradient_l2_distance": 2.379992723464966,
        "input_gradient_dot_product": -39.45030975341797
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.44605056383421055,
      "val_r": 0.21370854769137984,
      "n_iterations": 54,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.3053792715072632,
        "right_subspace_overlap_bottom_k": -0.5538750290870667,
        "interaction_matrix_overlap_top_k": 1.258569598197937,
        "interaction_matrix_overlap_bottom_k": 0.34728220105171204,
        "effective_rank": 0.5036842823028564,
        "effective_rank_mergeability_score": 0.4209989309310913,
        "stable_rank": -1.4275684356689453,
        "spectral_gap": -0.11005834490060806,
        "singular_value_ratio": -0.28495585918426514,
        "layerwise_effective_rank": 0.7133463025093079,
        "layerwise_effective_rank_mergeability_score": -0.6549616456031799,
        "task_vector_cosine_similarity": -0.07567419856786728,
        "task_vector_l2_distance": -0.1146177276968956,
        "task_vector_dot_product": -1.1733803749084473,
        "weight_space_angle": 0.6533597111701965,
        "task_vector_magnitude_ratio": -0.18681477010250092,
        "singular_value_overlap": -1.5245444774627686,
        "subspace_overlap": 1.6490048170089722,
        "activation_l2_distance": -0.3470243513584137,
        "activation_cosine_similarity": 0.9415438771247864,
        "activation_magnitude_ratio": 0.20363204181194305,
        "activation_dot_product": 0.3492506146430969,
        "encoder_gradient_cosine_similarity": 0.8812928795814514,
        "encoder_gradient_l2_distance": -1.1622134447097778,
        "encoder_gradient_dot_product": 0.8731623888015747,
        "input_gradient_cosine_similarity": 0.04979425296187401,
        "input_gradient_l2_distance": -0.4832877218723297,
        "input_gradient_dot_product": -1.089110255241394
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4113800762503088,
      "val_r": -0.01798747575859143,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.4942426085472107,
        "right_subspace_overlap_bottom_k": 0.10880579054355621,
        "interaction_matrix_overlap_top_k": 0.9209040999412537,
        "interaction_matrix_overlap_bottom_k": 0.8614187836647034,
        "effective_rank": -0.2599610984325409,
        "effective_rank_mergeability_score": -0.41791579127311707,
        "stable_rank": 0.24326947331428528,
        "spectral_gap": 0.13088500499725342,
        "singular_value_ratio": -0.810853898525238,
        "layerwise_effective_rank": -0.10791292786598206,
        "layerwise_effective_rank_mergeability_score": -0.16047795116901398,
        "task_vector_cosine_similarity": 1.1115113496780396,
        "task_vector_l2_distance": -0.983818531036377,
        "task_vector_dot_product": -0.008175872266292572,
        "weight_space_angle": -1.2017241716384888,
        "task_vector_magnitude_ratio": -0.4506934583187103,
        "singular_value_overlap": -0.14496351778507233,
        "subspace_overlap": 1.5556724071502686,
        "activation_l2_distance": -0.7817996740341187,
        "activation_cosine_similarity": 0.027391131967306137,
        "activation_magnitude_ratio": -0.4790499210357666,
        "activation_dot_product": 0.8611674308776855,
        "encoder_gradient_cosine_similarity": 1.0501689910888672,
        "encoder_gradient_l2_distance": -1.0980055332183838,
        "encoder_gradient_dot_product": 1.0210132598876953,
        "input_gradient_cosine_similarity": 0.27588537335395813,
        "input_gradient_l2_distance": -0.959780752658844,
        "input_gradient_dot_product": 0.30535683035850525
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.4344566628211467,
      "val_r": -0.2124867727816542,
      "n_iterations": 64,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.320817232131958,
        "right_subspace_overlap_bottom_k": 0.6558763384819031,
        "interaction_matrix_overlap_top_k": 0.9163430333137512,
        "interaction_matrix_overlap_bottom_k": -0.15351784229278564,
        "effective_rank": -0.07150984555482864,
        "effective_rank_mergeability_score": 0.15136146545410156,
        "stable_rank": -1.0678653717041016,
        "spectral_gap": -1.1334558725357056,
        "singular_value_ratio": -0.7116017937660217,
        "layerwise_effective_rank": -1.2412219047546387,
        "layerwise_effective_rank_mergeability_score": 1.1619259119033813,
        "task_vector_cosine_similarity": 1.6136198043823242,
        "task_vector_l2_distance": -1.5574026107788086,
        "task_vector_dot_product": 1.3161256313323975,
        "weight_space_angle": -1.2961779832839966,
        "task_vector_magnitude_ratio": 0.027231276035308838,
        "singular_value_overlap": -0.579566240310669,
        "subspace_overlap": 1.153377652168274,
        "activation_l2_distance": -0.2225896269083023,
        "activation_cosine_similarity": 1.5695383548736572,
        "activation_magnitude_ratio": -1.1840916872024536,
        "activation_dot_product": 1.4933464527130127,
        "encoder_gradient_cosine_similarity": 2.040302276611328,
        "encoder_gradient_l2_distance": -0.7919341325759888,
        "encoder_gradient_dot_product": 1.373292326927185,
        "input_gradient_cosine_similarity": -0.04179272800683975,
        "input_gradient_l2_distance": -1.7906320095062256,
        "input_gradient_dot_product": -2.1344034671783447
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4758694891594627,
      "val_r": 0.032070729269804796,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.430480718612671,
        "right_subspace_overlap_bottom_k": 0.8247535824775696,
        "interaction_matrix_overlap_top_k": 0.48691317439079285,
        "interaction_matrix_overlap_bottom_k": 1.3451530933380127,
        "effective_rank": -1.4923444986343384,
        "effective_rank_mergeability_score": 3.6059722900390625,
        "stable_rank": -1.5480579137802124,
        "spectral_gap": -1.0925501585006714,
        "singular_value_ratio": 0.082816481590271,
        "layerwise_effective_rank": 3.0468218326568604,
        "layerwise_effective_rank_mergeability_score": -0.6634852886199951,
        "task_vector_cosine_similarity": 1.0222707986831665,
        "task_vector_l2_distance": -4.898500442504883,
        "task_vector_dot_product": 5.029423236846924,
        "weight_space_angle": 2.0002176761627197,
        "task_vector_magnitude_ratio": -1.613713026046753,
        "singular_value_overlap": -1.5355497598648071,
        "subspace_overlap": 1.7511708736419678,
        "activation_l2_distance": -3.1096887588500977,
        "activation_cosine_similarity": -5.1236252784729,
        "activation_magnitude_ratio": 2.440434217453003,
        "activation_dot_product": 3.9137585163116455,
        "encoder_gradient_cosine_similarity": 2.774693727493286,
        "encoder_gradient_l2_distance": -5.657060146331787,
        "encoder_gradient_dot_product": 0.496726930141449,
        "input_gradient_cosine_similarity": 1.4649903774261475,
        "input_gradient_l2_distance": -2.547091245651245,
        "input_gradient_dot_product": -3.217073440551758
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5402624314815903,
      "val_r": 0.24605584513661757,
      "n_iterations": 72,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.05097665637731552,
        "right_subspace_overlap_bottom_k": 0.5725411772727966,
        "interaction_matrix_overlap_top_k": 0.6881452798843384,
        "interaction_matrix_overlap_bottom_k": 1.189568042755127,
        "effective_rank": 0.24582678079605103,
        "effective_rank_mergeability_score": 1.089765191078186,
        "stable_rank": -0.1976088136434555,
        "spectral_gap": -0.06581579148769379,
        "singular_value_ratio": -1.8212767839431763,
        "layerwise_effective_rank": 1.3808252811431885,
        "layerwise_effective_rank_mergeability_score": 0.2179640382528305,
        "task_vector_cosine_similarity": -0.3450024724006653,
        "task_vector_l2_distance": -1.7333165407180786,
        "task_vector_dot_product": 0.2502911388874054,
        "weight_space_angle": 0.7759913802146912,
        "task_vector_magnitude_ratio": 0.665760338306427,
        "singular_value_overlap": -1.545485496520996,
        "subspace_overlap": 0.23768070340156555,
        "activation_l2_distance": -0.0733952447772026,
        "activation_cosine_similarity": 0.7671086192131042,
        "activation_magnitude_ratio": -0.26226022839546204,
        "activation_dot_product": 1.7385507822036743,
        "encoder_gradient_cosine_similarity": 0.2303048074245453,
        "encoder_gradient_l2_distance": -2.910008430480957,
        "encoder_gradient_dot_product": 0.1302841752767563,
        "input_gradient_cosine_similarity": 1.480812430381775,
        "input_gradient_l2_distance": -0.9520339965820312,
        "input_gradient_dot_product": -1.7786154747009277
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5455700852188665,
      "val_r": 0.4438227712627764,
      "n_iterations": 926,
      "coefficients": {
        "right_subspace_overlap_top_k": -12.291982650756836,
        "right_subspace_overlap_bottom_k": -8.000214576721191,
        "interaction_matrix_overlap_top_k": 20.519237518310547,
        "interaction_matrix_overlap_bottom_k": 42.28584671020508,
        "effective_rank": -0.9896414875984192,
        "effective_rank_mergeability_score": 118.54064178466797,
        "stable_rank": -16.440576553344727,
        "spectral_gap": -52.30946350097656,
        "singular_value_ratio": 25.25296974182129,
        "layerwise_effective_rank": 6.192306995391846,
        "layerwise_effective_rank_mergeability_score": -63.011680603027344,
        "task_vector_cosine_similarity": 17.411720275878906,
        "task_vector_l2_distance": -35.002784729003906,
        "task_vector_dot_product": 35.069026947021484,
        "weight_space_angle": 59.51445007324219,
        "task_vector_magnitude_ratio": -38.85870361328125,
        "singular_value_overlap": -40.87267303466797,
        "subspace_overlap": 41.35482406616211,
        "activation_l2_distance": 0.9236084222793579,
        "activation_cosine_similarity": 46.367645263671875,
        "activation_magnitude_ratio": -13.279208183288574,
        "activation_dot_product": 4.0466413497924805,
        "encoder_gradient_cosine_similarity": 15.301006317138672,
        "encoder_gradient_l2_distance": -83.60974884033203,
        "encoder_gradient_dot_product": -3.0440807342529297,
        "input_gradient_cosine_similarity": -0.1955074667930603,
        "input_gradient_l2_distance": -92.87298583984375,
        "input_gradient_dot_product": 7.16798734664917
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4364231566715455,
      "val_r": 0.46643927177431727,
      "n_iterations": 384,
      "coefficients": {
        "right_subspace_overlap_top_k": 29.426319122314453,
        "right_subspace_overlap_bottom_k": 16.142683029174805,
        "interaction_matrix_overlap_top_k": 65.93655395507812,
        "interaction_matrix_overlap_bottom_k": 15.692445755004883,
        "effective_rank": -5.945303440093994,
        "effective_rank_mergeability_score": -37.49040985107422,
        "stable_rank": -52.917320251464844,
        "spectral_gap": 55.89363098144531,
        "singular_value_ratio": 5.738622188568115,
        "layerwise_effective_rank": 17.083660125732422,
        "layerwise_effective_rank_mergeability_score": -1.9743391275405884,
        "task_vector_cosine_similarity": -2.8153505325317383,
        "task_vector_l2_distance": -1.831562876701355,
        "task_vector_dot_product": 21.97808265686035,
        "weight_space_angle": 34.40476989746094,
        "task_vector_magnitude_ratio": 37.56373977661133,
        "singular_value_overlap": -30.20838737487793,
        "subspace_overlap": 29.722742080688477,
        "activation_l2_distance": -33.217655181884766,
        "activation_cosine_similarity": 17.07735252380371,
        "activation_magnitude_ratio": -32.89870071411133,
        "activation_dot_product": -5.206292629241943,
        "encoder_gradient_cosine_similarity": 21.235652923583984,
        "encoder_gradient_l2_distance": -62.45842742919922,
        "encoder_gradient_dot_product": -21.59337043762207,
        "input_gradient_cosine_similarity": 12.993361473083496,
        "input_gradient_l2_distance": -29.712099075317383,
        "input_gradient_dot_product": -46.37088394165039
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5427946514004536,
      "val_r": 0.729594345604001,
      "n_iterations": 463,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.86621379852295,
        "right_subspace_overlap_bottom_k": -11.850199699401855,
        "interaction_matrix_overlap_top_k": -7.310124397277832,
        "interaction_matrix_overlap_bottom_k": 41.57493209838867,
        "effective_rank": 17.086896896362305,
        "effective_rank_mergeability_score": 38.93622589111328,
        "stable_rank": -5.08089542388916,
        "spectral_gap": 1.5874253511428833,
        "singular_value_ratio": -7.709202289581299,
        "layerwise_effective_rank": 10.572263717651367,
        "layerwise_effective_rank_mergeability_score": -21.775461196899414,
        "task_vector_cosine_similarity": 21.935781478881836,
        "task_vector_l2_distance": -15.877445220947266,
        "task_vector_dot_product": 6.041308879852295,
        "weight_space_angle": 24.15760040283203,
        "task_vector_magnitude_ratio": -10.384069442749023,
        "singular_value_overlap": -14.625484466552734,
        "subspace_overlap": 9.772543907165527,
        "activation_l2_distance": -11.536285400390625,
        "activation_cosine_similarity": 1.4460417032241821,
        "activation_magnitude_ratio": -6.909881114959717,
        "activation_dot_product": 24.64700698852539,
        "encoder_gradient_cosine_similarity": -3.8050804138183594,
        "encoder_gradient_l2_distance": -34.82926559448242,
        "encoder_gradient_dot_product": 0.9487921595573425,
        "input_gradient_cosine_similarity": 9.922460556030273,
        "input_gradient_l2_distance": -53.8760871887207,
        "input_gradient_dot_product": -8.491686820983887
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3125463051093166,
      "val_r": 0.5421903501193377,
      "n_iterations": 602,
      "coefficients": {
        "right_subspace_overlap_top_k": -21.232948303222656,
        "right_subspace_overlap_bottom_k": 35.03164291381836,
        "interaction_matrix_overlap_top_k": 41.41282653808594,
        "interaction_matrix_overlap_bottom_k": -44.122188568115234,
        "effective_rank": -90.47598266601562,
        "effective_rank_mergeability_score": -3.3712520599365234,
        "stable_rank": 61.45185089111328,
        "spectral_gap": -9.501459121704102,
        "singular_value_ratio": -57.053279876708984,
        "layerwise_effective_rank": -0.2670879364013672,
        "layerwise_effective_rank_mergeability_score": -48.63814163208008,
        "task_vector_cosine_similarity": 24.050853729248047,
        "task_vector_l2_distance": 35.393165588378906,
        "task_vector_dot_product": 54.22669219970703,
        "weight_space_angle": -50.43867492675781,
        "task_vector_magnitude_ratio": -47.20144271850586,
        "singular_value_overlap": -53.144927978515625,
        "subspace_overlap": 61.4846076965332,
        "activation_l2_distance": -27.287546157836914,
        "activation_cosine_similarity": 4.24669075012207,
        "activation_magnitude_ratio": -15.255441665649414,
        "activation_dot_product": 108.87320709228516,
        "encoder_gradient_cosine_similarity": 8.554911613464355,
        "encoder_gradient_l2_distance": 3.7783045768737793,
        "encoder_gradient_dot_product": 38.811676025390625,
        "input_gradient_cosine_similarity": 24.71049690246582,
        "input_gradient_l2_distance": -61.2934684753418,
        "input_gradient_dot_product": -16.40106773376465
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5593380098179652,
      "val_r": 0.04657858956688325,
      "n_iterations": 82,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.5575430393218994,
        "right_subspace_overlap_bottom_k": -0.5596252083778381,
        "interaction_matrix_overlap_top_k": 2.839726686477661,
        "interaction_matrix_overlap_bottom_k": 1.167256236076355,
        "effective_rank": -0.11004746705293655,
        "effective_rank_mergeability_score": 0.5568341612815857,
        "stable_rank": -1.5077052116394043,
        "spectral_gap": 1.8607685565948486,
        "singular_value_ratio": 0.754018247127533,
        "layerwise_effective_rank": 0.1910262554883957,
        "layerwise_effective_rank_mergeability_score": -1.3732330799102783,
        "task_vector_cosine_similarity": 1.9422258138656616,
        "task_vector_l2_distance": -2.90183687210083,
        "task_vector_dot_product": -0.33140385150909424,
        "weight_space_angle": 2.4822447299957275,
        "task_vector_magnitude_ratio": 0.6655574440956116,
        "singular_value_overlap": 0.9368748068809509,
        "subspace_overlap": 2.9332385063171387,
        "activation_l2_distance": -0.7901437282562256,
        "activation_cosine_similarity": 0.29847201704978943,
        "activation_magnitude_ratio": -2.0199382305145264,
        "activation_dot_product": 0.6206237077713013,
        "encoder_gradient_cosine_similarity": 0.5411211252212524,
        "encoder_gradient_l2_distance": -3.660367965698242,
        "encoder_gradient_dot_product": 2.439671277999878,
        "input_gradient_cosine_similarity": 0.20098081231117249,
        "input_gradient_l2_distance": -3.3904271125793457,
        "input_gradient_dot_product": -3.866161584854126
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5332814475923957,
      "val_r": 0.35146048394360185,
      "n_iterations": 764,
      "coefficients": {
        "right_subspace_overlap_top_k": 67.25897216796875,
        "right_subspace_overlap_bottom_k": -25.013975143432617,
        "interaction_matrix_overlap_top_k": 49.130531311035156,
        "interaction_matrix_overlap_bottom_k": 39.88640213012695,
        "effective_rank": 15.31657886505127,
        "effective_rank_mergeability_score": 28.511253356933594,
        "stable_rank": -37.2973518371582,
        "spectral_gap": 16.752912521362305,
        "singular_value_ratio": 4.984354019165039,
        "layerwise_effective_rank": 14.005823135375977,
        "layerwise_effective_rank_mergeability_score": 3.194840431213379,
        "task_vector_cosine_similarity": 24.92837142944336,
        "task_vector_l2_distance": -41.064308166503906,
        "task_vector_dot_product": -16.30060386657715,
        "weight_space_angle": 4.430484771728516,
        "task_vector_magnitude_ratio": 27.757638931274414,
        "singular_value_overlap": -64.58381652832031,
        "subspace_overlap": -9.325819969177246,
        "activation_l2_distance": -31.81072425842285,
        "activation_cosine_similarity": -14.769776344299316,
        "activation_magnitude_ratio": -22.660810470581055,
        "activation_dot_product": 42.27481460571289,
        "encoder_gradient_cosine_similarity": 17.931289672851562,
        "encoder_gradient_l2_distance": -39.53450393676758,
        "encoder_gradient_dot_product": 36.82197952270508,
        "input_gradient_cosine_similarity": 13.555611610412598,
        "input_gradient_l2_distance": -54.54294204711914,
        "input_gradient_dot_product": -75.6277084350586
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6028453507848948,
      "val_r": 0.3771145186163264,
      "n_iterations": 101,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.8210006952285767,
        "right_subspace_overlap_bottom_k": -0.15056569874286652,
        "interaction_matrix_overlap_top_k": -0.6412796974182129,
        "interaction_matrix_overlap_bottom_k": 2.891528844833374,
        "effective_rank": 1.7878915071487427,
        "effective_rank_mergeability_score": -0.7035937905311584,
        "stable_rank": -2.0675437450408936,
        "spectral_gap": 0.7686418890953064,
        "singular_value_ratio": 0.5198497772216797,
        "layerwise_effective_rank": -0.02876179851591587,
        "layerwise_effective_rank_mergeability_score": 0.6284816861152649,
        "task_vector_cosine_similarity": 1.440178394317627,
        "task_vector_l2_distance": -2.40437388420105,
        "task_vector_dot_product": -0.10308153182268143,
        "weight_space_angle": 1.8056291341781616,
        "task_vector_magnitude_ratio": -0.6623445153236389,
        "singular_value_overlap": -1.6620337963104248,
        "subspace_overlap": -0.3860682547092438,
        "activation_l2_distance": 0.6859055757522583,
        "activation_cosine_similarity": 1.3564730882644653,
        "activation_magnitude_ratio": -0.6559566259384155,
        "activation_dot_product": 0.46570244431495667,
        "encoder_gradient_cosine_similarity": 0.11811262369155884,
        "encoder_gradient_l2_distance": -2.210766077041626,
        "encoder_gradient_dot_product": 0.6715587377548218,
        "input_gradient_cosine_similarity": 1.5613633394241333,
        "input_gradient_l2_distance": -4.040473937988281,
        "input_gradient_dot_product": -0.5458477139472961
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8131460980706349,
      "val_r": 0.6730171496755554,
      "n_iterations": 139,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9404190182685852,
        "right_subspace_overlap_bottom_k": -1.7105122804641724,
        "interaction_matrix_overlap_top_k": 0.5709906816482544,
        "interaction_matrix_overlap_bottom_k": 0.7855408191680908,
        "effective_rank": -0.09485536813735962,
        "effective_rank_mergeability_score": -0.1252785176038742,
        "stable_rank": 0.2827313244342804,
        "spectral_gap": 0.4481615722179413,
        "singular_value_ratio": 0.19336213171482086,
        "layerwise_effective_rank": -0.645535945892334,
        "layerwise_effective_rank_mergeability_score": 0.2113039344549179,
        "task_vector_cosine_similarity": -0.4309379458427429,
        "task_vector_l2_distance": 0.09540344029664993,
        "task_vector_dot_product": 0.19553320109844208,
        "weight_space_angle": 0.9972664713859558,
        "task_vector_magnitude_ratio": 0.4607841968536377,
        "singular_value_overlap": -0.05735386162996292,
        "subspace_overlap": -0.01397744007408619,
        "activation_l2_distance": -0.055361662060022354,
        "activation_cosine_similarity": 0.5713040828704834,
        "activation_magnitude_ratio": -0.06478659063577652,
        "activation_dot_product": 0.24264618754386902,
        "encoder_gradient_cosine_similarity": 0.38252151012420654,
        "encoder_gradient_l2_distance": -1.1327948570251465,
        "encoder_gradient_dot_product": 0.33494439721107483,
        "input_gradient_cosine_similarity": -0.028754454106092453,
        "input_gradient_l2_distance": -0.9915743470191956,
        "input_gradient_dot_product": -0.7836977243423462
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4690687006303482,
      "val_r": 0.0908742929518947,
      "n_iterations": 791,
      "coefficients": {
        "right_subspace_overlap_top_k": 85.90338134765625,
        "right_subspace_overlap_bottom_k": -56.017417907714844,
        "interaction_matrix_overlap_top_k": 2.7512047290802,
        "interaction_matrix_overlap_bottom_k": 88.14535522460938,
        "effective_rank": -26.432449340820312,
        "effective_rank_mergeability_score": -48.63050842285156,
        "stable_rank": -58.085140228271484,
        "spectral_gap": -24.601478576660156,
        "singular_value_ratio": -25.895572662353516,
        "layerwise_effective_rank": 4.703769207000732,
        "layerwise_effective_rank_mergeability_score": -12.11481761932373,
        "task_vector_cosine_similarity": 50.362667083740234,
        "task_vector_l2_distance": -100.43136596679688,
        "task_vector_dot_product": 41.77426528930664,
        "weight_space_angle": 2.7390525341033936,
        "task_vector_magnitude_ratio": -30.757299423217773,
        "singular_value_overlap": -115.68717193603516,
        "subspace_overlap": 81.42311096191406,
        "activation_l2_distance": -33.052947998046875,
        "activation_cosine_similarity": -25.138626098632812,
        "activation_magnitude_ratio": -36.26564407348633,
        "activation_dot_product": 103.3575439453125,
        "encoder_gradient_cosine_similarity": 73.6261978149414,
        "encoder_gradient_l2_distance": -34.70211410522461,
        "encoder_gradient_dot_product": 62.41127014160156,
        "input_gradient_cosine_similarity": 124.96775817871094,
        "input_gradient_l2_distance": -49.25468444824219,
        "input_gradient_dot_product": -46.372859954833984
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}