{
  "aggregate_metrics": {
    "train_mse": 25.369529973883203,
    "train_r2": -7183.166842571682,
    "train_pearson_r": -0.00840698615932825,
    "train_pearson_p": 0.6333434719933269,
    "val_mse": 36.654481386195805,
    "val_r2": -10378.849694729162,
    "val_pearson_r": -0.0029448080897597952,
    "val_pearson_p": 0.9557212942646698
  },
  "per_fold_stats": {
    "train_mse_mean": 25.53688115633603,
    "train_mse_std": 103.57236926618279,
    "val_mse_mean": 34.54967890944381,
    "val_mse_std": 144.46447303261232,
    "train_r_mean": 0.1792491015710598,
    "train_r_std": 0.2829509031001972,
    "val_r_mean": 0.07050800523315728,
    "val_r_std": 0.3108038543721988
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.49118074774742126,
    "right_subspace_overlap_bottom_k": -0.07264728844165802,
    "interaction_matrix_overlap_top_k": -0.2584740221500397,
    "interaction_matrix_overlap_bottom_k": -0.2751474380493164,
    "effective_rank": 0.04194309189915657,
    "effective_rank_mergeability_score": -0.5323687195777893,
    "stable_rank": 0.2875727117061615,
    "spectral_gap": -0.5615673065185547,
    "singular_value_ratio": 0.13742555677890778,
    "layerwise_effective_rank": -0.24619996547698975,
    "layerwise_effective_rank_mergeability_score": -0.33378154039382935,
    "task_vector_cosine_similarity": 0.3877089321613312,
    "task_vector_l2_distance": 0.141163632273674,
    "task_vector_dot_product": 0.4344313144683838,
    "weight_space_angle": 0.5862447023391724,
    "task_vector_magnitude_ratio": 0.11917342990636826,
    "singular_value_overlap": 0.13661114871501923,
    "subspace_overlap": -0.9108210802078247,
    "right_subspace_overlap": -0.4325525760650635,
    "activation_l2_distance": 0.3966771960258484,
    "activation_cosine_similarity": 0.0922483280301094,
    "activation_magnitude_ratio": 0.14647266268730164,
    "activation_dot_product": 0.4417017102241516,
    "encoder_gradient_cosine_similarity": 0.4309094548225403,
    "encoder_gradient_l2_distance": 0.33690136671066284,
    "encoder_gradient_dot_product": -0.5964588522911072,
    "input_gradient_cosine_similarity": 0.37651506066322327,
    "input_gradient_l2_distance": 0.19318506121635437,
    "input_gradient_dot_product": 0.034424297511577606
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 2.212162494659424,
    "right_subspace_overlap_bottom_k": 0.9689323902130127,
    "interaction_matrix_overlap_top_k": 1.8773070573806763,
    "interaction_matrix_overlap_bottom_k": 3.2985281944274902,
    "effective_rank": 1.4739174842834473,
    "effective_rank_mergeability_score": 1.8611639738082886,
    "stable_rank": 2.244232416152954,
    "spectral_gap": 2.880911350250244,
    "singular_value_ratio": 2.7769079208374023,
    "layerwise_effective_rank": 2.0178842544555664,
    "layerwise_effective_rank_mergeability_score": 1.0447567701339722,
    "task_vector_cosine_similarity": 4.206647872924805,
    "task_vector_l2_distance": 1.811143398284912,
    "task_vector_dot_product": 1.7809165716171265,
    "weight_space_angle": 2.673119068145752,
    "task_vector_magnitude_ratio": 0.8952328562736511,
    "singular_value_overlap": 1.5416101217269897,
    "subspace_overlap": 4.117164611816406,
    "right_subspace_overlap": 3.4015040397644043,
    "activation_l2_distance": 1.56473970413208,
    "activation_cosine_similarity": 1.8943023681640625,
    "activation_magnitude_ratio": 0.8496588468551636,
    "activation_dot_product": 2.0479447841644287,
    "encoder_gradient_cosine_similarity": 1.0532304048538208,
    "encoder_gradient_l2_distance": 2.3635878562927246,
    "encoder_gradient_dot_product": 2.1953823566436768,
    "input_gradient_cosine_similarity": 1.9505232572555542,
    "input_gradient_l2_distance": 0.9390873312950134,
    "input_gradient_dot_product": 1.638098955154419
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 2.335065632448343,
      "train_r2": -699.4341433497739,
      "train_pearson_r": -0.10667782378333449,
      "val_mse": 2.3663696248017936,
      "val_r2": -1551.201244029165,
      "val_pearson_r": -0.03771063536156652,
      "n_iterations": 61,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.8046399354934692,
        "right_subspace_overlap_bottom_k": 0.01310704741626978,
        "interaction_matrix_overlap_top_k": 1.4372572898864746,
        "interaction_matrix_overlap_bottom_k": 1.2640669345855713,
        "effective_rank": -2.0103468894958496,
        "effective_rank_mergeability_score": -1.6488672494888306,
        "stable_rank": -0.29944777488708496,
        "spectral_gap": -0.056719981133937836,
        "singular_value_ratio": 0.38229095935821533,
        "layerwise_effective_rank": -0.10535129904747009,
        "layerwise_effective_rank_mergeability_score": -0.41558966040611267,
        "task_vector_cosine_similarity": -0.9740012288093567,
        "task_vector_l2_distance": 2.411975622177124,
        "task_vector_dot_product": -0.8806260228157043,
        "weight_space_angle": 1.4059170484542847,
        "task_vector_magnitude_ratio": -0.43879491090774536,
        "singular_value_overlap": -0.34815680980682373,
        "subspace_overlap": 1.7406615018844604,
        "right_subspace_overlap": 0.06845008581876755,
        "activation_l2_distance": 0.2565516233444214,
        "activation_cosine_similarity": -0.23517026007175446,
        "activation_magnitude_ratio": 0.7604434490203857,
        "activation_dot_product": -0.0794607624411583,
        "encoder_gradient_cosine_similarity": 1.007149577140808,
        "encoder_gradient_l2_distance": -0.6068378686904907,
        "encoder_gradient_dot_product": 0.3245680034160614,
        "input_gradient_cosine_similarity": -0.029024118557572365,
        "input_gradient_l2_distance": 0.4482973515987396,
        "input_gradient_dot_product": -1.6253703832626343
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.4980280091951502,
      "train_r2": -136.56115282844675,
      "train_pearson_r": -0.3242885978209018,
      "val_mse": 0.492406637483008,
      "val_r2": -291.5110784044485,
      "val_pearson_r": -0.2622825839666062,
      "n_iterations": 55,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.32506832480430603,
        "right_subspace_overlap_bottom_k": -0.2530561089515686,
        "interaction_matrix_overlap_top_k": -0.09380067884922028,
        "interaction_matrix_overlap_bottom_k": 0.42403414845466614,
        "effective_rank": -0.9093276858329773,
        "effective_rank_mergeability_score": 0.5760561227798462,
        "stable_rank": 0.240371435880661,
        "spectral_gap": 0.15242400765419006,
        "singular_value_ratio": 0.6690794825553894,
        "layerwise_effective_rank": -0.18650589883327484,
        "layerwise_effective_rank_mergeability_score": -0.5361496210098267,
        "task_vector_cosine_similarity": -0.2007555067539215,
        "task_vector_l2_distance": 0.6217156052589417,
        "task_vector_dot_product": -0.5779979825019836,
        "weight_space_angle": -0.3871016502380371,
        "task_vector_magnitude_ratio": 0.444272518157959,
        "singular_value_overlap": -0.028744805604219437,
        "subspace_overlap": -0.7189441919326782,
        "right_subspace_overlap": -0.771342933177948,
        "activation_l2_distance": -0.10053893178701401,
        "activation_cosine_similarity": -0.10845425724983215,
        "activation_magnitude_ratio": 1.141802191734314,
        "activation_dot_product": -0.1925705075263977,
        "encoder_gradient_cosine_similarity": 0.8066096901893616,
        "encoder_gradient_l2_distance": 1.2067508697509766,
        "encoder_gradient_dot_product": 0.36606064438819885,
        "input_gradient_cosine_similarity": -0.3507368862628937,
        "input_gradient_l2_distance": -0.49010491371154785,
        "input_gradient_dot_product": -0.07402987033128738
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 22.428593858772167,
      "train_r2": -6176.212330071324,
      "train_pearson_r": -0.06403056944861224,
      "val_mse": 20.786403336861085,
      "val_r2": -10318.235809848444,
      "val_pearson_r": -0.11300886962898024,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": -2.4669930934906006,
        "right_subspace_overlap_bottom_k": 3.469865083694458,
        "interaction_matrix_overlap_top_k": 0.5845297574996948,
        "interaction_matrix_overlap_bottom_k": 6.1941237449646,
        "effective_rank": -4.441277503967285,
        "effective_rank_mergeability_score": -1.8942112922668457,
        "stable_rank": 1.5079234838485718,
        "spectral_gap": 3.9129257202148438,
        "singular_value_ratio": -4.806225299835205,
        "layerwise_effective_rank": 3.4819657802581787,
        "layerwise_effective_rank_mergeability_score": -2.151150941848755,
        "task_vector_cosine_similarity": -9.829425811767578,
        "task_vector_l2_distance": -0.759151816368103,
        "task_vector_dot_product": 1.2689749002456665,
        "weight_space_angle": -5.371304035186768,
        "task_vector_magnitude_ratio": 2.098572015762329,
        "singular_value_overlap": 3.0177316665649414,
        "subspace_overlap": -4.763068675994873,
        "right_subspace_overlap": 3.471689462661743,
        "activation_l2_distance": 2.254373550415039,
        "activation_cosine_similarity": 2.8649661540985107,
        "activation_magnitude_ratio": 0.49800026416778564,
        "activation_dot_product": 4.686839580535889,
        "encoder_gradient_cosine_similarity": -0.2743563652038574,
        "encoder_gradient_l2_distance": -2.9759511947631836,
        "encoder_gradient_dot_product": -9.30392074584961,
        "input_gradient_cosine_similarity": 3.96216082572937,
        "input_gradient_l2_distance": 2.3309409618377686,
        "input_gradient_dot_product": 4.4100022315979
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 1.0123356334900682,
      "train_r2": -283.97247629158284,
      "train_pearson_r": -0.12744178913649387,
      "val_mse": 0.7342876896213559,
      "val_r2": -418.85609672198916,
      "val_pearson_r": -0.23808876944796897,
      "n_iterations": 123,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.9413014054298401,
        "right_subspace_overlap_bottom_k": -1.0604901313781738,
        "interaction_matrix_overlap_top_k": -3.641871929168701,
        "interaction_matrix_overlap_bottom_k": 1.5133858919143677,
        "effective_rank": 1.1871129274368286,
        "effective_rank_mergeability_score": 1.2689976692199707,
        "stable_rank": -0.8481199741363525,
        "spectral_gap": -1.755454659461975,
        "singular_value_ratio": 0.21181055903434753,
        "layerwise_effective_rank": 0.4099409580230713,
        "layerwise_effective_rank_mergeability_score": 1.2801849842071533,
        "task_vector_cosine_similarity": 3.2292120456695557,
        "task_vector_l2_distance": 1.299109935760498,
        "task_vector_dot_product": 0.1807389259338379,
        "weight_space_angle": -0.2600492835044861,
        "task_vector_magnitude_ratio": -0.1517050713300705,
        "singular_value_overlap": 0.09215690195560455,
        "subspace_overlap": -1.8515243530273438,
        "right_subspace_overlap": 2.1683874130249023,
        "activation_l2_distance": -0.27276042103767395,
        "activation_cosine_similarity": 1.0673532485961914,
        "activation_magnitude_ratio": -0.3546810746192932,
        "activation_dot_product": -0.8126624822616577,
        "encoder_gradient_cosine_similarity": 0.10368287563323975,
        "encoder_gradient_l2_distance": 1.6842199563980103,
        "encoder_gradient_dot_product": 0.839338481426239,
        "input_gradient_cosine_similarity": -2.7399771213531494,
        "input_gradient_l2_distance": -0.4181748032569885,
        "input_gradient_dot_product": -0.43668434023857117
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.05012060933014964,
      "train_r2": -12.98927364975714,
      "train_pearson_r": 0.1875404646163995,
      "val_mse": 0.043135508793776416,
      "val_r2": -18.004003841075985,
      "val_pearson_r": 0.02560232922128426,
      "n_iterations": 296,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5259504318237305,
        "right_subspace_overlap_bottom_k": -0.4307129383087158,
        "interaction_matrix_overlap_top_k": 0.42386552691459656,
        "interaction_matrix_overlap_bottom_k": 0.1848170906305313,
        "effective_rank": -0.001318363705649972,
        "effective_rank_mergeability_score": 0.8342218995094299,
        "stable_rank": -0.1504540592432022,
        "spectral_gap": -0.6599244475364685,
        "singular_value_ratio": -0.3269902169704437,
        "layerwise_effective_rank": 0.9106295108795166,
        "layerwise_effective_rank_mergeability_score": -0.1864033043384552,
        "task_vector_cosine_similarity": 0.08535809069871902,
        "task_vector_l2_distance": 0.18835383653640747,
        "task_vector_dot_product": -0.44694745540618896,
        "weight_space_angle": 0.37348031997680664,
        "task_vector_magnitude_ratio": -0.3352809250354767,
        "singular_value_overlap": 0.3788592517375946,
        "subspace_overlap": -0.0718473270535469,
        "right_subspace_overlap": -0.5799144506454468,
        "activation_l2_distance": 0.18240800499916077,
        "activation_cosine_similarity": 0.13785672187805176,
        "activation_magnitude_ratio": 0.028685610741376877,
        "activation_dot_product": 0.14060263335704803,
        "encoder_gradient_cosine_similarity": 0.2887648046016693,
        "encoder_gradient_l2_distance": 0.06229483336210251,
        "encoder_gradient_dot_product": 0.18317361176013947,
        "input_gradient_cosine_similarity": -0.14768750965595245,
        "input_gradient_l2_distance": 0.01591760478913784,
        "input_gradient_dot_product": -0.6101395487785339
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_mse": 6.827197209487792,
      "train_r2": -1905.4914882380167,
      "train_pearson_r": -0.11035815380615344,
      "val_mse": 1.4426218877903965,
      "val_r2": -823.1078642698473,
      "val_pearson_r": 0.04695408427247934,
      "n_iterations": 60,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.1095550060272217,
        "right_subspace_overlap_bottom_k": -1.8060457706451416,
        "interaction_matrix_overlap_top_k": -3.588289499282837,
        "interaction_matrix_overlap_bottom_k": -0.9053723216056824,
        "effective_rank": -0.4872592091560364,
        "effective_rank_mergeability_score": -3.946514129638672,
        "stable_rank": -2.2907629013061523,
        "spectral_gap": -1.3679742813110352,
        "singular_value_ratio": -1.9120988845825195,
        "layerwise_effective_rank": -1.76518976688385,
        "layerwise_effective_rank_mergeability_score": -0.06779622286558151,
        "task_vector_cosine_similarity": 0.7049704790115356,
        "task_vector_l2_distance": 4.490325450897217,
        "task_vector_dot_product": -0.29328882694244385,
        "weight_space_angle": 0.140584796667099,
        "task_vector_magnitude_ratio": 1.4452416896820068,
        "singular_value_overlap": 3.127925157546997,
        "subspace_overlap": 2.5143048763275146,
        "right_subspace_overlap": 0.6779171228408813,
        "activation_l2_distance": -2.691465377807617,
        "activation_cosine_similarity": 1.2171456813812256,
        "activation_magnitude_ratio": 2.1358160972595215,
        "activation_dot_product": -2.3482718467712402,
        "encoder_gradient_cosine_similarity": 1.5407594442367554,
        "encoder_gradient_l2_distance": -1.2301616668701172,
        "encoder_gradient_dot_product": -2.8533568382263184,
        "input_gradient_cosine_similarity": 0.9525247812271118,
        "input_gradient_l2_distance": 3.2889063358306885,
        "input_gradient_dot_product": 4.155373573303223
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_mse": 0.008221230631572454,
      "train_r2": -1.3444249776163577,
      "train_pearson_r": 0.39174710945141106,
      "val_mse": 0.06757216360098722,
      "val_r2": -49.05602565720321,
      "val_pearson_r": -0.3731535034946855,
      "n_iterations": 498,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.16957594454288483,
        "right_subspace_overlap_bottom_k": 0.030012689530849457,
        "interaction_matrix_overlap_top_k": -0.11760368198156357,
        "interaction_matrix_overlap_bottom_k": -0.11357004195451736,
        "effective_rank": 0.039740752428770065,
        "effective_rank_mergeability_score": 0.011882560327649117,
        "stable_rank": -0.24854609370231628,
        "spectral_gap": 0.21703346073627472,
        "singular_value_ratio": 0.08003011345863342,
        "layerwise_effective_rank": 0.32903268933296204,
        "layerwise_effective_rank_mergeability_score": 0.002698990050703287,
        "task_vector_cosine_similarity": 0.3125002384185791,
        "task_vector_l2_distance": 0.09372766315937042,
        "task_vector_dot_product": -0.4546149671077728,
        "weight_space_angle": 0.3322305977344513,
        "task_vector_magnitude_ratio": 0.12068261951208115,
        "singular_value_overlap": 0.12021558731794357,
        "subspace_overlap": -0.03953051194548607,
        "right_subspace_overlap": 0.025439472869038582,
        "activation_l2_distance": 0.21233844757080078,
        "activation_cosine_similarity": 0.24785888195037842,
        "activation_magnitude_ratio": 0.056187137961387634,
        "activation_dot_product": -0.01972304843366146,
        "encoder_gradient_cosine_similarity": 0.04635559394955635,
        "encoder_gradient_l2_distance": -0.18165425956249237,
        "encoder_gradient_dot_product": 0.07677225023508072,
        "input_gradient_cosine_similarity": -0.23282453417778015,
        "input_gradient_l2_distance": -0.054235681891441345,
        "input_gradient_dot_product": -0.062378499656915665
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.013601017052557693,
      "train_r2": -3.0580782750281426,
      "train_pearson_r": 0.28273183678852454,
      "val_mse": 0.05006858778932872,
      "val_r2": -26.088317312813146,
      "val_pearson_r": 0.3316140819784963,
      "n_iterations": 113,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.07568168640136719,
        "right_subspace_overlap_bottom_k": -0.06294771283864975,
        "interaction_matrix_overlap_top_k": -0.023612072691321373,
        "interaction_matrix_overlap_bottom_k": 0.006939372513443232,
        "effective_rank": 0.4070219397544861,
        "effective_rank_mergeability_score": 0.15917754173278809,
        "stable_rank": -0.2245718389749527,
        "spectral_gap": 0.22193248569965363,
        "singular_value_ratio": -0.18865567445755005,
        "layerwise_effective_rank": 0.1620994210243225,
        "layerwise_effective_rank_mergeability_score": 0.09978175908327103,
        "task_vector_cosine_similarity": -0.03345513343811035,
        "task_vector_l2_distance": 0.03593230992555618,
        "task_vector_dot_product": 0.13845835626125336,
        "weight_space_angle": 0.2710597515106201,
        "task_vector_magnitude_ratio": 0.3517487645149231,
        "singular_value_overlap": 0.18943169713020325,
        "subspace_overlap": -0.3366999626159668,
        "right_subspace_overlap": 0.1472785770893097,
        "activation_l2_distance": -0.04162700101733208,
        "activation_cosine_similarity": 0.036138057708740234,
        "activation_magnitude_ratio": 0.04009250923991203,
        "activation_dot_product": 0.0469173789024353,
        "encoder_gradient_cosine_similarity": 0.06310989707708359,
        "encoder_gradient_l2_distance": 0.03180878609418869,
        "encoder_gradient_dot_product": 0.18160417675971985,
        "input_gradient_cosine_similarity": -0.24092504382133484,
        "input_gradient_l2_distance": -0.2880406677722931,
        "input_gradient_dot_product": -0.0775517076253891
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_mse": 0.0271780178425261,
      "train_r2": -6.569035130795441,
      "train_pearson_r": 0.1230867284338681,
      "val_mse": 0.048402210889112784,
      "val_r2": -16.60688516473354,
      "val_pearson_r": 0.49137100520720844,
      "n_iterations": 112,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011433741077780724,
        "right_subspace_overlap_bottom_k": -0.2635263204574585,
        "interaction_matrix_overlap_top_k": 0.03899678960442543,
        "interaction_matrix_overlap_bottom_k": 0.24006113409996033,
        "effective_rank": 0.055504895746707916,
        "effective_rank_mergeability_score": 0.13837452232837677,
        "stable_rank": 0.11394944787025452,
        "spectral_gap": 0.2577327787876129,
        "singular_value_ratio": 0.006635558325797319,
        "layerwise_effective_rank": 0.27438730001449585,
        "layerwise_effective_rank_mergeability_score": -0.13120393455028534,
        "task_vector_cosine_similarity": -0.04693824425339699,
        "task_vector_l2_distance": 0.08125706762075424,
        "task_vector_dot_product": 0.0641435980796814,
        "weight_space_angle": 0.28702354431152344,
        "task_vector_magnitude_ratio": -0.06771818548440933,
        "singular_value_overlap": 0.1039644181728363,
        "subspace_overlap": 0.05039007589221001,
        "right_subspace_overlap": -0.40174156427383423,
        "activation_l2_distance": 0.02260473370552063,
        "activation_cosine_similarity": 0.23264434933662415,
        "activation_magnitude_ratio": 0.09120301902294159,
        "activation_dot_product": -0.039715275168418884,
        "encoder_gradient_cosine_similarity": 0.09703658521175385,
        "encoder_gradient_l2_distance": -0.3219609558582306,
        "encoder_gradient_dot_product": -0.027163879945874214,
        "input_gradient_cosine_similarity": 0.1427600085735321,
        "input_gradient_l2_distance": -0.047350622713565826,
        "input_gradient_dot_product": 0.03676128014922142
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 476.47721267939517,
      "train_r2": -146478.89400616646,
      "train_pearson_r": -0.0010536826302935814,
      "val_mse": 663.9521788795038,
      "val_r2": -199727.08713760594,
      "val_pearson_r": 0.31508104744104976,
      "n_iterations": 52,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.434085845947266,
        "right_subspace_overlap_bottom_k": -0.7510902285575867,
        "interaction_matrix_overlap_top_k": 5.745115280151367,
        "interaction_matrix_overlap_bottom_k": -13.179398536682129,
        "effective_rank": 3.81300950050354,
        "effective_rank_mergeability_score": -7.065197944641113,
        "stable_rank": 9.489709854125977,
        "spectral_gap": -12.212890625,
        "singular_value_ratio": 11.182500839233398,
        "layerwise_effective_rank": -7.8725996017456055,
        "layerwise_effective_rank_mergeability_score": -3.440272808074951,
        "task_vector_cosine_similarity": 15.668519973754883,
        "task_vector_l2_distance": -6.093760013580322,
        "task_vector_dot_product": 7.775505542755127,
        "weight_space_angle": 10.604693412780762,
        "task_vector_magnitude_ratio": -2.6869091987609863,
        "singular_value_overlap": -5.244704246520996,
        "subspace_overlap": -17.630775451660156,
        "right_subspace_overlap": -14.681940078735352,
        "activation_l2_distance": 6.048007011413574,
        "activation_cosine_similarity": -7.602232456207275,
        "activation_magnitude_ratio": -2.7087066173553467,
        "activation_dot_product": 7.671995162963867,
        "encoder_gradient_cosine_similarity": 4.626860618591309,
        "encoder_gradient_l2_distance": 9.881120681762695,
        "encoder_gradient_dot_product": -2.6708288192749023,
        "input_gradient_cosine_similarity": 7.3700432777404785,
        "input_gradient_l2_distance": -0.9766027331352234,
        "input_gradient_dot_product": -3.5040931701660156
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.008373200191702086,
      "train_r2": -1.8483450247490976,
      "train_pearson_r": 0.538985638019935,
      "val_mse": 0.01717326979521916,
      "val_r2": -11.91012815194397,
      "val_pearson_r": 0.21833783217268507,
      "n_iterations": 232,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.12133743613958359,
        "right_subspace_overlap_bottom_k": -0.09956487268209457,
        "interaction_matrix_overlap_top_k": 0.0644129291176796,
        "interaction_matrix_overlap_bottom_k": -0.0486823134124279,
        "effective_rank": 0.14559583365917206,
        "effective_rank_mergeability_score": -0.16584190726280212,
        "stable_rank": -0.0860387533903122,
        "spectral_gap": 0.5456593632698059,
        "singular_value_ratio": 0.3294062912464142,
        "layerwise_effective_rank": 0.10892347991466522,
        "layerwise_effective_rank_mergeability_score": 0.1896226406097412,
        "task_vector_cosine_similarity": -0.10666650533676147,
        "task_vector_l2_distance": 0.06831710785627365,
        "task_vector_dot_product": 0.0726219192147255,
        "weight_space_angle": 0.17759576439857483,
        "task_vector_magnitude_ratio": 0.09978950023651123,
        "singular_value_overlap": 0.12655088305473328,
        "subspace_overlap": -0.2248317301273346,
        "right_subspace_overlap": 0.20007745921611786,
        "activation_l2_distance": 0.029311101883649826,
        "activation_cosine_similarity": 0.27074968814849854,
        "activation_magnitude_ratio": 0.023828303441405296,
        "activation_dot_product": -0.13085094094276428,
        "encoder_gradient_cosine_similarity": 0.009289327077567577,
        "encoder_gradient_l2_distance": -0.3029657006263733,
        "encoder_gradient_dot_product": 0.09781337529420853,
        "input_gradient_cosine_similarity": -0.11992551386356354,
        "input_gradient_l2_distance": -0.04441666603088379,
        "input_gradient_dot_product": -0.10840389877557755
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.007581749962365281,
      "train_r2": -1.077871830862029,
      "train_pearson_r": 0.5052572794519404,
      "val_mse": 0.007446269749013798,
      "val_r2": -3.361819093305029,
      "val_pearson_r": 0.3670579231039022,
      "n_iterations": 701,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9120216965675354,
        "right_subspace_overlap_bottom_k": 0.5676639080047607,
        "interaction_matrix_overlap_top_k": 0.08839260041713715,
        "interaction_matrix_overlap_bottom_k": -0.7900233268737793,
        "effective_rank": 0.7804580926895142,
        "effective_rank_mergeability_score": 0.35171589255332947,
        "stable_rank": 0.04817047342658043,
        "spectral_gap": -0.1311623901128769,
        "singular_value_ratio": -0.5143970847129822,
        "layerwise_effective_rank": -0.5232419967651367,
        "layerwise_effective_rank_mergeability_score": -0.16976378858089447,
        "task_vector_cosine_similarity": 0.2563469409942627,
        "task_vector_l2_distance": -0.006178678013384342,
        "task_vector_dot_product": 0.05581904202699661,
        "weight_space_angle": 0.6481209397315979,
        "task_vector_magnitude_ratio": 0.24900779128074646,
        "singular_value_overlap": 0.060692280530929565,
        "subspace_overlap": -0.4858104884624481,
        "right_subspace_overlap": -0.356726735830307,
        "activation_l2_distance": 0.12725643813610077,
        "activation_cosine_similarity": 0.26355043053627014,
        "activation_magnitude_ratio": 0.003717282088473439,
        "activation_dot_product": -0.07980749011039734,
        "encoder_gradient_cosine_similarity": 0.035911232233047485,
        "encoder_gradient_l2_distance": -0.2292715609073639,
        "encoder_gradient_dot_product": 0.0741337388753891,
        "input_gradient_cosine_similarity": -0.10513201355934143,
        "input_gradient_l2_distance": -0.0319729782640934,
        "input_gradient_dot_product": -0.09965645521879196
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.053395387990758415,
      "train_r2": -14.275418292619982,
      "train_pearson_r": -0.027468227909470126,
      "val_mse": 0.14788070727069663,
      "val_r2": -88.39767187142797,
      "val_pearson_r": -0.21589840864048127,
      "n_iterations": 79,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.058340758085250854,
        "right_subspace_overlap_bottom_k": -0.00020018639042973518,
        "interaction_matrix_overlap_top_k": -0.5297384858131409,
        "interaction_matrix_overlap_bottom_k": -0.08637470752000809,
        "effective_rank": 0.7586565017700195,
        "effective_rank_mergeability_score": 0.18906241655349731,
        "stable_rank": 0.44810259342193604,
        "spectral_gap": -0.5072253942489624,
        "singular_value_ratio": -0.5484257936477661,
        "layerwise_effective_rank": -0.08491044491529465,
        "layerwise_effective_rank_mergeability_score": 0.18392841517925262,
        "task_vector_cosine_similarity": 0.597354531288147,
        "task_vector_l2_distance": 0.11620897799730301,
        "task_vector_dot_product": 0.33136287331581116,
        "weight_space_angle": 0.505297064781189,
        "task_vector_magnitude_ratio": -0.49573540687561035,
        "singular_value_overlap": 0.13240502774715424,
        "subspace_overlap": 0.07782711833715439,
        "right_subspace_overlap": -0.13993540406227112,
        "activation_l2_distance": 0.2178342044353485,
        "activation_cosine_similarity": 0.6821919083595276,
        "activation_magnitude_ratio": -0.10370177030563354,
        "activation_dot_product": -0.37101271748542786,
        "encoder_gradient_cosine_similarity": -0.10740114748477936,
        "encoder_gradient_l2_distance": -0.04763941094279289,
        "encoder_gradient_dot_product": 0.011838345788419247,
        "input_gradient_cosine_similarity": 0.0916684940457344,
        "input_gradient_l2_distance": 0.12310396879911423,
        "input_gradient_dot_product": -0.38513442873954773
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.007473485997693824,
      "train_r2": -1.0485066380846662,
      "train_pearson_r": 0.5032514071194463,
      "val_mse": 0.013926526509929142,
      "val_r2": -5.835584725934715,
      "val_pearson_r": 0.07838310425146591,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.21065513789653778,
        "right_subspace_overlap_bottom_k": 0.10578227043151855,
        "interaction_matrix_overlap_top_k": -0.07363462448120117,
        "interaction_matrix_overlap_bottom_k": -0.34568771719932556,
        "effective_rank": 0.5516208410263062,
        "effective_rank_mergeability_score": 0.3274126648902893,
        "stable_rank": 0.025105653330683708,
        "spectral_gap": 0.20078538358211517,
        "singular_value_ratio": -0.4745253324508667,
        "layerwise_effective_rank": -0.07915493100881577,
        "layerwise_effective_rank_mergeability_score": 0.005490483250468969,
        "task_vector_cosine_similarity": 0.009929175488650799,
        "task_vector_l2_distance": 0.10443376749753952,
        "task_vector_dot_product": -0.039466097950935364,
        "weight_space_angle": 0.2573816776275635,
        "task_vector_magnitude_ratio": 0.5552709102630615,
        "singular_value_overlap": 0.11088940501213074,
        "subspace_overlap": -0.0041067106649279594,
        "right_subspace_overlap": -0.09693554043769836,
        "activation_l2_distance": -0.031796377152204514,
        "activation_cosine_similarity": 0.2386624813079834,
        "activation_magnitude_ratio": 0.015147306956350803,
        "activation_dot_product": -0.15803754329681396,
        "encoder_gradient_cosine_similarity": 0.050895288586616516,
        "encoder_gradient_l2_distance": -0.275889128446579,
        "encoder_gradient_dot_product": 0.08285889029502869,
        "input_gradient_cosine_similarity": -0.11010342091321945,
        "input_gradient_l2_distance": -0.0227422583848238,
        "input_gradient_dot_product": -0.1399787962436676
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.3328334906865094,
      "train_r2": -93.91560780611995,
      "train_pearson_r": 0.16585201206816122,
      "val_mse": 0.20684336129828923,
      "val_r2": -75.35868620457529,
      "val_pearson_r": -0.10513814321962589,
      "n_iterations": 138,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.14269594848155975,
        "right_subspace_overlap_bottom_k": -1.080151081085205,
        "interaction_matrix_overlap_top_k": -2.568972110748291,
        "interaction_matrix_overlap_bottom_k": 0.3026536703109741,
        "effective_rank": -0.49502941966056824,
        "effective_rank_mergeability_score": -0.1985287219285965,
        "stable_rank": -1.6893633604049683,
        "spectral_gap": -1.1539297103881836,
        "singular_value_ratio": -0.8403965830802917,
        "layerwise_effective_rank": -1.6171220541000366,
        "layerwise_effective_rank_mergeability_score": -2.2002735137939453,
        "task_vector_cosine_similarity": -0.9578976631164551,
        "task_vector_l2_distance": -0.21606415510177612,
        "task_vector_dot_product": 1.7689549922943115,
        "weight_space_angle": 2.1735482215881348,
        "task_vector_magnitude_ratio": 0.9991854429244995,
        "singular_value_overlap": 0.9020894169807434,
        "subspace_overlap": 2.7647171020507812,
        "right_subspace_overlap": 0.4094597399234772,
        "activation_l2_distance": 1.60055673122406,
        "activation_cosine_similarity": 1.449082612991333,
        "activation_magnitude_ratio": 0.7230449318885803,
        "activation_dot_product": 0.04379895702004433,
        "encoder_gradient_cosine_similarity": -0.22591441869735718,
        "encoder_gradient_l2_distance": 0.7112831473350525,
        "encoder_gradient_dot_product": 0.6067808866500854,
        "input_gradient_cosine_similarity": -0.20730343461036682,
        "input_gradient_l2_distance": -0.2838560938835144,
        "input_gradient_dot_product": 0.12880158424377441
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_mse": 0.006742717899384497,
      "train_r2": -0.8303441850195947,
      "train_pearson_r": 0.5851824788689419,
      "val_mse": 0.020620405557306983,
      "val_r2": -8.939417617518941,
      "val_pearson_r": -0.07289612098670172,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.48031488060951233,
        "right_subspace_overlap_bottom_k": 0.1763298362493515,
        "interaction_matrix_overlap_top_k": -0.2503017485141754,
        "interaction_matrix_overlap_bottom_k": -0.376990407705307,
        "effective_rank": 0.19421450793743134,
        "effective_rank_mergeability_score": -0.08778615295886993,
        "stable_rank": -0.25290027260780334,
        "spectral_gap": 0.12533628940582275,
        "singular_value_ratio": -0.31338149309158325,
        "layerwise_effective_rank": 0.5683045983314514,
        "layerwise_effective_rank_mergeability_score": 0.4503321051597595,
        "task_vector_cosine_similarity": 0.21174515783786774,
        "task_vector_l2_distance": 0.11708679050207138,
        "task_vector_dot_product": -0.4173564314842224,
        "weight_space_angle": 0.07653466612100601,
        "task_vector_magnitude_ratio": 0.3895643651485443,
        "singular_value_overlap": 0.14994554221630096,
        "subspace_overlap": -0.1720498502254486,
        "right_subspace_overlap": 0.012127388268709183,
        "activation_l2_distance": 0.14989987015724182,
        "activation_cosine_similarity": 0.29919442534446716,
        "activation_magnitude_ratio": -0.010861700400710106,
        "activation_dot_product": -0.09592429548501968,
        "encoder_gradient_cosine_similarity": 0.03349417820572853,
        "encoder_gradient_l2_distance": -0.23991864919662476,
        "encoder_gradient_dot_product": 0.07495979964733124,
        "input_gradient_cosine_similarity": -0.12580282986164093,
        "input_gradient_l2_distance": -0.0544871911406517,
        "input_gradient_dot_product": -0.11107978224754333
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_mse": 0.5719975078029667,
      "train_r2": -154.79701182296688,
      "train_pearson_r": -0.23529878646670133,
      "val_mse": 0.36539921906748934,
      "val_r2": -176.63597067916072,
      "val_pearson_r": -0.48099142106763915,
      "n_iterations": 177,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.05816817656159401,
        "right_subspace_overlap_bottom_k": -0.07883394509553909,
        "interaction_matrix_overlap_top_k": -1.506447196006775,
        "interaction_matrix_overlap_bottom_k": 0.9402664303779602,
        "effective_rank": 0.8061920404434204,
        "effective_rank_mergeability_score": -0.02875431627035141,
        "stable_rank": -0.6863300800323486,
        "spectral_gap": 0.19855576753616333,
        "singular_value_ratio": -0.3876039981842041,
        "layerwise_effective_rank": 0.9128277897834778,
        "layerwise_effective_rank_mergeability_score": 0.5148007869720459,
        "task_vector_cosine_similarity": -1.162894606590271,
        "task_vector_l2_distance": 0.250436007976532,
        "task_vector_dot_product": -0.1022343635559082,
        "weight_space_angle": 0.1221405491232872,
        "task_vector_magnitude_ratio": -0.08451054245233536,
        "singular_value_overlap": -0.49561798572540283,
        "subspace_overlap": 0.8088626265525818,
        "right_subspace_overlap": 0.8053515553474426,
        "activation_l2_distance": -0.47530239820480347,
        "activation_cosine_similarity": -0.04056641086935997,
        "activation_magnitude_ratio": 0.25332504510879517,
        "activation_dot_product": 0.6001165509223938,
        "encoder_gradient_cosine_similarity": 0.44516605138778687,
        "encoder_gradient_l2_distance": 0.4055488705635071,
        "encoder_gradient_dot_product": -0.40362226963043213,
        "input_gradient_cosine_similarity": -0.187106654047966,
        "input_gradient_l2_distance": 0.5948416590690613,
        "input_gradient_dot_product": -1.0789297819137573
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.01298895338350799,
      "train_r2": -2.707625741768189,
      "train_pearson_r": 0.3720340981674511,
      "val_mse": 0.020796862023134615,
      "val_r2": -10.330021751836616,
      "val_pearson_r": 0.18815642957415898,
      "n_iterations": 247,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.02001882530748844,
        "right_subspace_overlap_bottom_k": 0.09779561311006546,
        "interaction_matrix_overlap_top_k": 0.09926808625459671,
        "interaction_matrix_overlap_bottom_k": -0.28349563479423523,
        "effective_rank": 0.0965496152639389,
        "effective_rank_mergeability_score": 0.17558255791664124,
        "stable_rank": 0.11570290476083755,
        "spectral_gap": 0.40161654353141785,
        "singular_value_ratio": 0.27622902393341064,
        "layerwise_effective_rank": 0.1105215847492218,
        "layerwise_effective_rank_mergeability_score": 0.005544034298509359,
        "task_vector_cosine_similarity": -0.14170101284980774,
        "task_vector_l2_distance": 0.07225042581558228,
        "task_vector_dot_product": 0.02495776116847992,
        "weight_space_angle": 0.2315635085105896,
        "task_vector_magnitude_ratio": 0.018511135131120682,
        "singular_value_overlap": 0.15082556009292603,
        "subspace_overlap": 0.18094094097614288,
        "right_subspace_overlap": -0.20388935506343842,
        "activation_l2_distance": 0.0058669145219028,
        "activation_cosine_similarity": 0.30286362767219543,
        "activation_magnitude_ratio": 0.013756593689322472,
        "activation_dot_product": -0.2099023312330246,
        "encoder_gradient_cosine_similarity": 0.015475327149033546,
        "encoder_gradient_l2_distance": -0.29493847489356995,
        "encoder_gradient_dot_product": 0.03612484410405159,
        "input_gradient_cosine_similarity": -0.24182912707328796,
        "input_gradient_l2_distance": -0.1142917275428772,
        "input_gradient_dot_product": 0.07877948135137558
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.006700902637991639,
      "train_r2": -0.8433961891311994,
      "train_pearson_r": 0.5600184732766369,
      "val_mse": 0.00549585257262164,
      "val_r2": -2.1848189725234914,
      "val_pearson_r": 0.6648739476486109,
      "n_iterations": 793,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.1370251327753067,
        "right_subspace_overlap_bottom_k": -0.08512023091316223,
        "interaction_matrix_overlap_top_k": -0.4961104393005371,
        "interaction_matrix_overlap_bottom_k": -0.13926613330841064,
        "effective_rank": 0.2783452868461609,
        "effective_rank_mergeability_score": 0.05715831741690636,
        "stable_rank": 0.13494719564914703,
        "spectral_gap": 0.08023453503847122,
        "singular_value_ratio": -0.23481889069080353,
        "layerwise_effective_rank": -0.19735436141490936,
        "layerwise_effective_rank_mergeability_score": 0.03576430305838585,
        "task_vector_cosine_similarity": 0.11269351840019226,
        "task_vector_l2_distance": 0.09038805216550827,
        "task_vector_dot_product": 0.0030702752992510796,
        "weight_space_angle": 0.43810346722602844,
        "task_vector_magnitude_ratio": 0.20131266117095947,
        "singular_value_overlap": 0.10546652227640152,
        "subspace_overlap": 0.0360400527715683,
        "right_subspace_overlap": 0.402768611907959,
        "activation_l2_distance": 0.15989205241203308,
        "activation_cosine_similarity": 0.38017934560775757,
        "activation_magnitude_ratio": 0.005942882504314184,
        "activation_dot_product": -0.1299624741077423,
        "encoder_gradient_cosine_similarity": 0.03855045139789581,
        "encoder_gradient_l2_distance": -0.19841378927230835,
        "encoder_gradient_dot_product": 0.07615713030099869,
        "input_gradient_cosine_similarity": -0.13508984446525574,
        "input_gradient_l2_distance": -0.068963423371315,
        "input_gradient_dot_product": -0.08872000873088837
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_mse": 0.0519818325223104,
      "train_r2": -13.880305702545748,
      "train_pearson_r": 0.36591213616044105,
      "val_mse": 0.2045491878979149,
      "val_r2": -130.67426743916945,
      "val_pearson_r": 0.5818967756060602,
      "n_iterations": 67,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.20462258160114288,
        "right_subspace_overlap_bottom_k": 0.0582372322678566,
        "interaction_matrix_overlap_top_k": -0.7609366178512573,
        "interaction_matrix_overlap_bottom_k": -0.3044355511665344,
        "effective_rank": 0.06939910352230072,
        "effective_rank_mergeability_score": 0.2986840605735779,
        "stable_rank": 0.4040059745311737,
        "spectral_gap": 0.2996985912322998,
        "singular_value_ratio": 0.15804752707481384,
        "layerwise_effective_rank": 0.2387971132993698,
        "layerwise_effective_rank_mergeability_score": -0.14517560601234436,
        "task_vector_cosine_similarity": 0.01928425021469593,
        "task_vector_l2_distance": -0.14309221506118774,
        "task_vector_dot_product": 0.21655063331127167,
        "weight_space_angle": -0.3019258975982666,
        "task_vector_magnitude_ratio": -0.32903674244880676,
        "singular_value_overlap": 0.08029758930206299,
        "subspace_overlap": -0.09097325056791306,
        "right_subspace_overlap": 0.19242805242538452,
        "activation_l2_distance": 0.28013360500335693,
        "activation_cosine_similarity": 0.14095249772071838,
        "activation_magnitude_ratio": 0.31641125679016113,
        "activation_dot_product": 0.3116651773452759,
        "encoder_gradient_cosine_similarity": 0.01674887351691723,
        "encoder_gradient_l2_distance": -0.33939746022224426,
        "encoder_gradient_dot_product": 0.29752951860427856,
        "input_gradient_cosine_similarity": -0.01538790576159954,
        "input_gradient_l2_distance": -0.04306715726852417,
        "input_gradient_dot_product": 0.280918687582016
      }
    }
  ],
  "optimization_params": {
    "objective": "MSE",
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 1e-06
  }
}