{
  "aggregate_metrics": {
    "train_r": 0.4147937331012865,
    "train_p": 3.2574223455771243e-134,
    "val_r": 0.020843985235486483,
    "val_p": 0.6942824418649248
  },
  "per_fold_stats": {
    "train_r_mean": 0.5712423172767996,
    "train_r_std": 0.05534274277158711,
    "val_r_mean": 0.44763060141709604,
    "val_r_std": 0.15894195465037525,
    "n_nonzero_mean": 17.45,
    "n_nonzero_std": 3.412843389316304
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0028030972462147474,
    "right_subspace_overlap_bottom_k": 0.0004903459921479225,
    "interaction_matrix_overlap_top_k": 0.0005224839551374316,
    "interaction_matrix_overlap_bottom_k": 0.008815896697342396,
    "effective_rank": -0.000454981520306319,
    "effective_rank_mergeability_score": 0.0005226937355473638,
    "stable_rank": -0.0003909252700395882,
    "spectral_gap": 0.0005298836622387171,
    "singular_value_ratio": -0.0006090336246415973,
    "layerwise_effective_rank": -0.00011231003009015694,
    "layerwise_effective_rank_mergeability_score": 0.0001790237583918497,
    "task_vector_cosine_similarity": -0.0008003037655726075,
    "task_vector_l2_distance": -0.011536127887666225,
    "task_vector_dot_product": -0.0010758162243291736,
    "weight_space_angle": -7.76826636865735e-05,
    "task_vector_magnitude_ratio": -0.0009859405690804124,
    "singular_value_overlap": -0.00787513516843319,
    "subspace_overlap": 0.001652594655752182,
    "right_subspace_overlap": 0.003585358615964651,
    "activation_l2_distance": -0.0017347775865346193,
    "activation_cosine_similarity": 0.002635424956679344,
    "activation_magnitude_ratio": -0.0021983995102345943,
    "activation_dot_product": 0.001540964818559587,
    "encoder_gradient_cosine_similarity": 0.0011550105409696698,
    "encoder_gradient_l2_distance": -0.01664988324046135,
    "encoder_gradient_dot_product": 0.000519001972861588,
    "input_gradient_cosine_similarity": 0.00023654312826693058,
    "input_gradient_l2_distance": -0.017714932560920715,
    "input_gradient_dot_product": -0.0032727557700127363
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.003067811019718647,
    "right_subspace_overlap_bottom_k": 0.004936478100717068,
    "interaction_matrix_overlap_top_k": 0.0014241113094612956,
    "interaction_matrix_overlap_bottom_k": 0.003564826911315322,
    "effective_rank": 0.0008939383551478386,
    "effective_rank_mergeability_score": 0.0009914550464600325,
    "stable_rank": 0.000820521148853004,
    "spectral_gap": 0.0007799084996804595,
    "singular_value_ratio": 0.0008263746276497841,
    "layerwise_effective_rank": 0.0010042249923571944,
    "layerwise_effective_rank_mergeability_score": 0.0009583879727870226,
    "task_vector_cosine_similarity": 0.001886551035568118,
    "task_vector_l2_distance": 0.004114768002182245,
    "task_vector_dot_product": 0.0018538839649409056,
    "weight_space_angle": 0.0020573956426233053,
    "task_vector_magnitude_ratio": 0.0009510933887213469,
    "singular_value_overlap": 0.0030843899585306644,
    "subspace_overlap": 0.0024448151234537363,
    "right_subspace_overlap": 0.003706187242642045,
    "activation_l2_distance": 0.0018886368488892913,
    "activation_cosine_similarity": 0.0029842660296708345,
    "activation_magnitude_ratio": 0.002446080558001995,
    "activation_dot_product": 0.004189772997051477,
    "encoder_gradient_cosine_similarity": 0.0013420016039162874,
    "encoder_gradient_l2_distance": 0.0065916916355490685,
    "encoder_gradient_dot_product": 0.0010260860435664654,
    "input_gradient_cosine_similarity": 0.0013873182469978929,
    "input_gradient_l2_distance": 0.008349020965397358,
    "input_gradient_dot_product": 0.002887350507080555
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.85,
    "right_subspace_overlap_bottom_k": 0.55,
    "interaction_matrix_overlap_top_k": 0.6,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.25,
    "effective_rank_mergeability_score": 0.35,
    "stable_rank": 0.2,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.4,
    "layerwise_effective_rank": 0.2,
    "layerwise_effective_rank_mergeability_score": 0.15,
    "task_vector_cosine_similarity": 0.5,
    "task_vector_l2_distance": 1.0,
    "task_vector_dot_product": 0.75,
    "weight_space_angle": 0.55,
    "task_vector_magnitude_ratio": 0.55,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.6,
    "right_subspace_overlap": 0.8,
    "activation_l2_distance": 0.65,
    "activation_cosine_similarity": 0.7,
    "activation_magnitude_ratio": 0.55,
    "activation_dot_product": 0.6,
    "encoder_gradient_cosine_similarity": 0.6,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.35,
    "input_gradient_cosine_similarity": 0.5,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.85
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6180740509609756,
      "val_r": 0.5697157024299452,
      "n_iterations": 413,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025912015698850155,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.001850802218541503,
        "interaction_matrix_overlap_bottom_k": 0.013703127391636372,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0012978933518752456,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.004984332248568535,
        "task_vector_l2_distance": -0.011455300264060497,
        "task_vector_dot_product": -0.004625027533620596,
        "weight_space_angle": -0.0011668243678286672,
        "task_vector_magnitude_ratio": -0.0029435730539262295,
        "singular_value_overlap": -0.011220894753932953,
        "subspace_overlap": 0.005533314310014248,
        "right_subspace_overlap": 0.0021229018457233906,
        "activation_l2_distance": -0.00490214116871357,
        "activation_cosine_similarity": 0.0043952129781246185,
        "activation_magnitude_ratio": -0.0030675118323415518,
        "activation_dot_product": -0.0031750304624438286,
        "encoder_gradient_cosine_similarity": 0.0020073307678103447,
        "encoder_gradient_l2_distance": -0.014844807796180248,
        "encoder_gradient_dot_product": 0.0016714174998924136,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.015275994315743446,
        "input_gradient_dot_product": -0.0014901345130056143
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5530037731338635,
      "val_r": 0.4480554617012103,
      "n_iterations": 263,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005299021955579519,
        "right_subspace_overlap_bottom_k": 0.00918323639780283,
        "interaction_matrix_overlap_top_k": 0.0017932374030351639,
        "interaction_matrix_overlap_bottom_k": 0.007101086899638176,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.001670884434133768,
        "singular_value_ratio": -0.0011015268974006176,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0013613011687994003,
        "task_vector_l2_distance": -0.021293068304657936,
        "task_vector_dot_product": -0.0024362814147025347,
        "weight_space_angle": 0.001655402360484004,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.011078942567110062,
        "subspace_overlap": 0.0011637123534455895,
        "right_subspace_overlap": 0.011486200615763664,
        "activation_l2_distance": -0.004545020870864391,
        "activation_cosine_similarity": 0.008167557418346405,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.003101891838014126,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.03233359009027481,
        "encoder_gradient_dot_product": 0.0015757342334836721,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.04078017920255661,
        "input_gradient_dot_product": 0.0017023596446961164
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5938880577119328,
      "val_r": 0.5326124420722137,
      "n_iterations": 509,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00626923656091094,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.009760092943906784,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0010753237875178456,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009734059683978558,
        "task_vector_dot_product": -0.0031163825187832117,
        "weight_space_angle": -0.0018549347296357155,
        "task_vector_magnitude_ratio": -0.0017506986623629928,
        "singular_value_overlap": -0.009148070588707924,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0033904770389199257,
        "activation_l2_distance": -0.002922898158431053,
        "activation_cosine_similarity": 0.003187878057360649,
        "activation_magnitude_ratio": -0.004333951510488987,
        "activation_dot_product": 0.0012891010846942663,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013682209886610508,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01446079183369875,
        "input_gradient_dot_product": -0.0040163155645132065
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5576310828427178,
      "val_r": 0.44274717067207786,
      "n_iterations": 274,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.0017558863619342446,
        "interaction_matrix_overlap_top_k": -0.0010860721813514829,
        "interaction_matrix_overlap_bottom_k": 0.009966002777218819,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.001045015174895525,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.002106581348925829,
        "task_vector_l2_distance": -0.009376106783747673,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0019290063064545393,
        "singular_value_overlap": -0.008377136662602425,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0028619058430194855,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0031275073997676373,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0024589451495558023,
        "encoder_gradient_l2_distance": -0.010712896473705769,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01156396884471178,
        "input_gradient_dot_product": -0.002982771024107933
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5996700268457557,
      "val_r": 0.5378257155287615,
      "n_iterations": 288,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0033669748809188604,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.0015559939201921225,
        "interaction_matrix_overlap_bottom_k": 0.010958733037114143,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0010467363754287362,
        "singular_value_ratio": -0.001290816580876708,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.001644620206207037,
        "task_vector_l2_distance": -0.01293565146625042,
        "task_vector_dot_product": -0.0052776820957660675,
        "weight_space_angle": -0.0010852222330868244,
        "task_vector_magnitude_ratio": -0.0018712326418608427,
        "singular_value_overlap": -0.009386422112584114,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003171292133629322,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011280304752290249,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0020663058385252953,
        "input_gradient_l2_distance": -0.014173361472785473,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5682565025968028,
      "val_r": 0.700182021631748,
      "n_iterations": 227,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012698968639597297,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0013212927151471376,
        "interaction_matrix_overlap_bottom_k": 0.010989099740982056,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009764018468558788,
        "task_vector_dot_product": 0.0010261695133522153,
        "weight_space_angle": -0.002242692979052663,
        "task_vector_magnitude_ratio": -0.001686474191956222,
        "singular_value_overlap": -0.007381747011095285,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.001069747842848301,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0014326197560876608,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013281473889946938,
        "encoder_gradient_dot_product": 0.0017475341446697712,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.008017344400286674,
        "input_gradient_dot_product": -0.00499511044472456
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5637292220554269,
      "val_r": 0.09832021592144836,
      "n_iterations": 312,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002257884945720434,
        "right_subspace_overlap_bottom_k": 0.005898905452340841,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.00881099421530962,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0012296228669583797,
        "task_vector_l2_distance": -0.011332336813211441,
        "task_vector_dot_product": -0.0017710113897919655,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.00863081868737936,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0018596574664115906,
        "activation_l2_distance": -0.0011909845052286983,
        "activation_cosine_similarity": 0.004624588880687952,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0012100469321012497,
        "encoder_gradient_l2_distance": -0.018869707360863686,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.0028026695363223553,
        "input_gradient_l2_distance": -0.016840539872646332,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5359777945002492,
      "val_r": 0.2417519438454659,
      "n_iterations": 371,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0024138358421623707,
        "right_subspace_overlap_bottom_k": 0.0010972426971420646,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.010750856250524521,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01296668965369463,
        "task_vector_dot_product": -0.001235158764757216,
        "weight_space_angle": 0.0012883846648037434,
        "task_vector_magnitude_ratio": -0.0017859159270301461,
        "singular_value_overlap": -0.007205511908978224,
        "subspace_overlap": 0.004675840958952904,
        "right_subspace_overlap": 0.002247557742521167,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0017582315485924482,
        "activation_magnitude_ratio": -0.0014149498892948031,
        "activation_dot_product": 0.0010779963340610266,
        "encoder_gradient_cosine_similarity": 0.0024107815697789192,
        "encoder_gradient_l2_distance": -0.012344466522336006,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0014810537686571479,
        "input_gradient_l2_distance": -0.00581307802349329,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5306435373667916,
      "val_r": 0.42226760816373765,
      "n_iterations": 280,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006372908130288124,
        "right_subspace_overlap_bottom_k": -0.004079069010913372,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.008584539406001568,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0021788107696920633,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0016560384538024664,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0012206619139760733,
        "task_vector_l2_distance": -0.008314480073750019,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008661511354148388,
        "subspace_overlap": 0.00380483316257596,
        "right_subspace_overlap": 0.005803849082440138,
        "activation_l2_distance": -0.003230154048651457,
        "activation_cosine_similarity": 0.0016289826016873121,
        "activation_magnitude_ratio": -0.0088586350902915,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.002262020716443658,
        "encoder_gradient_l2_distance": -0.019343174993991852,
        "encoder_gradient_dot_product": 0.0014067620504647493,
        "input_gradient_cosine_similarity": 0.00124455732293427,
        "input_gradient_l2_distance": -0.01708904467523098,
        "input_gradient_dot_product": -0.005698848515748978
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4934394145064822,
      "val_r": 0.23030771673113648,
      "n_iterations": 202,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0018849847838282585,
        "right_subspace_overlap_bottom_k": -0.004817419685423374,
        "interaction_matrix_overlap_top_k": -0.0020810826681554317,
        "interaction_matrix_overlap_bottom_k": 0.006901550572365522,
        "effective_rank": -0.0016517462208867073,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0023971975315362215,
        "task_vector_l2_distance": -0.007594594266265631,
        "task_vector_dot_product": -0.0010407879017293453,
        "weight_space_angle": 0.0017087750602513552,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008830549195408821,
        "subspace_overlap": 0.007562167942523956,
        "right_subspace_overlap": 0.0026988808531314135,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.0020148465409874916,
        "activation_magnitude_ratio": -0.004539362154901028,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0016230803448706865,
        "encoder_gradient_l2_distance": -0.012935216538608074,
        "encoder_gradient_dot_product": 0.003610592568293214,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.017048172652721405,
        "input_gradient_dot_product": -0.005586983636021614
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5259409505326678,
      "val_r": 0.24490894094100873,
      "n_iterations": 270,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0024048895575106144,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.012457373552024364,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0017239571316167712,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010684722103178501,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.006503191776573658,
        "subspace_overlap": 0.0018446739995852113,
        "right_subspace_overlap": 0.0023592233192175627,
        "activation_l2_distance": -0.0035191038623452187,
        "activation_cosine_similarity": 0.005276487208902836,
        "activation_magnitude_ratio": -0.0026374992448836565,
        "activation_dot_product": 0.0023292938712984324,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.016549127176404,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.0012322269612923265,
        "input_gradient_l2_distance": -0.014573728665709496,
        "input_gradient_dot_product": -0.003661161055788398
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5373417834617251,
      "val_r": 0.40300571884931513,
      "n_iterations": 246,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005800649989396334,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.0010210494510829449,
        "interaction_matrix_overlap_bottom_k": 0.007865937426686287,
        "effective_rank": -0.0018672787118703127,
        "effective_rank_mergeability_score": 0.0015925299376249313,
        "stable_rank": -0.0017292345874011517,
        "spectral_gap": 0.001991115976125002,
        "singular_value_ratio": -0.0018630237318575382,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009514114819467068,
        "task_vector_dot_product": 0.0014904148411005735,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.002036771969869733,
        "singular_value_overlap": -0.008643779903650284,
        "subspace_overlap": 0.003172900527715683,
        "right_subspace_overlap": 0.0022965408861637115,
        "activation_l2_distance": -0.0018845407757908106,
        "activation_cosine_similarity": 0.0017240658635273576,
        "activation_magnitude_ratio": -0.004460501484572887,
        "activation_dot_product": 0.0034414397086948156,
        "encoder_gradient_cosine_similarity": 0.0038997577503323555,
        "encoder_gradient_l2_distance": -0.014896337874233723,
        "encoder_gradient_dot_product": -0.0010470146080479026,
        "input_gradient_cosine_similarity": 0.0012901341542601585,
        "input_gradient_l2_distance": -0.01682719960808754,
        "input_gradient_dot_product": -0.0030701656360179186
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5346878359573785,
      "val_r": 0.4178246258242257,
      "n_iterations": 372,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0023737442679703236,
        "right_subspace_overlap_bottom_k": 0.00179577455855906,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.010707186535000801,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0012485419865697622,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.002225802978500724,
        "task_vector_l2_distance": -0.009756104089319706,
        "task_vector_dot_product": -0.0019835284911096096,
        "weight_space_angle": -0.005975981242954731,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.007532523013651371,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0025259798858314753,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013350347056984901,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002246818970888853,
        "input_gradient_l2_distance": -0.01688302494585514,
        "input_gradient_dot_product": -0.005476631689816713
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5775014660482487,
      "val_r": 0.7056167519213473,
      "n_iterations": 260,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002461113967001438,
        "right_subspace_overlap_bottom_k": 0.003933696076273918,
        "interaction_matrix_overlap_top_k": 0.0026432503946125507,
        "interaction_matrix_overlap_bottom_k": 0.009421202354133129,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0018775924108922482,
        "stable_rank": -0.0012008303310722113,
        "spectral_gap": 0.00105118821375072,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0187627375125885,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.004829147830605507,
        "task_vector_magnitude_ratio": -0.0010939622297883034,
        "singular_value_overlap": -0.012115050107240677,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.003755392273887992,
        "activation_l2_distance": -0.0017992560751736164,
        "activation_cosine_similarity": 0.0056720152497291565,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0011950972257182002,
        "encoder_gradient_cosine_similarity": 0.002871211152523756,
        "encoder_gradient_l2_distance": -0.02368965744972229,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.001197035307995975,
        "input_gradient_l2_distance": -0.028053907677531242,
        "input_gradient_dot_product": -0.005214518867433071
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.553125014635638,
      "val_r": 0.5974703807181759,
      "n_iterations": 240,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004209619015455246,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0010667608585208654,
        "interaction_matrix_overlap_bottom_k": 0.004901506006717682,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0024309176951646805,
        "singular_value_ratio": -0.0025844494812190533,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.003619321621954441,
        "task_vector_l2_distance": -0.016736846417188644,
        "task_vector_dot_product": -0.0021864825394004583,
        "weight_space_angle": -0.0011690945830196142,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.012278140522539616,
        "subspace_overlap": 0.003481028601527214,
        "right_subspace_overlap": 0.011060098186135292,
        "activation_l2_distance": -0.005314438603818417,
        "activation_cosine_similarity": 0.00838241633027792,
        "activation_magnitude_ratio": -0.002529058838263154,
        "activation_dot_product": -0.002459646435454488,
        "encoder_gradient_cosine_similarity": -0.0013181365793570876,
        "encoder_gradient_l2_distance": -0.02412434294819832,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.029440024867653847,
        "input_gradient_dot_product": -0.0030148508958518505
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5870188809111748,
      "val_r": 0.3976643967322311,
      "n_iterations": 208,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0028502473141998053,
        "right_subspace_overlap_bottom_k": 0.010066690854728222,
        "interaction_matrix_overlap_top_k": 0.003371868748217821,
        "interaction_matrix_overlap_bottom_k": 0.0021019214764237404,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0022139435168355703,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.001056955079548061,
        "layerwise_effective_rank": 0.001415930804796517,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.014579412527382374,
        "task_vector_dot_product": -0.001267450861632824,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.005584617145359516,
        "subspace_overlap": -0.0015266051050275564,
        "right_subspace_overlap": 0.002102457918226719,
        "activation_l2_distance": 0.00149232754483819,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.005827720742672682,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.016661034896969795,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.001707547577098012,
        "input_gradient_l2_distance": -0.0129429055377841,
        "input_gradient_dot_product": -0.004515375476330519
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5348943106453159,
      "val_r": 0.43233557488152985,
      "n_iterations": 213,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0028318637050688267,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0015399992698803544,
        "interaction_matrix_overlap_bottom_k": 0.010690230876207352,
        "effective_rank": -0.0010792005341500044,
        "effective_rank_mergeability_score": 0.0016882349736988544,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009645210579037666,
        "task_vector_dot_product": 0.0010256454115733504,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.003587873186916113,
        "subspace_overlap": 0.002718030009418726,
        "right_subspace_overlap": 0.00406984519213438,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0011998547706753016,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.004721947014331818,
        "encoder_gradient_cosine_similarity": 0.0017431579763069749,
        "encoder_gradient_l2_distance": -0.009304019622504711,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010593226179480553,
        "input_gradient_dot_product": -0.0014672355027869344
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5586999842673284,
      "val_r": 0.4104740048628927,
      "n_iterations": 259,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.01146433874964714,
        "effective_rank": -0.0011079671094194055,
        "effective_rank_mergeability_score": 0.0017309833783656359,
        "stable_rank": 0.0,
        "spectral_gap": 0.0011089369654655457,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0017836313927546144,
        "layerwise_effective_rank_mergeability_score": 0.0016595909837633371,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009064048528671265,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0017588441260159016,
        "singular_value_overlap": -0.003984325565397739,
        "subspace_overlap": 0.0028767383191734552,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0014894700143486261,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0017801033100113273,
        "encoder_gradient_cosine_similarity": 0.0010607612784951925,
        "encoder_gradient_l2_distance": -0.007313823327422142,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01280833501368761,
        "input_gradient_dot_product": -0.002021968364715576
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7642331175113852,
      "val_r": 0.6951574649622094,
      "n_iterations": 240,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010874333791434765,
        "right_subspace_overlap_bottom_k": -0.014201279729604721,
        "interaction_matrix_overlap_top_k": 0.002606664551422,
        "interaction_matrix_overlap_bottom_k": -0.0018746597925201058,
        "effective_rank": -0.0033934377133846283,
        "effective_rank_mergeability_score": 0.0025991322472691536,
        "stable_rank": -0.002709629014134407,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003534538671374321,
        "layerwise_effective_rank_mergeability_score": 0.0036448414903134108,
        "task_vector_cosine_similarity": -0.004832164384424686,
        "task_vector_l2_distance": -0.002320024883374572,
        "task_vector_dot_product": -0.001875006128102541,
        "weight_space_angle": 0.0024593868292868137,
        "task_vector_magnitude_ratio": -0.0015089894877746701,
        "singular_value_overlap": 0.0012166521046310663,
        "subspace_overlap": -0.0022547421976923943,
        "right_subspace_overlap": 0.012522442266345024,
        "activation_l2_distance": -0.002863891888409853,
        "activation_cosine_similarity": 0.007273436989635229,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.01657721772789955,
        "encoder_gradient_cosine_similarity": 0.0028712530620396137,
        "encoder_gradient_l2_distance": -0.03180106729269028,
        "encoder_gradient_dot_product": 0.0014150140341371298,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03194541484117508,
        "input_gradient_dot_product": -0.011932282708585262
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6370895390441352,
      "val_r": 0.4243681699512402,
      "n_iterations": 349,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.002685029525309801,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.011056805960834026,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0021635624580085278,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.014893029816448689,
        "task_vector_dot_product": 0.0017562464345246553,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0013533404562622309,
        "singular_value_overlap": -0.008568275719881058,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.00714366789907217,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.01568005420267582,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0033414720091968775,
        "input_gradient_l2_distance": -0.01916840299963951,
        "input_gradient_dot_product": -0.002013114746659994
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.0,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}