{
  "weight_avg": {
    "aggregate_metrics": {
      "train_r": 0.45862220809299836,
      "train_p": 2.342416506584294e-167,
      "val_r": 0.3428637702189011,
      "val_p": 2.5969614126138596e-11
    },
    "per_fold_stats": {
      "train_r_mean": 0.720340186386959,
      "train_r_std": 0.06599608304768316,
      "val_r_mean": 0.5779734530769707,
      "val_r_std": 0.19911802713444862,
      "n_nonzero_mean": 18.15,
      "n_nonzero_std": 2.5937424698685874
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.004708465188741684,
      "right_subspace_overlap_bottom_k": -0.008010061457753181,
      "interaction_matrix_overlap_top_k": 0.0015117996372282505,
      "interaction_matrix_overlap_bottom_k": -0.00019290500495117158,
      "effective_rank": -0.000283978006336838,
      "effective_rank_mergeability_score": 0.0006323595298454165,
      "stable_rank": -0.0003956049622502178,
      "spectral_gap": 0.0002330624556634575,
      "singular_value_ratio": -0.0003000728029292077,
      "layerwise_effective_rank": -0.000856732833199203,
      "layerwise_effective_rank_mergeability_score": 0.000911047391127795,
      "task_vector_cosine_similarity": -0.0006947992369532585,
      "task_vector_l2_distance": -0.004098940175026655,
      "task_vector_dot_product": -0.0013496583560481668,
      "weight_space_angle": 0.000530845602042973,
      "task_vector_magnitude_ratio": -5.2877825510222465e-05,
      "singular_value_overlap": 0.0009850380010902882,
      "subspace_overlap": 0.00040016035200096667,
      "right_subspace_overlap": 0.004668528214097023,
      "activation_l2_distance": -0.0023866959381848574,
      "activation_cosine_similarity": 0.009782802313566208,
      "activation_magnitude_ratio": -0.0016007922822609544,
      "activation_dot_product": 0.0029884621035307646,
      "encoder_gradient_cosine_similarity": 0.0016119983047246933,
      "encoder_gradient_l2_distance": -0.025692543014883995,
      "encoder_gradient_dot_product": 0.0006849066121503711,
      "input_gradient_cosine_similarity": 0.0008259260794147849,
      "input_gradient_l2_distance": -0.02054845727980137,
      "input_gradient_dot_product": -0.0035039230715483427
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.003134737489745021,
      "right_subspace_overlap_bottom_k": 0.003873331705108285,
      "interaction_matrix_overlap_top_k": 0.0022193919867277145,
      "interaction_matrix_overlap_bottom_k": 0.001780700869858265,
      "effective_rank": 0.0006924796616658568,
      "effective_rank_mergeability_score": 0.0010346906492486596,
      "stable_rank": 0.0009219464845955372,
      "spectral_gap": 0.0005715602310374379,
      "singular_value_ratio": 0.0006091052200645208,
      "layerwise_effective_rank": 0.0012683514505624771,
      "layerwise_effective_rank_mergeability_score": 0.0011349187698215246,
      "task_vector_cosine_similarity": 0.0021343242842704058,
      "task_vector_l2_distance": 0.0030055013485252857,
      "task_vector_dot_product": 0.001533003174699843,
      "weight_space_angle": 0.002132633700966835,
      "task_vector_magnitude_ratio": 0.0008232959662564099,
      "singular_value_overlap": 0.0026589324697852135,
      "subspace_overlap": 0.0018979668384417892,
      "right_subspace_overlap": 0.003097441280260682,
      "activation_l2_distance": 0.003351302118971944,
      "activation_cosine_similarity": 0.005046244245022535,
      "activation_magnitude_ratio": 0.0023664399050176144,
      "activation_dot_product": 0.0052276779897511005,
      "encoder_gradient_cosine_similarity": 0.0020647828932851553,
      "encoder_gradient_l2_distance": 0.011126135475933552,
      "encoder_gradient_dot_product": 0.0010174321942031384,
      "input_gradient_cosine_similarity": 0.0015294657787308097,
      "input_gradient_l2_distance": 0.01357677485793829,
      "input_gradient_dot_product": 0.002385731553658843
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.9,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.6,
      "interaction_matrix_overlap_bottom_k": 0.75,
      "effective_rank": 0.15,
      "effective_rank_mergeability_score": 0.35,
      "stable_rank": 0.35,
      "spectral_gap": 0.15,
      "singular_value_ratio": 0.2,
      "layerwise_effective_rank": 0.4,
      "layerwise_effective_rank_mergeability_score": 0.5,
      "task_vector_cosine_similarity": 0.6,
      "task_vector_l2_distance": 0.9,
      "task_vector_dot_product": 0.6,
      "weight_space_angle": 0.55,
      "task_vector_magnitude_ratio": 0.35,
      "singular_value_overlap": 0.4,
      "subspace_overlap": 0.7,
      "right_subspace_overlap": 0.9,
      "activation_l2_distance": 0.75,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.9,
      "activation_dot_product": 0.75,
      "encoder_gradient_cosine_similarity": 0.75,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.45,
      "input_gradient_cosine_similarity": 0.4,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.8
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7142320952584036,
        "val_r": 0.5745901561715565,
        "n_iterations": 184,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0015505764167755842,
          "right_subspace_overlap_bottom_k": -0.0030455198138952255,
          "interaction_matrix_overlap_top_k": -0.001096482272259891,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.001764769316650927,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.001219011377543211,
          "task_vector_l2_distance": -0.006922009866684675,
          "task_vector_dot_product": -0.0011440652888268232,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0018811884801834822,
          "singular_value_overlap": -0.0024822596460580826,
          "subspace_overlap": 0.0026371534913778305,
          "right_subspace_overlap": 0.0035960637032985687,
          "activation_l2_distance": -0.010428403504192829,
          "activation_cosine_similarity": 0.011254296638071537,
          "activation_magnitude_ratio": -0.002598159946501255,
          "activation_dot_product": 0.0019810758531093597,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03631575033068657,
          "encoder_gradient_dot_product": 0.0016058655455708504,
          "input_gradient_cosine_similarity": 0.002502165036275983,
          "input_gradient_l2_distance": -0.0267636738717556,
          "input_gradient_dot_product": -0.005458910018205643
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7120543569915314,
        "val_r": 0.7345470694528385,
        "n_iterations": 201,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0017782171489670873,
          "interaction_matrix_overlap_top_k": 0.0013067340478301048,
          "interaction_matrix_overlap_bottom_k": -0.001181404571980238,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0013212535995990038,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0017322173807770014,
          "layerwise_effective_rank": -0.0010333836544305086,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0020167632028460503,
          "task_vector_dot_product": -0.002237907610833645,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0014868632424622774,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.002249185461550951,
          "right_subspace_overlap": 0.0026235952973365784,
          "activation_l2_distance": 0.00240729539655149,
          "activation_cosine_similarity": 0.012551973573863506,
          "activation_magnitude_ratio": -0.001923061441630125,
          "activation_dot_product": 0.0022060764022171497,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.023044977337121964,
          "encoder_gradient_dot_product": -0.001074282918125391,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010508600622415543,
          "input_gradient_dot_product": -0.006413630209863186
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7490220919379982,
        "val_r": 0.7453313871292506,
        "n_iterations": 352,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002335015218704939,
          "right_subspace_overlap_bottom_k": -0.004927630536258221,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0016286910977214575,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0015210808487609029,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010510787833482027,
          "task_vector_cosine_similarity": -0.0012538013979792595,
          "task_vector_l2_distance": -0.0029613724909722805,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0015555165009573102,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005444171838462353,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.012263309210538864,
          "activation_magnitude_ratio": -0.0015438786940649152,
          "activation_dot_product": -0.0010850277030840516,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.022303704172372818,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0025980209466069937,
          "input_gradient_l2_distance": -0.012941693887114525,
          "input_gradient_dot_product": -0.0022370892111212015
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6963257341040913,
        "val_r": 0.6990494955784806,
        "n_iterations": 362,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007211118936538696,
          "right_subspace_overlap_bottom_k": -0.01310938410460949,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0029290392994880676,
          "effective_rank": -0.002138542477041483,
          "effective_rank_mergeability_score": 0.002165574347600341,
          "stable_rank": -0.002230934565886855,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.001130574382841587,
          "layerwise_effective_rank": -0.002937863813713193,
          "layerwise_effective_rank_mergeability_score": 0.003198445774614811,
          "task_vector_cosine_similarity": -0.00263264705426991,
          "task_vector_l2_distance": -0.006533414125442505,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0024168952368199825,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0010653652716428041,
          "subspace_overlap": -0.0025370363146066666,
          "right_subspace_overlap": 0.0065771122463047504,
          "activation_l2_distance": -0.0015108167426660657,
          "activation_cosine_similarity": 0.011037271469831467,
          "activation_magnitude_ratio": -0.00744458707049489,
          "activation_dot_product": 0.018945403397083282,
          "encoder_gradient_cosine_similarity": -0.0021738128270953894,
          "encoder_gradient_l2_distance": -0.03698243945837021,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.04434309899806976,
          "input_gradient_dot_product": -0.004918564576655626
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7372174208162828,
        "val_r": 0.7753947697783279,
        "n_iterations": 346,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005462018772959709,
          "right_subspace_overlap_bottom_k": -0.007268066518008709,
          "interaction_matrix_overlap_top_k": -0.0012512210523709655,
          "interaction_matrix_overlap_bottom_k": 0.003868637839332223,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.003752325428649783,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004096112214028835,
          "activation_l2_distance": -0.004041851498186588,
          "activation_cosine_similarity": 0.00587376207113266,
          "activation_magnitude_ratio": -0.0038540896493941545,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0013166820863261819,
          "encoder_gradient_l2_distance": -0.014740494079887867,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0013467947719618678,
          "input_gradient_l2_distance": -0.01183545682579279,
          "input_gradient_dot_product": -0.0019522984512150288
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7429031056975902,
        "val_r": 0.7079855365335811,
        "n_iterations": 184,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003172781551256776,
          "right_subspace_overlap_bottom_k": -0.005626234225928783,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.001131538301706314,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0010951189324259758,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0014780198689550161,
          "layerwise_effective_rank": -0.001374860992655158,
          "layerwise_effective_rank_mergeability_score": 0.001274349633604288,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0031330029014497995,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0013606806751340628,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.003626270452514291,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.003600532654672861,
          "activation_cosine_similarity": 0.007075885310769081,
          "activation_magnitude_ratio": -0.0022692426573485136,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0028929715044796467,
          "encoder_gradient_l2_distance": -0.011354279704391956,
          "encoder_gradient_dot_product": 0.0014043329283595085,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008439039811491966,
          "input_gradient_dot_product": -0.0027027695905417204
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.711639841025607,
        "val_r": 0.44336522999881833,
        "n_iterations": 258,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010054366663098335,
          "right_subspace_overlap_bottom_k": -0.01615528203547001,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0015504604671150446,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.001319420407526195,
          "stable_rank": -0.001600738032720983,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0035055375192314386,
          "task_vector_l2_distance": -0.007660426199436188,
          "task_vector_dot_product": -0.0012952093966305256,
          "weight_space_angle": -0.0039044786244630814,
          "task_vector_magnitude_ratio": -0.0011620367877185345,
          "singular_value_overlap": 0.010733304545283318,
          "subspace_overlap": 0.004490875173360109,
          "right_subspace_overlap": 0.011563366279006004,
          "activation_l2_distance": -0.006445854436606169,
          "activation_cosine_similarity": 0.021804848685860634,
          "activation_magnitude_ratio": 0.005524040199816227,
          "activation_dot_product": 0.007254992611706257,
          "encoder_gradient_cosine_similarity": 0.005949615966528654,
          "encoder_gradient_l2_distance": -0.05869036540389061,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.059116534888744354,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6906306037295854,
        "val_r": 0.28008712394749946,
        "n_iterations": 182,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010399539023637772,
          "right_subspace_overlap_bottom_k": -0.008144683204591274,
          "interaction_matrix_overlap_top_k": 0.0018154419958591461,
          "interaction_matrix_overlap_bottom_k": 0.001551143010146916,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0011272861156612635,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0013704168377444148,
          "task_vector_l2_distance": -0.006208081729710102,
          "task_vector_dot_product": -0.0026863226667046547,
          "weight_space_angle": 0.0032166303135454655,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0010546661214902997,
          "right_subspace_overlap": 0.007008115760982037,
          "activation_l2_distance": -0.0035006124526262283,
          "activation_cosine_similarity": 0.010846312157809734,
          "activation_magnitude_ratio": -0.0015101071912795305,
          "activation_dot_product": 0.0024909661151468754,
          "encoder_gradient_cosine_similarity": 0.003228895366191864,
          "encoder_gradient_l2_distance": -0.026546437293291092,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.017432304099202156,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7421264779881397,
        "val_r": 0.32514149979641216,
        "n_iterations": 245,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006884252652525902,
          "right_subspace_overlap_bottom_k": -0.0129082715138793,
          "interaction_matrix_overlap_top_k": 0.00552317826077342,
          "interaction_matrix_overlap_bottom_k": -0.0013613314367830753,
          "effective_rank": -0.0021951664239168167,
          "effective_rank_mergeability_score": 0.004040190484374762,
          "stable_rank": -0.0022860351018607616,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0036802974063903093,
          "layerwise_effective_rank_mergeability_score": 0.0033415481448173523,
          "task_vector_cosine_similarity": -0.004138464108109474,
          "task_vector_l2_distance": -0.0038520931266248226,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0033449125476181507,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0010621591936796904,
          "right_subspace_overlap": 0.006382728461176157,
          "activation_l2_distance": -0.004896563943475485,
          "activation_cosine_similarity": 0.014415232464671135,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.003159543266519904,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.033173829317092896,
          "encoder_gradient_dot_product": 0.002110685920342803,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03022642992436886,
          "input_gradient_dot_product": -0.007203240878880024
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7092050424315637,
        "val_r": 0.6619421841626209,
        "n_iterations": 204,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007671755738556385,
          "right_subspace_overlap_bottom_k": -0.011548801325261593,
          "interaction_matrix_overlap_top_k": 0.007027201354503632,
          "interaction_matrix_overlap_bottom_k": -0.0028668236918747425,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0012139265891164541,
          "stable_rank": -0.001110621728003025,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0016721533611416817,
          "task_vector_cosine_similarity": -0.0033443481661379337,
          "task_vector_l2_distance": -0.009238621219992638,
          "task_vector_dot_product": -0.0028063426725566387,
          "weight_space_angle": 0.005879449192434549,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0018323555123060942,
          "right_subspace_overlap": 0.004517781548202038,
          "activation_l2_distance": 0.0015341260004788637,
          "activation_cosine_similarity": -0.002358352765440941,
          "activation_magnitude_ratio": -0.0017736625159159303,
          "activation_dot_product": -0.003683757269755006,
          "encoder_gradient_cosine_similarity": 0.0012695660116150975,
          "encoder_gradient_l2_distance": -0.03571387007832527,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.00220216391608119,
          "input_gradient_l2_distance": -0.036335378885269165,
          "input_gradient_dot_product": -0.0038228286430239677
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7548584089287705,
        "val_r": 0.15509635174227562,
        "n_iterations": 209,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005043752957135439,
          "right_subspace_overlap_bottom_k": -0.004038091283291578,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.001514483941718936,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0011927869636565447,
          "task_vector_l2_distance": -0.002915172139182687,
          "task_vector_dot_product": -0.0035294590052217245,
          "weight_space_angle": -0.0012348243035376072,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0022567424457520247,
          "activation_cosine_similarity": 0.010790357366204262,
          "activation_magnitude_ratio": -0.003243571612983942,
          "activation_dot_product": 0.0010443661594763398,
          "encoder_gradient_cosine_similarity": 0.0032466158736497164,
          "encoder_gradient_l2_distance": -0.01851687766611576,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.005240581929683685,
          "input_gradient_dot_product": -0.0028288690373301506
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7370003410753476,
        "val_r": 0.7195878714971773,
        "n_iterations": 402,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005679874215275049,
          "right_subspace_overlap_bottom_k": -0.0073757171630859375,
          "interaction_matrix_overlap_top_k": 0.0013404058991000056,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010896155145019293,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.001202290179207921,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.002638746751472354,
          "right_subspace_overlap": 0.0017428849823772907,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.011738738045096397,
          "activation_magnitude_ratio": -0.0023257285356521606,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.001752082840539515,
          "encoder_gradient_l2_distance": -0.024661622941493988,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.014047395437955856,
          "input_gradient_dot_product": -0.00256907707080245
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7191416390116987,
        "val_r": 0.7624549183763883,
        "n_iterations": 209,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0014541004784405231,
          "right_subspace_overlap_bottom_k": -0.00716800382360816,
          "interaction_matrix_overlap_top_k": 0.00117532501462847,
          "interaction_matrix_overlap_bottom_k": -0.002325912471860647,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0020177909173071384,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.004068927839398384,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0017483500996604562,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0015317999059334397,
          "right_subspace_overlap": 0.004004692658782005,
          "activation_l2_distance": -0.005424811039119959,
          "activation_cosine_similarity": 0.011370365507900715,
          "activation_magnitude_ratio": -0.0010379136074334383,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.005966357886791229,
          "encoder_gradient_l2_distance": -0.025538237765431404,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.004050276707857847,
          "input_gradient_l2_distance": -0.020463602617383003,
          "input_gradient_dot_product": -0.007505952846258879
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.712521014522835,
        "val_r": 0.7548653927281552,
        "n_iterations": 286,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005539420526474714,
          "right_subspace_overlap_bottom_k": -0.0058557442389428616,
          "interaction_matrix_overlap_top_k": 0.003372043138369918,
          "interaction_matrix_overlap_bottom_k": -0.0024496472906321287,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0015103832120075822,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0013504627859219909,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.001185794360935688,
          "singular_value_overlap": 0.0026224192697554827,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004216058179736137,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01045199204236269,
          "activation_magnitude_ratio": -0.0017180072609335184,
          "activation_dot_product": 0.003187564667314291,
          "encoder_gradient_cosine_similarity": 0.0029253684915602207,
          "encoder_gradient_l2_distance": -0.015568162314593792,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.009246883913874626,
          "input_gradient_dot_product": -0.0041497377678751945
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7308353472578193,
        "val_r": 0.7465830213193351,
        "n_iterations": 314,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0019079695921391249,
          "right_subspace_overlap_bottom_k": -0.010504363104701042,
          "interaction_matrix_overlap_top_k": 0.003439404536038637,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.001291878055781126,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.004172000102698803,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0016610368620604277,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.00198942213319242,
          "right_subspace_overlap": 0.00525627238675952,
          "activation_l2_distance": -0.004582843277603388,
          "activation_cosine_similarity": 0.016771679744124413,
          "activation_magnitude_ratio": -0.0016637388616800308,
          "activation_dot_product": -0.0019748916383832693,
          "encoder_gradient_cosine_similarity": 0.0013073517475277185,
          "encoder_gradient_l2_distance": -0.029658062383532524,
          "encoder_gradient_dot_product": 0.002269571181386709,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.026318933814764023,
          "input_gradient_dot_product": -0.0034264251589775085
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7578084573307552,
        "val_r": 0.2713992810916517,
        "n_iterations": 254,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003711894853040576,
          "right_subspace_overlap_bottom_k": -0.006183141376823187,
          "interaction_matrix_overlap_top_k": 0.0029463947284966707,
          "interaction_matrix_overlap_bottom_k": 0.001910249819047749,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0010449578985571861,
          "task_vector_l2_distance": -0.0031339118722826242,
          "task_vector_dot_product": -0.0033547827042639256,
          "weight_space_angle": 0.0026013997849076986,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.004189696162939072,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0050026290118694305,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.00552396010607481,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0015798253007233143,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.015431406907737255,
          "encoder_gradient_dot_product": 0.0021611482370644808,
          "input_gradient_cosine_similarity": 0.0021344893611967564,
          "input_gradient_l2_distance": -0.007154466118663549,
          "input_gradient_dot_product": -0.006301587913185358
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7498605563649172,
        "val_r": 0.7163676589405585,
        "n_iterations": 239,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00916201714426279,
          "right_subspace_overlap_bottom_k": -0.007592316251248121,
          "interaction_matrix_overlap_top_k": 0.004637566860765219,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.001154064666479826,
          "layerwise_effective_rank_mergeability_score": 0.0010019266046583652,
          "task_vector_cosine_similarity": -0.001023646560497582,
          "task_vector_l2_distance": -0.006232148967683315,
          "task_vector_dot_product": -0.0033140024170279503,
          "weight_space_angle": 0.001857350580394268,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0012373242061585188,
          "right_subspace_overlap": 0.004218777641654015,
          "activation_l2_distance": -0.0025808727368712425,
          "activation_cosine_similarity": 0.005291348788887262,
          "activation_magnitude_ratio": -0.0015171397244557738,
          "activation_dot_product": 0.006660662591457367,
          "encoder_gradient_cosine_similarity": 0.002311134710907936,
          "encoder_gradient_l2_distance": -0.021714840084314346,
          "encoder_gradient_dot_product": 0.002462234813719988,
          "input_gradient_cosine_similarity": 0.0038369635585695505,
          "input_gradient_l2_distance": -0.018113460391759872,
          "input_gradient_dot_product": -0.0058984821662306786
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.45753214345728044,
        "val_r": 0.32041893222130086,
        "n_iterations": 409,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.009452849626541138,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.001109507866203785,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0014869080623611808,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003928965888917446,
          "layerwise_effective_rank_mergeability_score": 0.0012053628452122211,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0027589979581534863,
          "task_vector_dot_product": -0.0032498687505722046,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0011452873004600406,
          "singular_value_overlap": -0.0011619104770943522,
          "subspace_overlap": -0.0012793560745194554,
          "right_subspace_overlap": 0.0028976015746593475,
          "activation_l2_distance": 0.0036557884886860847,
          "activation_cosine_similarity": 0.004957815166562796,
          "activation_magnitude_ratio": -0.003330943640321493,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.001994813559576869,
          "encoder_gradient_l2_distance": -0.008795679546892643,
          "encoder_gradient_dot_product": 0.0010355694685131311,
          "input_gradient_cosine_similarity": 0.002251974307000637,
          "input_gradient_l2_distance": -0.0066670202650129795,
          "input_gradient_dot_product": -0.0026889946311712265
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7787317134713179,
        "val_r": 0.4828688427270315,
        "n_iterations": 500,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005563536658883095,
          "right_subspace_overlap_bottom_k": -0.014120806939899921,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0013496499741449952,
          "effective_rank": -0.0013458512257784605,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0019460555631667376,
          "layerwise_effective_rank_mergeability_score": 0.003236202523112297,
          "task_vector_cosine_similarity": -0.0065154219046235085,
          "task_vector_l2_distance": -0.0026554642245173454,
          "task_vector_dot_product": -0.0013378177536651492,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0031786286272108555,
          "subspace_overlap": -0.0012030813377350569,
          "right_subspace_overlap": 0.012472288683056831,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.010225385427474976,
          "activation_magnitude_ratio": -0.0010984826367348433,
          "activation_dot_product": 0.00400898139923811,
          "encoder_gradient_cosine_similarity": 0.0018792040646076202,
          "encoder_gradient_l2_distance": -0.02201945148408413,
          "encoder_gradient_dot_product": 0.0017230070661753416,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01877264678478241,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8031573363376444,
        "val_r": 0.6823923383461539,
        "n_iterations": 242,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0013653264613822103,
          "right_subspace_overlap_bottom_k": -0.003398091997951269,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0011565500171855092,
          "singular_value_ratio": -0.0016606446588411927,
          "layerwise_effective_rank": -0.001079166424460709,
          "layerwise_effective_rank_mergeability_score": 0.0011502656852826476,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009282066486775875,
          "task_vector_dot_product": -0.0033878525719046593,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0015326421707868576,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0017503122799098492,
          "activation_l2_distance": -0.006061220541596413,
          "activation_cosine_similarity": 0.003769893432036042,
          "activation_magnitude_ratio": 0.0013124305987730622,
          "activation_dot_product": 0.013993466272950172,
          "encoder_gradient_cosine_similarity": -0.0016268800245597959,
          "encoder_gradient_l2_distance": -0.03308041766285896,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.027001911774277687,
          "input_gradient_dot_product": 0.0
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.0,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_r": 0.4147937331012865,
      "train_p": 3.2574223455771243e-134,
      "val_r": 0.020843985235486483,
      "val_p": 0.6942824418649248
    },
    "per_fold_stats": {
      "train_r_mean": 0.5712423172767996,
      "train_r_std": 0.05534274277158711,
      "val_r_mean": 0.44763060141709604,
      "val_r_std": 0.15894195465037525,
      "n_nonzero_mean": 17.45,
      "n_nonzero_std": 3.412843389316304
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0028030972462147474,
      "right_subspace_overlap_bottom_k": 0.0004903459921479225,
      "interaction_matrix_overlap_top_k": 0.0005224839551374316,
      "interaction_matrix_overlap_bottom_k": 0.008815896697342396,
      "effective_rank": -0.000454981520306319,
      "effective_rank_mergeability_score": 0.0005226937355473638,
      "stable_rank": -0.0003909252700395882,
      "spectral_gap": 0.0005298836622387171,
      "singular_value_ratio": -0.0006090336246415973,
      "layerwise_effective_rank": -0.00011231003009015694,
      "layerwise_effective_rank_mergeability_score": 0.0001790237583918497,
      "task_vector_cosine_similarity": -0.0008003037655726075,
      "task_vector_l2_distance": -0.011536127887666225,
      "task_vector_dot_product": -0.0010758162243291736,
      "weight_space_angle": -7.76826636865735e-05,
      "task_vector_magnitude_ratio": -0.0009859405690804124,
      "singular_value_overlap": -0.00787513516843319,
      "subspace_overlap": 0.001652594655752182,
      "right_subspace_overlap": 0.003585358615964651,
      "activation_l2_distance": -0.0017347775865346193,
      "activation_cosine_similarity": 0.002635424956679344,
      "activation_magnitude_ratio": -0.0021983995102345943,
      "activation_dot_product": 0.001540964818559587,
      "encoder_gradient_cosine_similarity": 0.0011550105409696698,
      "encoder_gradient_l2_distance": -0.01664988324046135,
      "encoder_gradient_dot_product": 0.000519001972861588,
      "input_gradient_cosine_similarity": 0.00023654312826693058,
      "input_gradient_l2_distance": -0.017714932560920715,
      "input_gradient_dot_product": -0.0032727557700127363
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.003067811019718647,
      "right_subspace_overlap_bottom_k": 0.004936478100717068,
      "interaction_matrix_overlap_top_k": 0.0014241113094612956,
      "interaction_matrix_overlap_bottom_k": 0.003564826911315322,
      "effective_rank": 0.0008939383551478386,
      "effective_rank_mergeability_score": 0.0009914550464600325,
      "stable_rank": 0.000820521148853004,
      "spectral_gap": 0.0007799084996804595,
      "singular_value_ratio": 0.0008263746276497841,
      "layerwise_effective_rank": 0.0010042249923571944,
      "layerwise_effective_rank_mergeability_score": 0.0009583879727870226,
      "task_vector_cosine_similarity": 0.001886551035568118,
      "task_vector_l2_distance": 0.004114768002182245,
      "task_vector_dot_product": 0.0018538839649409056,
      "weight_space_angle": 0.0020573956426233053,
      "task_vector_magnitude_ratio": 0.0009510933887213469,
      "singular_value_overlap": 0.0030843899585306644,
      "subspace_overlap": 0.0024448151234537363,
      "right_subspace_overlap": 0.003706187242642045,
      "activation_l2_distance": 0.0018886368488892913,
      "activation_cosine_similarity": 0.0029842660296708345,
      "activation_magnitude_ratio": 0.002446080558001995,
      "activation_dot_product": 0.004189772997051477,
      "encoder_gradient_cosine_similarity": 0.0013420016039162874,
      "encoder_gradient_l2_distance": 0.0065916916355490685,
      "encoder_gradient_dot_product": 0.0010260860435664654,
      "input_gradient_cosine_similarity": 0.0013873182469978929,
      "input_gradient_l2_distance": 0.008349020965397358,
      "input_gradient_dot_product": 0.002887350507080555
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.85,
      "right_subspace_overlap_bottom_k": 0.55,
      "interaction_matrix_overlap_top_k": 0.6,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.25,
      "effective_rank_mergeability_score": 0.35,
      "stable_rank": 0.2,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.4,
      "layerwise_effective_rank": 0.2,
      "layerwise_effective_rank_mergeability_score": 0.15,
      "task_vector_cosine_similarity": 0.5,
      "task_vector_l2_distance": 1.0,
      "task_vector_dot_product": 0.75,
      "weight_space_angle": 0.55,
      "task_vector_magnitude_ratio": 0.55,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.6,
      "right_subspace_overlap": 0.8,
      "activation_l2_distance": 0.65,
      "activation_cosine_similarity": 0.7,
      "activation_magnitude_ratio": 0.55,
      "activation_dot_product": 0.6,
      "encoder_gradient_cosine_similarity": 0.6,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.35,
      "input_gradient_cosine_similarity": 0.5,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.85
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6180740509609756,
        "val_r": 0.5697157024299452,
        "n_iterations": 413,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025912015698850155,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.001850802218541503,
          "interaction_matrix_overlap_bottom_k": 0.013703127391636372,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0012978933518752456,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.004984332248568535,
          "task_vector_l2_distance": -0.011455300264060497,
          "task_vector_dot_product": -0.004625027533620596,
          "weight_space_angle": -0.0011668243678286672,
          "task_vector_magnitude_ratio": -0.0029435730539262295,
          "singular_value_overlap": -0.011220894753932953,
          "subspace_overlap": 0.005533314310014248,
          "right_subspace_overlap": 0.0021229018457233906,
          "activation_l2_distance": -0.00490214116871357,
          "activation_cosine_similarity": 0.0043952129781246185,
          "activation_magnitude_ratio": -0.0030675118323415518,
          "activation_dot_product": -0.0031750304624438286,
          "encoder_gradient_cosine_similarity": 0.0020073307678103447,
          "encoder_gradient_l2_distance": -0.014844807796180248,
          "encoder_gradient_dot_product": 0.0016714174998924136,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015275994315743446,
          "input_gradient_dot_product": -0.0014901345130056143
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5530037731338635,
        "val_r": 0.4480554617012103,
        "n_iterations": 263,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005299021955579519,
          "right_subspace_overlap_bottom_k": 0.00918323639780283,
          "interaction_matrix_overlap_top_k": 0.0017932374030351639,
          "interaction_matrix_overlap_bottom_k": 0.007101086899638176,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.001670884434133768,
          "singular_value_ratio": -0.0011015268974006176,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0013613011687994003,
          "task_vector_l2_distance": -0.021293068304657936,
          "task_vector_dot_product": -0.0024362814147025347,
          "weight_space_angle": 0.001655402360484004,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.011078942567110062,
          "subspace_overlap": 0.0011637123534455895,
          "right_subspace_overlap": 0.011486200615763664,
          "activation_l2_distance": -0.004545020870864391,
          "activation_cosine_similarity": 0.008167557418346405,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.003101891838014126,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03233359009027481,
          "encoder_gradient_dot_product": 0.0015757342334836721,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.04078017920255661,
          "input_gradient_dot_product": 0.0017023596446961164
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5938880577119328,
        "val_r": 0.5326124420722137,
        "n_iterations": 509,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00626923656091094,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.009760092943906784,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0010753237875178456,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009734059683978558,
          "task_vector_dot_product": -0.0031163825187832117,
          "weight_space_angle": -0.0018549347296357155,
          "task_vector_magnitude_ratio": -0.0017506986623629928,
          "singular_value_overlap": -0.009148070588707924,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0033904770389199257,
          "activation_l2_distance": -0.002922898158431053,
          "activation_cosine_similarity": 0.003187878057360649,
          "activation_magnitude_ratio": -0.004333951510488987,
          "activation_dot_product": 0.0012891010846942663,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013682209886610508,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01446079183369875,
          "input_gradient_dot_product": -0.0040163155645132065
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5576310828427178,
        "val_r": 0.44274717067207786,
        "n_iterations": 274,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0017558863619342446,
          "interaction_matrix_overlap_top_k": -0.0010860721813514829,
          "interaction_matrix_overlap_bottom_k": 0.009966002777218819,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.001045015174895525,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.002106581348925829,
          "task_vector_l2_distance": -0.009376106783747673,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0019290063064545393,
          "singular_value_overlap": -0.008377136662602425,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0028619058430194855,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0031275073997676373,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0024589451495558023,
          "encoder_gradient_l2_distance": -0.010712896473705769,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01156396884471178,
          "input_gradient_dot_product": -0.002982771024107933
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5996700268457557,
        "val_r": 0.5378257155287615,
        "n_iterations": 288,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0033669748809188604,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.0015559939201921225,
          "interaction_matrix_overlap_bottom_k": 0.010958733037114143,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0010467363754287362,
          "singular_value_ratio": -0.001290816580876708,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.001644620206207037,
          "task_vector_l2_distance": -0.01293565146625042,
          "task_vector_dot_product": -0.0052776820957660675,
          "weight_space_angle": -0.0010852222330868244,
          "task_vector_magnitude_ratio": -0.0018712326418608427,
          "singular_value_overlap": -0.009386422112584114,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003171292133629322,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.011280304752290249,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0020663058385252953,
          "input_gradient_l2_distance": -0.014173361472785473,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5682565025968028,
        "val_r": 0.700182021631748,
        "n_iterations": 227,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012698968639597297,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0013212927151471376,
          "interaction_matrix_overlap_bottom_k": 0.010989099740982056,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009764018468558788,
          "task_vector_dot_product": 0.0010261695133522153,
          "weight_space_angle": -0.002242692979052663,
          "task_vector_magnitude_ratio": -0.001686474191956222,
          "singular_value_overlap": -0.007381747011095285,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.001069747842848301,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0014326197560876608,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013281473889946938,
          "encoder_gradient_dot_product": 0.0017475341446697712,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008017344400286674,
          "input_gradient_dot_product": -0.00499511044472456
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5637292220554269,
        "val_r": 0.09832021592144836,
        "n_iterations": 312,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002257884945720434,
          "right_subspace_overlap_bottom_k": 0.005898905452340841,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.00881099421530962,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0012296228669583797,
          "task_vector_l2_distance": -0.011332336813211441,
          "task_vector_dot_product": -0.0017710113897919655,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.00863081868737936,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0018596574664115906,
          "activation_l2_distance": -0.0011909845052286983,
          "activation_cosine_similarity": 0.004624588880687952,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0012100469321012497,
          "encoder_gradient_l2_distance": -0.018869707360863686,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.0028026695363223553,
          "input_gradient_l2_distance": -0.016840539872646332,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5359777945002492,
        "val_r": 0.2417519438454659,
        "n_iterations": 371,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0024138358421623707,
          "right_subspace_overlap_bottom_k": 0.0010972426971420646,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.010750856250524521,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01296668965369463,
          "task_vector_dot_product": -0.001235158764757216,
          "weight_space_angle": 0.0012883846648037434,
          "task_vector_magnitude_ratio": -0.0017859159270301461,
          "singular_value_overlap": -0.007205511908978224,
          "subspace_overlap": 0.004675840958952904,
          "right_subspace_overlap": 0.002247557742521167,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0017582315485924482,
          "activation_magnitude_ratio": -0.0014149498892948031,
          "activation_dot_product": 0.0010779963340610266,
          "encoder_gradient_cosine_similarity": 0.0024107815697789192,
          "encoder_gradient_l2_distance": -0.012344466522336006,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0014810537686571479,
          "input_gradient_l2_distance": -0.00581307802349329,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5306435373667916,
        "val_r": 0.42226760816373765,
        "n_iterations": 280,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006372908130288124,
          "right_subspace_overlap_bottom_k": -0.004079069010913372,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.008584539406001568,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0021788107696920633,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0016560384538024664,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0012206619139760733,
          "task_vector_l2_distance": -0.008314480073750019,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008661511354148388,
          "subspace_overlap": 0.00380483316257596,
          "right_subspace_overlap": 0.005803849082440138,
          "activation_l2_distance": -0.003230154048651457,
          "activation_cosine_similarity": 0.0016289826016873121,
          "activation_magnitude_ratio": -0.0088586350902915,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.002262020716443658,
          "encoder_gradient_l2_distance": -0.019343174993991852,
          "encoder_gradient_dot_product": 0.0014067620504647493,
          "input_gradient_cosine_similarity": 0.00124455732293427,
          "input_gradient_l2_distance": -0.01708904467523098,
          "input_gradient_dot_product": -0.005698848515748978
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.4934394145064822,
        "val_r": 0.23030771673113648,
        "n_iterations": 202,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0018849847838282585,
          "right_subspace_overlap_bottom_k": -0.004817419685423374,
          "interaction_matrix_overlap_top_k": -0.0020810826681554317,
          "interaction_matrix_overlap_bottom_k": 0.006901550572365522,
          "effective_rank": -0.0016517462208867073,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0023971975315362215,
          "task_vector_l2_distance": -0.007594594266265631,
          "task_vector_dot_product": -0.0010407879017293453,
          "weight_space_angle": 0.0017087750602513552,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.008830549195408821,
          "subspace_overlap": 0.007562167942523956,
          "right_subspace_overlap": 0.0026988808531314135,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.0020148465409874916,
          "activation_magnitude_ratio": -0.004539362154901028,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0016230803448706865,
          "encoder_gradient_l2_distance": -0.012935216538608074,
          "encoder_gradient_dot_product": 0.003610592568293214,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.017048172652721405,
          "input_gradient_dot_product": -0.005586983636021614
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5259409505326678,
        "val_r": 0.24490894094100873,
        "n_iterations": 270,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0024048895575106144,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.012457373552024364,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0017239571316167712,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010684722103178501,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.006503191776573658,
          "subspace_overlap": 0.0018446739995852113,
          "right_subspace_overlap": 0.0023592233192175627,
          "activation_l2_distance": -0.0035191038623452187,
          "activation_cosine_similarity": 0.005276487208902836,
          "activation_magnitude_ratio": -0.0026374992448836565,
          "activation_dot_product": 0.0023292938712984324,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.016549127176404,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.0012322269612923265,
          "input_gradient_l2_distance": -0.014573728665709496,
          "input_gradient_dot_product": -0.003661161055788398
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5373417834617251,
        "val_r": 0.40300571884931513,
        "n_iterations": 246,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005800649989396334,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.0010210494510829449,
          "interaction_matrix_overlap_bottom_k": 0.007865937426686287,
          "effective_rank": -0.0018672787118703127,
          "effective_rank_mergeability_score": 0.0015925299376249313,
          "stable_rank": -0.0017292345874011517,
          "spectral_gap": 0.001991115976125002,
          "singular_value_ratio": -0.0018630237318575382,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009514114819467068,
          "task_vector_dot_product": 0.0014904148411005735,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.002036771969869733,
          "singular_value_overlap": -0.008643779903650284,
          "subspace_overlap": 0.003172900527715683,
          "right_subspace_overlap": 0.0022965408861637115,
          "activation_l2_distance": -0.0018845407757908106,
          "activation_cosine_similarity": 0.0017240658635273576,
          "activation_magnitude_ratio": -0.004460501484572887,
          "activation_dot_product": 0.0034414397086948156,
          "encoder_gradient_cosine_similarity": 0.0038997577503323555,
          "encoder_gradient_l2_distance": -0.014896337874233723,
          "encoder_gradient_dot_product": -0.0010470146080479026,
          "input_gradient_cosine_similarity": 0.0012901341542601585,
          "input_gradient_l2_distance": -0.01682719960808754,
          "input_gradient_dot_product": -0.0030701656360179186
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5346878359573785,
        "val_r": 0.4178246258242257,
        "n_iterations": 372,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0023737442679703236,
          "right_subspace_overlap_bottom_k": 0.00179577455855906,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.010707186535000801,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0012485419865697622,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.002225802978500724,
          "task_vector_l2_distance": -0.009756104089319706,
          "task_vector_dot_product": -0.0019835284911096096,
          "weight_space_angle": -0.005975981242954731,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.007532523013651371,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0025259798858314753,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013350347056984901,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002246818970888853,
          "input_gradient_l2_distance": -0.01688302494585514,
          "input_gradient_dot_product": -0.005476631689816713
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5775014660482487,
        "val_r": 0.7056167519213473,
        "n_iterations": 260,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002461113967001438,
          "right_subspace_overlap_bottom_k": 0.003933696076273918,
          "interaction_matrix_overlap_top_k": 0.0026432503946125507,
          "interaction_matrix_overlap_bottom_k": 0.009421202354133129,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0018775924108922482,
          "stable_rank": -0.0012008303310722113,
          "spectral_gap": 0.00105118821375072,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0187627375125885,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.004829147830605507,
          "task_vector_magnitude_ratio": -0.0010939622297883034,
          "singular_value_overlap": -0.012115050107240677,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.003755392273887992,
          "activation_l2_distance": -0.0017992560751736164,
          "activation_cosine_similarity": 0.0056720152497291565,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0011950972257182002,
          "encoder_gradient_cosine_similarity": 0.002871211152523756,
          "encoder_gradient_l2_distance": -0.02368965744972229,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.001197035307995975,
          "input_gradient_l2_distance": -0.028053907677531242,
          "input_gradient_dot_product": -0.005214518867433071
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.553125014635638,
        "val_r": 0.5974703807181759,
        "n_iterations": 240,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004209619015455246,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0010667608585208654,
          "interaction_matrix_overlap_bottom_k": 0.004901506006717682,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0024309176951646805,
          "singular_value_ratio": -0.0025844494812190533,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.003619321621954441,
          "task_vector_l2_distance": -0.016736846417188644,
          "task_vector_dot_product": -0.0021864825394004583,
          "weight_space_angle": -0.0011690945830196142,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.012278140522539616,
          "subspace_overlap": 0.003481028601527214,
          "right_subspace_overlap": 0.011060098186135292,
          "activation_l2_distance": -0.005314438603818417,
          "activation_cosine_similarity": 0.00838241633027792,
          "activation_magnitude_ratio": -0.002529058838263154,
          "activation_dot_product": -0.002459646435454488,
          "encoder_gradient_cosine_similarity": -0.0013181365793570876,
          "encoder_gradient_l2_distance": -0.02412434294819832,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.029440024867653847,
          "input_gradient_dot_product": -0.0030148508958518505
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5870188809111748,
        "val_r": 0.3976643967322311,
        "n_iterations": 208,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0028502473141998053,
          "right_subspace_overlap_bottom_k": 0.010066690854728222,
          "interaction_matrix_overlap_top_k": 0.003371868748217821,
          "interaction_matrix_overlap_bottom_k": 0.0021019214764237404,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0022139435168355703,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.001056955079548061,
          "layerwise_effective_rank": 0.001415930804796517,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.014579412527382374,
          "task_vector_dot_product": -0.001267450861632824,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.005584617145359516,
          "subspace_overlap": -0.0015266051050275564,
          "right_subspace_overlap": 0.002102457918226719,
          "activation_l2_distance": 0.00149232754483819,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.005827720742672682,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.016661034896969795,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.001707547577098012,
          "input_gradient_l2_distance": -0.0129429055377841,
          "input_gradient_dot_product": -0.004515375476330519
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5348943106453159,
        "val_r": 0.43233557488152985,
        "n_iterations": 213,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0028318637050688267,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0015399992698803544,
          "interaction_matrix_overlap_bottom_k": 0.010690230876207352,
          "effective_rank": -0.0010792005341500044,
          "effective_rank_mergeability_score": 0.0016882349736988544,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009645210579037666,
          "task_vector_dot_product": 0.0010256454115733504,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.003587873186916113,
          "subspace_overlap": 0.002718030009418726,
          "right_subspace_overlap": 0.00406984519213438,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0011998547706753016,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.004721947014331818,
          "encoder_gradient_cosine_similarity": 0.0017431579763069749,
          "encoder_gradient_l2_distance": -0.009304019622504711,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010593226179480553,
          "input_gradient_dot_product": -0.0014672355027869344
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5586999842673284,
        "val_r": 0.4104740048628927,
        "n_iterations": 259,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.01146433874964714,
          "effective_rank": -0.0011079671094194055,
          "effective_rank_mergeability_score": 0.0017309833783656359,
          "stable_rank": 0.0,
          "spectral_gap": 0.0011089369654655457,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0017836313927546144,
          "layerwise_effective_rank_mergeability_score": 0.0016595909837633371,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009064048528671265,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0017588441260159016,
          "singular_value_overlap": -0.003984325565397739,
          "subspace_overlap": 0.0028767383191734552,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0014894700143486261,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0017801033100113273,
          "encoder_gradient_cosine_similarity": 0.0010607612784951925,
          "encoder_gradient_l2_distance": -0.007313823327422142,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01280833501368761,
          "input_gradient_dot_product": -0.002021968364715576
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7642331175113852,
        "val_r": 0.6951574649622094,
        "n_iterations": 240,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010874333791434765,
          "right_subspace_overlap_bottom_k": -0.014201279729604721,
          "interaction_matrix_overlap_top_k": 0.002606664551422,
          "interaction_matrix_overlap_bottom_k": -0.0018746597925201058,
          "effective_rank": -0.0033934377133846283,
          "effective_rank_mergeability_score": 0.0025991322472691536,
          "stable_rank": -0.002709629014134407,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003534538671374321,
          "layerwise_effective_rank_mergeability_score": 0.0036448414903134108,
          "task_vector_cosine_similarity": -0.004832164384424686,
          "task_vector_l2_distance": -0.002320024883374572,
          "task_vector_dot_product": -0.001875006128102541,
          "weight_space_angle": 0.0024593868292868137,
          "task_vector_magnitude_ratio": -0.0015089894877746701,
          "singular_value_overlap": 0.0012166521046310663,
          "subspace_overlap": -0.0022547421976923943,
          "right_subspace_overlap": 0.012522442266345024,
          "activation_l2_distance": -0.002863891888409853,
          "activation_cosine_similarity": 0.007273436989635229,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.01657721772789955,
          "encoder_gradient_cosine_similarity": 0.0028712530620396137,
          "encoder_gradient_l2_distance": -0.03180106729269028,
          "encoder_gradient_dot_product": 0.0014150140341371298,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03194541484117508,
          "input_gradient_dot_product": -0.011932282708585262
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6370895390441352,
        "val_r": 0.4243681699512402,
        "n_iterations": 349,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.002685029525309801,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.011056805960834026,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0021635624580085278,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.014893029816448689,
          "task_vector_dot_product": 0.0017562464345246553,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0013533404562622309,
          "singular_value_overlap": -0.008568275719881058,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.00714366789907217,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.01568005420267582,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0033414720091968775,
          "input_gradient_l2_distance": -0.01916840299963951,
          "input_gradient_dot_product": -0.002013114746659994
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.0,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_r": 0.6160949380881315,
      "train_p": 0.0,
      "val_r": 0.39261808728019937,
      "val_p": 1.2129172197036777e-14
    },
    "per_fold_stats": {
      "train_r_mean": 0.7517868201672098,
      "train_r_std": 0.02884538250208843,
      "val_r_mean": 0.660020001724191,
      "val_r_std": 0.175968530047121,
      "n_nonzero_mean": 16.7,
      "n_nonzero_std": 3.4219877264537346
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.006533559411764145,
      "right_subspace_overlap_bottom_k": -0.013745452277362347,
      "interaction_matrix_overlap_top_k": 0.0007507792324759066,
      "interaction_matrix_overlap_bottom_k": -0.0007551218150183558,
      "effective_rank": -0.00019390031229704618,
      "effective_rank_mergeability_score": 0.00017324488726444542,
      "stable_rank": -0.0003448409552220255,
      "spectral_gap": 5.678176967194304e-05,
      "singular_value_ratio": -0.00019888598762918264,
      "layerwise_effective_rank": -0.000934633775614202,
      "layerwise_effective_rank_mergeability_score": 0.0009657128830440342,
      "task_vector_cosine_similarity": 0.0008784830570220947,
      "task_vector_l2_distance": -0.001598607050254941,
      "task_vector_dot_product": -0.0008031550096347928,
      "weight_space_angle": 0.0007103706011548638,
      "task_vector_magnitude_ratio": -0.00014764565275982022,
      "singular_value_overlap": 0.004652106203138828,
      "subspace_overlap": -0.00015884413733147085,
      "right_subspace_overlap": 0.006524239666759968,
      "activation_l2_distance": -0.001410651602782309,
      "activation_cosine_similarity": 0.010578606277704239,
      "activation_magnitude_ratio": -0.001965178642421961,
      "activation_dot_product": 0.002552092308178544,
      "encoder_gradient_cosine_similarity": 0.0013743110466748476,
      "encoder_gradient_l2_distance": -0.020633619278669357,
      "encoder_gradient_dot_product": 0.00018909941718447953,
      "input_gradient_cosine_similarity": 0.0004466112586669624,
      "input_gradient_l2_distance": -0.01256854273378849,
      "input_gradient_dot_product": -0.0014428261201828718
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.003112143138423562,
      "right_subspace_overlap_bottom_k": 0.002974230330437422,
      "interaction_matrix_overlap_top_k": 0.0014184248866513371,
      "interaction_matrix_overlap_bottom_k": 0.002221831353381276,
      "effective_rank": 0.0005951150669716299,
      "effective_rank_mergeability_score": 0.0006558449240401387,
      "stable_rank": 0.00061770313186571,
      "spectral_gap": 0.0006575153674930334,
      "singular_value_ratio": 0.0006621009088121355,
      "layerwise_effective_rank": 0.0011761042987927794,
      "layerwise_effective_rank_mergeability_score": 0.0013518346240743995,
      "task_vector_cosine_similarity": 0.0014307035598903894,
      "task_vector_l2_distance": 0.002546121599152684,
      "task_vector_dot_product": 0.0013121989322826266,
      "weight_space_angle": 0.0025951683055609465,
      "task_vector_magnitude_ratio": 0.00044738498399965465,
      "singular_value_overlap": 0.0028970432467758656,
      "subspace_overlap": 0.0006064486806280911,
      "right_subspace_overlap": 0.003317583119496703,
      "activation_l2_distance": 0.003036763286218047,
      "activation_cosine_similarity": 0.004192250315099955,
      "activation_magnitude_ratio": 0.0018638529581949115,
      "activation_dot_product": 0.005334638990461826,
      "encoder_gradient_cosine_similarity": 0.0013877105666324496,
      "encoder_gradient_l2_distance": 0.007479684427380562,
      "encoder_gradient_dot_product": 0.0011348134139552712,
      "input_gradient_cosine_similarity": 0.0010888047982007265,
      "input_gradient_l2_distance": 0.006578623317182064,
      "input_gradient_dot_product": 0.0024355826899409294
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.9,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.7,
      "interaction_matrix_overlap_bottom_k": 0.4,
      "effective_rank": 0.1,
      "effective_rank_mergeability_score": 0.2,
      "stable_rank": 0.25,
      "spectral_gap": 0.15,
      "singular_value_ratio": 0.1,
      "layerwise_effective_rank": 0.45,
      "layerwise_effective_rank_mergeability_score": 0.45,
      "task_vector_cosine_similarity": 0.6,
      "task_vector_l2_distance": 0.9,
      "task_vector_dot_product": 0.45,
      "weight_space_angle": 0.7,
      "task_vector_magnitude_ratio": 0.1,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.2,
      "right_subspace_overlap": 0.95,
      "activation_l2_distance": 0.6,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.65,
      "activation_dot_product": 0.75,
      "encoder_gradient_cosine_similarity": 0.65,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.3,
      "input_gradient_cosine_similarity": 0.5,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.65
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7481909694068627,
        "val_r": 0.5992775650168041,
        "n_iterations": 249,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012530717067420483,
          "right_subspace_overlap_bottom_k": -0.010567175224423409,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.007265583146363497,
          "task_vector_dot_product": -0.002739576157182455,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0010759008582681417,
          "subspace_overlap": -0.0014187395572662354,
          "right_subspace_overlap": 0.004626449663192034,
          "activation_l2_distance": -0.005564774386584759,
          "activation_cosine_similarity": 0.013644526712596416,
          "activation_magnitude_ratio": -0.007078429684042931,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03265593945980072,
          "encoder_gradient_dot_product": 0.003226625267416239,
          "input_gradient_cosine_similarity": 0.0011357793118804693,
          "input_gradient_l2_distance": -0.02408108487725258,
          "input_gradient_dot_product": -0.0031399428844451904
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7431710504276792,
        "val_r": 0.773532513869468,
        "n_iterations": 246,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006744374055415392,
          "right_subspace_overlap_bottom_k": -0.015159912407398224,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.001012285239994526,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0019757538102567196,
          "task_vector_l2_distance": -0.0021659620106220245,
          "task_vector_dot_product": -0.003647281788289547,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0041620731353759766,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.009679111652076244,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0127859553322196,
          "activation_magnitude_ratio": -0.0037905664648860693,
          "activation_dot_product": 0.0034611658193171024,
          "encoder_gradient_cosine_similarity": 0.0012327973963692784,
          "encoder_gradient_l2_distance": -0.029647061601281166,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.020900029689073563,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.770284137633837,
        "val_r": 0.7799682407632963,
        "n_iterations": 254,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004590072203427553,
          "right_subspace_overlap_bottom_k": -0.012331862933933735,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0011516135418787599,
          "layerwise_effective_rank_mergeability_score": 0.0013954895548522472,
          "task_vector_cosine_similarity": 0.001803043414838612,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.003940535243600607,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008041040040552616,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.010987753048539162,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013902591541409492,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0016817966243252158,
          "input_gradient_l2_distance": -0.007669184356927872,
          "input_gradient_dot_product": -0.0019293531076982617
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7602516039096148,
        "val_r": 0.7217151797216658,
        "n_iterations": 215,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0070540024898946285,
          "right_subspace_overlap_bottom_k": -0.013363191857933998,
          "interaction_matrix_overlap_top_k": 0.0026036137714982033,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0011917052324861288,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.001363168703392148,
          "task_vector_l2_distance": 0.0014569316990673542,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0013206556905061007,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0036546364426612854,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004652974661439657,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01106884516775608,
          "activation_magnitude_ratio": -0.0030538314022123814,
          "activation_dot_product": -0.0012146863155066967,
          "encoder_gradient_cosine_similarity": 0.0034809429198503494,
          "encoder_gradient_l2_distance": -0.014749893918633461,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.001192962285131216,
          "input_gradient_l2_distance": -0.004073450341820717,
          "input_gradient_dot_product": -0.004213355947285891
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7603276410851849,
        "val_r": 0.7539258253000004,
        "n_iterations": 408,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0045522586442530155,
          "right_subspace_overlap_bottom_k": -0.013780750334262848,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0010795542038977146,
          "task_vector_dot_product": -0.001647025696001947,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0018149936804547906,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008705674670636654,
          "activation_l2_distance": -0.001159735256806016,
          "activation_cosine_similarity": 0.009042926132678986,
          "activation_magnitude_ratio": -0.0018150354735553265,
          "activation_dot_product": -0.0010289426427334547,
          "encoder_gradient_cosine_similarity": 0.0019899229519069195,
          "encoder_gradient_l2_distance": -0.0187973715364933,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002167662139981985,
          "input_gradient_l2_distance": -0.009704677388072014,
          "input_gradient_dot_product": -0.0018674260936677456
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7074396003256063,
        "val_r": 0.7357687453416482,
        "n_iterations": 189,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009449849836528301,
          "right_subspace_overlap_bottom_k": -0.019527455791831017,
          "interaction_matrix_overlap_top_k": 0.002067153574898839,
          "interaction_matrix_overlap_bottom_k": -0.007974611595273018,
          "effective_rank": -0.0023363197688013315,
          "effective_rank_mergeability_score": 0.0015370349865406752,
          "stable_rank": -0.0019564335234463215,
          "spectral_gap": 0.0018869821215048432,
          "singular_value_ratio": -0.0028964770026504993,
          "layerwise_effective_rank": -0.0030851818155497313,
          "layerwise_effective_rank_mergeability_score": 0.005063203629106283,
          "task_vector_cosine_similarity": 0.0034783119335770607,
          "task_vector_l2_distance": -0.0046456605195999146,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.002119320910423994,
          "task_vector_magnitude_ratio": -0.0012774551287293434,
          "singular_value_overlap": 0.0055870614014565945,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01035038661211729,
          "activation_l2_distance": -0.008249369449913502,
          "activation_cosine_similarity": 0.011532029137015343,
          "activation_magnitude_ratio": -0.003513963194563985,
          "activation_dot_product": 0.016417959704995155,
          "encoder_gradient_cosine_similarity": 0.0016414120327681303,
          "encoder_gradient_l2_distance": -0.026768654584884644,
          "encoder_gradient_dot_product": -0.002022180240601301,
          "input_gradient_cosine_similarity": 0.001455815159715712,
          "input_gradient_l2_distance": -0.022579330950975418,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7285658302726996,
        "val_r": 0.6176602237082307,
        "n_iterations": 432,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006165440194308758,
          "right_subspace_overlap_bottom_k": -0.012949502095580101,
          "interaction_matrix_overlap_top_k": 0.004293820820748806,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010859213070943952,
          "task_vector_cosine_similarity": 0.0016055600717663765,
          "task_vector_l2_distance": -0.0024656662717461586,
          "task_vector_dot_product": -0.0011569365160539746,
          "weight_space_angle": -0.0030230311676859856,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.006751133129000664,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006804970558732748,
          "activation_l2_distance": -0.004413940478116274,
          "activation_cosine_similarity": 0.011327262036502361,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0037936631124466658,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.021336624398827553,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01741921156644821,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.752156309008719,
        "val_r": 0.33574962345194354,
        "n_iterations": 255,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009502003900706768,
          "right_subspace_overlap_bottom_k": -0.01262452732771635,
          "interaction_matrix_overlap_top_k": -0.0012667356058955193,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002098728669807315,
          "layerwise_effective_rank_mergeability_score": 0.0017820419743657112,
          "task_vector_cosine_similarity": -0.0014584745513275266,
          "task_vector_l2_distance": -0.0018393568461760879,
          "task_vector_dot_product": -0.0014844076940789819,
          "weight_space_angle": -0.0010989318834617734,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0021742028184235096,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.00534145999699831,
          "activation_l2_distance": -0.0013329494977369905,
          "activation_cosine_similarity": 0.011269895359873772,
          "activation_magnitude_ratio": -0.002432728186249733,
          "activation_dot_product": -0.001976557308807969,
          "encoder_gradient_cosine_similarity": 0.0034162115771323442,
          "encoder_gradient_l2_distance": -0.013070221990346909,
          "encoder_gradient_dot_product": 0.0011020120000466704,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008043471723794937,
          "input_gradient_dot_product": 0.0010765485931187868
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.778457596729628,
        "val_r": 0.6210952972721285,
        "n_iterations": 190,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011022589169442654,
          "right_subspace_overlap_bottom_k": -0.01359769981354475,
          "interaction_matrix_overlap_top_k": 0.0013250161428004503,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0019358096178621054,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.001214566407725215,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0021872848737984896,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0013818780425935984,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0019544889219105244,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004404126666486263,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01290079951286316,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0040403567254543304,
          "encoder_gradient_cosine_similarity": 0.002139739226549864,
          "encoder_gradient_l2_distance": -0.015986299142241478,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0016816130373626947,
          "input_gradient_l2_distance": -0.00897759199142456,
          "input_gradient_dot_product": -0.0021365275606513023
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7343395509953744,
        "val_r": 0.7056925699712334,
        "n_iterations": 227,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004223972093313932,
          "right_subspace_overlap_bottom_k": -0.015559379942715168,
          "interaction_matrix_overlap_top_k": -0.0010706133907660842,
          "interaction_matrix_overlap_bottom_k": -0.0014661040622740984,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0011982677970081568,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010640679392963648,
          "task_vector_l2_distance": -0.002369387773796916,
          "task_vector_dot_product": -0.0033723576925694942,
          "weight_space_angle": 0.0026097861118614674,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0015802818816155195,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01186443492770195,
          "activation_l2_distance": 0.001234426163136959,
          "activation_cosine_similarity": -0.0012033339589834213,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0028877747245132923,
          "encoder_gradient_cosine_similarity": 0.0029054107144474983,
          "encoder_gradient_l2_distance": -0.023722149431705475,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.016218796372413635,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7661608557842541,
        "val_r": 0.053362010209868194,
        "n_iterations": 361,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.012216389179229736,
          "interaction_matrix_overlap_top_k": -0.001155021833255887,
          "interaction_matrix_overlap_bottom_k": 0.0018325723940506577,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0043264091946184635,
          "task_vector_l2_distance": -0.0029646374750882387,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.001866612583398819,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.013985290192067623,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.009232636541128159,
          "activation_cosine_similarity": 0.017819851636886597,
          "activation_magnitude_ratio": -0.003793486161157489,
          "activation_dot_product": 0.0073711806908249855,
          "encoder_gradient_cosine_similarity": -0.0010827642399817705,
          "encoder_gradient_l2_distance": -0.04241575673222542,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.004192317835986614,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7263697658691181,
        "val_r": 0.6713162309422045,
        "n_iterations": 172,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008591187186539173,
          "right_subspace_overlap_bottom_k": -0.015888188034296036,
          "interaction_matrix_overlap_top_k": 0.0012236040784046054,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0015380490804091096,
          "stable_rank": -0.0014365275856107473,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002062915824353695,
          "layerwise_effective_rank_mergeability_score": 0.0022570728324353695,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0033128811046481133,
          "task_vector_dot_product": -0.002074360614642501,
          "weight_space_angle": 0.007544898893684149,
          "task_vector_magnitude_ratio": -0.001675457926467061,
          "singular_value_overlap": 0.006201879121363163,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006583229172974825,
          "activation_l2_distance": -0.002736788708716631,
          "activation_cosine_similarity": 0.006717224605381489,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.009946642443537712,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.025368375703692436,
          "encoder_gradient_dot_product": 0.0017848419956862926,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.025809668004512787,
          "input_gradient_dot_product": 0.0010502231307327747
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7141512215961582,
        "val_r": 0.7146388872654563,
        "n_iterations": 246,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006477988790720701,
          "right_subspace_overlap_bottom_k": -0.01586957275867462,
          "interaction_matrix_overlap_top_k": 0.001439468003809452,
          "interaction_matrix_overlap_bottom_k": -0.005393837578594685,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0034805366303771734,
          "layerwise_effective_rank_mergeability_score": 0.003298304509371519,
          "task_vector_cosine_similarity": 0.002154349349439144,
          "task_vector_l2_distance": 0.002402711659669876,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.004816691391170025,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.006551518104970455,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008152984082698822,
          "activation_l2_distance": -0.0012436762917786837,
          "activation_cosine_similarity": 0.012276883237063885,
          "activation_magnitude_ratio": -0.0034222682006657124,
          "activation_dot_product": 0.006220444105565548,
          "encoder_gradient_cosine_similarity": 0.0028482056222856045,
          "encoder_gradient_l2_distance": -0.016530562192201614,
          "encoder_gradient_dot_product": -0.002094108145684004,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008952366188168526,
          "input_gradient_dot_product": -0.009576952084898949
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7635301634147592,
        "val_r": 0.7610913105785797,
        "n_iterations": 407,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0050262585282325745,
          "right_subspace_overlap_bottom_k": -0.011115268804132938,
          "interaction_matrix_overlap_top_k": 0.001966975163668394,
          "interaction_matrix_overlap_bottom_k": 0.0011622421443462372,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0019292524084448814,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005104102659970522,
          "subspace_overlap": -0.0016720357816666365,
          "right_subspace_overlap": 0.008358077146112919,
          "activation_l2_distance": 0.0013096367474645376,
          "activation_cosine_similarity": 0.01058622170239687,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014159198850393295,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0015916272532194853,
          "input_gradient_l2_distance": -0.005630462896078825,
          "input_gradient_dot_product": -0.0031767101027071476
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.766218101209297,
        "val_r": 0.7390701149446024,
        "n_iterations": 207,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005925776436924934,
          "right_subspace_overlap_bottom_k": -0.014833161607384682,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0010800051968544722,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0014665044145658612,
          "task_vector_l2_distance": 0.001426997478120029,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0034932238049805164,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.002168960403650999,
          "subspace_overlap": -0.0012775567593052983,
          "right_subspace_overlap": 0.007271558977663517,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.014022769406437874,
          "activation_magnitude_ratio": -0.0013304221211001277,
          "activation_dot_product": -0.00487874262034893,
          "encoder_gradient_cosine_similarity": 0.0014415476471185684,
          "encoder_gradient_l2_distance": -0.015329321846365929,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002707290928810835,
          "input_gradient_l2_distance": -0.004078666679561138,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7956610216670765,
        "val_r": 0.8747010435115844,
        "n_iterations": 483,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004295747727155685,
          "right_subspace_overlap_bottom_k": -0.016013644635677338,
          "interaction_matrix_overlap_top_k": 0.001422423985786736,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010421816259622574,
          "task_vector_l2_distance": -0.0042541297152638435,
          "task_vector_dot_product": -0.0014868841972202063,
          "weight_space_angle": 0.0035336269065737724,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.008267699740827084,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.011223962530493736,
          "activation_l2_distance": 0.0017476719804108143,
          "activation_cosine_similarity": 0.01102382317185402,
          "activation_magnitude_ratio": -0.0037047727964818478,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.022395748645067215,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.001226160442456603,
          "input_gradient_l2_distance": -0.011874107643961906,
          "input_gradient_dot_product": 0.001316157984547317
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7547188768375466,
        "val_r": 0.7748558732854434,
        "n_iterations": 221,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00760407792404294,
          "right_subspace_overlap_bottom_k": -0.014370042830705643,
          "interaction_matrix_overlap_top_k": 0.001574160996824503,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0010421441402286291,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0017165369354188442,
          "layerwise_effective_rank_mergeability_score": 0.0010441081831231713,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0025996132753789425,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0029484834522008896,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005239992402493954,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005312396679073572,
          "activation_l2_distance": 0.0014291038969531655,
          "activation_cosine_similarity": 0.008447161875665188,
          "activation_magnitude_ratio": -0.0018299937946721911,
          "activation_dot_product": 0.003018053714185953,
          "encoder_gradient_cosine_similarity": 0.003176088212057948,
          "encoder_gradient_l2_distance": -0.013487215153872967,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.012485723942518234,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7577255219804372,
        "val_r": 0.6633278739207144,
        "n_iterations": 181,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00775822764262557,
          "right_subspace_overlap_bottom_k": -0.013725434429943562,
          "interaction_matrix_overlap_top_k": 0.0017220373265445232,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0015457309782505035,
          "weight_space_angle": -0.0010860887123271823,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.004191776271909475,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005399889312684536,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01317095197737217,
          "activation_magnitude_ratio": -0.0014925316208973527,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0015883739106357098,
          "encoder_gradient_l2_distance": -0.019419198855757713,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015111020766198635,
          "input_gradient_dot_product": -0.0016323423478752375
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6909546624300167,
        "val_r": 0.5730936455838425,
        "n_iterations": 228,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009156647138297558,
          "right_subspace_overlap_bottom_k": -0.017052579671144485,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.0016760316211730242,
          "effective_rank": -0.0015416864771395922,
          "effective_rank_mergeability_score": 0.0016779573634266853,
          "stable_rank": -0.0012634459417313337,
          "spectral_gap": 0.0011844629188999534,
          "singular_value_ratio": -0.0010812426917254925,
          "layerwise_effective_rank": -0.002825451549142599,
          "layerwise_effective_rank_mergeability_score": 0.0021735485643148422,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0022471360862255096,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005696613807231188,
          "subspace_overlap": 0.0011914493516087532,
          "right_subspace_overlap": 0.005685778800398111,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01300010085105896,
          "activation_magnitude_ratio": -0.00204554945230484,
          "activation_dot_product": 0.00672561302781105,
          "encoder_gradient_cosine_similarity": 0.002708334242925048,
          "encoder_gradient_l2_distance": -0.01860889233648777,
          "encoder_gradient_dot_product": 0.001784797292202711,
          "input_gradient_cosine_similarity": -0.0010702371364459395,
          "input_gradient_l2_distance": -0.01274374034255743,
          "input_gradient_dot_product": -0.0013865700457245111
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8170619227603284,
        "val_r": 0.7305572598251051,
        "n_iterations": 292,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.00436329236254096,
          "interaction_matrix_overlap_top_k": -0.0011303190840408206,
          "interaction_matrix_overlap_bottom_k": -0.002598951105028391,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0012881439179182053,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0016817942960187793,
          "task_vector_l2_distance": -0.004165748134255409,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0011468935990706086,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.002938978374004364,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0019737049005925655,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0011504924623295665,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.010114185512065887,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014321299269795418,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01082594133913517,
          "input_gradient_dot_product": -0.0032402712386101484
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.0,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_r": 0.4229345304529925,
      "train_p": 5.26258186418199e-140,
      "val_r": -0.0880221739229809,
      "val_p": 0.09634002949003403
    },
    "per_fold_stats": {
      "train_r_mean": 0.5446837725027,
      "train_r_std": 0.05272028548641055,
      "val_r_mean": 0.4472012323728304,
      "val_r_std": 0.13467487063992079,
      "n_nonzero_mean": 15.6,
      "n_nonzero_std": 3.352610922848042
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 6.552942795678973e-05,
      "right_subspace_overlap_bottom_k": 0.0022824849002063274,
      "interaction_matrix_overlap_top_k": -0.000125858437968418,
      "interaction_matrix_overlap_bottom_k": 0.018964434042572975,
      "effective_rank": -0.00028956783353351057,
      "effective_rank_mergeability_score": 0.0003153859288431704,
      "stable_rank": -0.0002790758153423667,
      "spectral_gap": 0.0005526760360226035,
      "singular_value_ratio": -0.0003730769385583699,
      "layerwise_effective_rank": -0.00045246435911394656,
      "layerwise_effective_rank_mergeability_score": 0.00032660976285114884,
      "task_vector_cosine_similarity": -1.3625865904032253e-05,
      "task_vector_l2_distance": -0.012670865282416344,
      "task_vector_dot_product": -0.00039465673035010695,
      "weight_space_angle": -0.0004812762199435383,
      "task_vector_magnitude_ratio": -0.0021063191816210747,
      "singular_value_overlap": -0.01109122484922409,
      "subspace_overlap": 0.0008735476294532418,
      "right_subspace_overlap": 0.0007022420759312809,
      "activation_l2_distance": -0.0007255393429659307,
      "activation_cosine_similarity": 0.00013696230598725379,
      "activation_magnitude_ratio": -0.0025946972891688347,
      "activation_dot_product": -0.001993908081203699,
      "encoder_gradient_cosine_similarity": 0.00046810711501166224,
      "encoder_gradient_l2_distance": -0.0072061107493937016,
      "encoder_gradient_dot_product": 0.0002226797805633396,
      "input_gradient_cosine_similarity": 0.0006472301320172846,
      "input_gradient_l2_distance": -0.013994483277201653,
      "input_gradient_dot_product": -0.0025119150523096323
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.0014700625324621797,
      "right_subspace_overlap_bottom_k": 0.0031030243262648582,
      "interaction_matrix_overlap_top_k": 0.0015834998339414597,
      "interaction_matrix_overlap_bottom_k": 0.004994598682969809,
      "effective_rank": 0.0005043584387749434,
      "effective_rank_mergeability_score": 0.0006583528593182564,
      "stable_rank": 0.0005742284120060503,
      "spectral_gap": 0.0007848274544812739,
      "singular_value_ratio": 0.0006799512193538249,
      "layerwise_effective_rank": 0.0008582131122238934,
      "layerwise_effective_rank_mergeability_score": 0.0007383339107036591,
      "task_vector_cosine_similarity": 0.0010622214758768678,
      "task_vector_l2_distance": 0.005000103265047073,
      "task_vector_dot_product": 0.001800523605197668,
      "weight_space_angle": 0.0013269133633002639,
      "task_vector_magnitude_ratio": 0.000998556730337441,
      "singular_value_overlap": 0.002995614428073168,
      "subspace_overlap": 0.0015844128793105483,
      "right_subspace_overlap": 0.0017606657929718494,
      "activation_l2_distance": 0.0032864955719560385,
      "activation_cosine_similarity": 0.0016776449047029018,
      "activation_magnitude_ratio": 0.0010854477295652032,
      "activation_dot_product": 0.002524887677282095,
      "encoder_gradient_cosine_similarity": 0.0009654632303863764,
      "encoder_gradient_l2_distance": 0.005611919332295656,
      "encoder_gradient_dot_product": 0.0013024749932810664,
      "input_gradient_cosine_similarity": 0.0011322472710162401,
      "input_gradient_l2_distance": 0.006393385585397482,
      "input_gradient_dot_product": 0.0022833894472569227
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.45,
      "right_subspace_overlap_bottom_k": 0.75,
      "interaction_matrix_overlap_top_k": 0.45,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.25,
      "effective_rank_mergeability_score": 0.2,
      "stable_rank": 0.2,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.25,
      "layerwise_effective_rank": 0.25,
      "layerwise_effective_rank_mergeability_score": 0.2,
      "task_vector_cosine_similarity": 0.4,
      "task_vector_l2_distance": 0.95,
      "task_vector_dot_product": 0.4,
      "weight_space_angle": 0.4,
      "task_vector_magnitude_ratio": 0.9,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.35,
      "right_subspace_overlap": 0.4,
      "activation_l2_distance": 0.4,
      "activation_cosine_similarity": 0.25,
      "activation_magnitude_ratio": 0.95,
      "activation_dot_product": 0.6,
      "encoder_gradient_cosine_similarity": 0.5,
      "encoder_gradient_l2_distance": 0.95,
      "encoder_gradient_dot_product": 0.35,
      "input_gradient_cosine_similarity": 0.6,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.85
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5984624886034957,
        "val_r": 0.5852707796854559,
        "n_iterations": 229,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0014381272485479712,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.01577678509056568,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0022318800911307335,
          "task_vector_l2_distance": -0.009619096294045448,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0030038238037377596,
          "singular_value_overlap": -0.0115586519241333,
          "subspace_overlap": 0.003089148085564375,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003741474822163582,
          "activation_dot_product": -0.00449453154578805,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0057722777128219604,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008563513867557049,
          "input_gradient_dot_product": -0.002137810690328479
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5507345099646073,
        "val_r": 0.45167722377696917,
        "n_iterations": 279,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0011070913169533014,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.020043691620230675,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0016062305076047778,
          "stable_rank": 0.0,
          "spectral_gap": 0.0010552393505349755,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010855383239686489,
          "task_vector_dot_product": 0.0012525105848908424,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0030730199068784714,
          "singular_value_overlap": -0.007556232623755932,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0023737361188977957,
          "activation_l2_distance": 0.0010407654335722327,
          "activation_cosine_similarity": 0.0010346666676923633,
          "activation_magnitude_ratio": -0.002030535601079464,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.007805325090885162,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.001657809130847454,
          "input_gradient_l2_distance": -0.010549671947956085,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5350124878764876,
        "val_r": 0.4734727476921665,
        "n_iterations": 234,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0029410962015390396,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.017254849895834923,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0015587566886097193,
          "task_vector_l2_distance": -0.013245494104921818,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0015584651846438646,
          "singular_value_overlap": -0.011879872530698776,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0032596811652183533,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002964272163808346,
          "activation_dot_product": -0.001548245083540678,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.005555889569222927,
          "encoder_gradient_dot_product": -0.001822206424549222,
          "input_gradient_cosine_similarity": 0.0012905977200716734,
          "input_gradient_l2_distance": -0.01207603607326746,
          "input_gradient_dot_product": -0.0019435224821791053
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5523572302846307,
        "val_r": 0.5141149891820217,
        "n_iterations": 318,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.003426416777074337,
          "interaction_matrix_overlap_top_k": 0.0011154416715726256,
          "interaction_matrix_overlap_bottom_k": 0.017352893948554993,
          "effective_rank": -0.0010910083074122667,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0010500943753868341,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0012323603732511401,
          "task_vector_l2_distance": -0.01165380235761404,
          "task_vector_dot_product": 0.0013758381828665733,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001953958533704281,
          "singular_value_overlap": -0.012031862512230873,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0036610602401196957,
          "activation_dot_product": -0.003284701146185398,
          "encoder_gradient_cosine_similarity": -0.0012681677471846342,
          "encoder_gradient_l2_distance": -0.004441739059984684,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.001685662311501801,
          "input_gradient_l2_distance": -0.011261435225605965,
          "input_gradient_dot_product": -0.0033816820941865444
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5708241074038031,
        "val_r": 0.5951013632915878,
        "n_iterations": 243,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012091738171875477,
          "right_subspace_overlap_bottom_k": 0.0030588367953896523,
          "interaction_matrix_overlap_top_k": 0.00194265425670892,
          "interaction_matrix_overlap_bottom_k": 0.02552112750709057,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0014485931023955345,
          "singular_value_ratio": -0.0010427285451442003,
          "layerwise_effective_rank": -0.0010899277403950691,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0013668397441506386,
          "task_vector_l2_distance": -0.020691031590104103,
          "task_vector_dot_product": -0.0032377205789089203,
          "weight_space_angle": -0.0012811279157176614,
          "task_vector_magnitude_ratio": -0.002033067401498556,
          "singular_value_overlap": -0.016274508088827133,
          "subspace_overlap": -0.0010156265925616026,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0020964238792657852,
          "activation_dot_product": -0.004218418151140213,
          "encoder_gradient_cosine_similarity": 0.0012201754143461585,
          "encoder_gradient_l2_distance": -0.004976240452378988,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.016778698191046715,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5257096412068283,
        "val_r": 0.6965171659214692,
        "n_iterations": 301,
        "n_nonzero_coefficients": 13,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.003384063486009836,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.022228214889764786,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0013943712692707777,
          "task_vector_l2_distance": -0.013342232443392277,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0023561534471809864,
          "singular_value_overlap": -0.013659429736435413,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.001089025754481554,
          "activation_l2_distance": -0.002182080876082182,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002557947300374508,
          "activation_dot_product": -0.0031952240969985723,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.006282821297645569,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0021890331991016865,
          "input_gradient_l2_distance": -0.01230686902999878,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5525768067041729,
        "val_r": 0.24657392384193688,
        "n_iterations": 321,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0010649290634319186,
          "right_subspace_overlap_bottom_k": 0.006503187119960785,
          "interaction_matrix_overlap_top_k": -0.0019224865827709436,
          "interaction_matrix_overlap_bottom_k": 0.02238009311258793,
          "effective_rank": -0.0013025305233895779,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0020066520664840937,
          "singular_value_ratio": -0.0020946403965353966,
          "layerwise_effective_rank": -0.002138781826943159,
          "layerwise_effective_rank_mergeability_score": 0.001417043269611895,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.016403021290898323,
          "task_vector_dot_product": -0.005198238417506218,
          "weight_space_angle": 0.0022673048079013824,
          "task_vector_magnitude_ratio": -0.002549689495936036,
          "singular_value_overlap": -0.01655854843556881,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.003445724956691265,
          "activation_cosine_similarity": 0.0014984223525971174,
          "activation_magnitude_ratio": -0.001776242977939546,
          "activation_dot_product": -0.010769030079245567,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.012777618132531643,
          "encoder_gradient_dot_product": 0.00249113654717803,
          "input_gradient_cosine_similarity": -0.0020597197581082582,
          "input_gradient_l2_distance": -0.018921438604593277,
          "input_gradient_dot_product": -0.002296565566211939
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5277414561588265,
        "val_r": 0.3883309783984004,
        "n_iterations": 189,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.001449286355637014,
          "interaction_matrix_overlap_top_k": -0.003372735809534788,
          "interaction_matrix_overlap_bottom_k": 0.023899590596556664,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0013096937909722328,
          "spectral_gap": 0.0015864279121160507,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012329088523983955,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0032918488141149282,
          "singular_value_overlap": -0.01094839908182621,
          "subspace_overlap": 0.0012138914316892624,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003398518543690443,
          "activation_dot_product": -0.0023327942471951246,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.00523685896769166,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0061825113371014595,
          "input_gradient_dot_product": -0.0016045646043494344
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5351060054548051,
        "val_r": 0.39513481755547275,
        "n_iterations": 250,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0017021982930600643,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.020674221217632294,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0022277701646089554,
          "stable_rank": 0.0,
          "spectral_gap": 0.001089185243472457,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0011633741669356823,
          "task_vector_cosine_similarity": -0.0015672000590711832,
          "task_vector_l2_distance": -0.007976889610290527,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0024591556284576654,
          "task_vector_magnitude_ratio": -0.0012200034689158201,
          "singular_value_overlap": -0.008226889185607433,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0017398596974089742,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.001615991466678679,
          "encoder_gradient_l2_distance": -0.005447461269795895,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.001363264280371368,
          "input_gradient_l2_distance": -0.00952247716486454,
          "input_gradient_dot_product": -0.0027236510068178177
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.56711061846266,
        "val_r": 0.1755846333171502,
        "n_iterations": 328,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0015877539990469813,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.018468273803591728,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012182325590401888,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010098416823893785,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01284770481288433,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0026327483355998993,
          "singular_value_overlap": -0.01206082385033369,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.0010976267512887716,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.0018832720816135406,
          "activation_magnitude_ratio": -0.003323041135445237,
          "activation_dot_product": -0.0017477403162047267,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.005412775091826916,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.012251491658389568,
          "input_gradient_dot_product": -0.001264780294150114
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.47720659168573176,
        "val_r": 0.3088082983729836,
        "n_iterations": 433,
        "n_nonzero_coefficients": 12,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004203435964882374,
          "interaction_matrix_overlap_top_k": -0.00110324053093791,
          "interaction_matrix_overlap_bottom_k": 0.015336010605096817,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010317753069102764,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.001397250802256167,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.00807985384017229,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0027410676702857018,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.006698683835566044,
          "encoder_gradient_dot_product": 0.0013536084443330765,
          "input_gradient_cosine_similarity": 0.0017515176441520452,
          "input_gradient_l2_distance": -0.00844768900424242,
          "input_gradient_dot_product": -0.0016930440906435251
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5169677771677631,
        "val_r": 0.5192806448708999,
        "n_iterations": 347,
        "n_nonzero_coefficients": 11,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.020127054303884506,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.011425885371863842,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0016076158499345183,
          "singular_value_overlap": -0.011100009083747864,
          "subspace_overlap": 0.003186162794008851,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0021799455862492323,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0030756695196032524,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.001267787185497582,
          "encoder_gradient_l2_distance": -0.005985839758068323,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.012938723899424076,
          "input_gradient_dot_product": -0.0024285325780510902
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5119461705363894,
        "val_r": 0.5255933366816106,
        "n_iterations": 408,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0011153401574119925,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.01683555729687214,
          "effective_rank": -0.0012644871603697538,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010545613477006555,
          "task_vector_l2_distance": -0.011971622705459595,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.003126151394098997,
          "singular_value_overlap": -0.010248998180031776,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0013522951630875468,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.001529501168988645,
          "encoder_gradient_l2_distance": -0.004374487325549126,
          "encoder_gradient_dot_product": -0.0016332913655787706,
          "input_gradient_cosine_similarity": 0.0015230237040668726,
          "input_gradient_l2_distance": -0.010959535837173462,
          "input_gradient_dot_product": -0.004412577487528324
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4302571207169676,
        "val_r": 0.5237598468849746,
        "n_iterations": 307,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003546022344380617,
          "right_subspace_overlap_bottom_k": 0.0031581528019160032,
          "interaction_matrix_overlap_top_k": 0.001408232725225389,
          "interaction_matrix_overlap_bottom_k": 0.017587922513484955,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0013541547814384103,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0025019075255841017,
          "task_vector_l2_distance": -0.008486184291541576,
          "task_vector_dot_product": 0.002355222124606371,
          "weight_space_angle": -0.0032818333711475134,
          "task_vector_magnitude_ratio": -0.002054717391729355,
          "singular_value_overlap": -0.006253937259316444,
          "subspace_overlap": 0.0025185521226376295,
          "right_subspace_overlap": 0.0024793411139398813,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0013093962334096432,
          "activation_dot_product": -0.0010847561061382294,
          "encoder_gradient_cosine_similarity": 0.0027072099037468433,
          "encoder_gradient_l2_distance": -0.008186860010027885,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0014802315272390842,
          "input_gradient_l2_distance": -0.012508882209658623,
          "input_gradient_dot_product": -0.011143351905047894
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.48810923896126734,
        "val_r": 0.5437359399986808,
        "n_iterations": 368,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.003903299570083618,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.017176367342472076,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.016214832663536072,
          "task_vector_dot_product": -0.004307907074689865,
          "weight_space_angle": -0.0011252772528678179,
          "task_vector_magnitude_ratio": -0.0021495455875992775,
          "singular_value_overlap": -0.01554578822106123,
          "subspace_overlap": 0.004939825274050236,
          "right_subspace_overlap": 0.0027221606578677893,
          "activation_l2_distance": -0.004161341581493616,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002906988374888897,
          "activation_dot_product": -0.0017216817941516638,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.00839540921151638,
          "encoder_gradient_dot_product": -0.001689306227490306,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01679784059524536,
          "input_gradient_dot_product": -0.0027049179188907146
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5508619943793118,
        "val_r": 0.4013676940837619,
        "n_iterations": 384,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.001608472433872521,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.019609127193689346,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.016579635441303253,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.002390575595200062,
          "singular_value_overlap": -0.00858575664460659,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0019923921208828688,
          "activation_l2_distance": -0.0010713416850194335,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.005197542253881693,
          "activation_dot_product": -0.0037386626936495304,
          "encoder_gradient_cosine_similarity": 0.0010521163931116462,
          "encoder_gradient_l2_distance": -0.008018243126571178,
          "encoder_gradient_dot_product": 0.0020141489803791046,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.013926360756158829,
          "input_gradient_dot_product": -0.0033450969494879246
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5517792818319422,
        "val_r": 0.49588252050391185,
        "n_iterations": 353,
        "n_nonzero_coefficients": 11,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0010411972180008888,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.014196068979799747,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0014032311737537384,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009156021289527416,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010920872446149588,
          "task_vector_magnitude_ratio": -0.0013156443601474166,
          "singular_value_overlap": -0.00791970081627369,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002389767440035939,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0038520474918186665,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.007561051286756992,
          "input_gradient_dot_product": -0.0012834734516218305
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5782033234843059,
        "val_r": 0.21701777119502325,
        "n_iterations": 192,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0023376040626317263,
          "right_subspace_overlap_bottom_k": 0.012536398135125637,
          "interaction_matrix_overlap_top_k": -0.0024718933273106813,
          "interaction_matrix_overlap_bottom_k": 0.029811635613441467,
          "effective_rank": -0.001026809448376298,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0019081333884969354,
          "spectral_gap": 0.0018707062117755413,
          "singular_value_ratio": -0.0010904375230893493,
          "layerwise_effective_rank": -0.001846124418079853,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.025020744651556015,
          "task_vector_dot_product": 0.0011320380726829171,
          "weight_space_angle": -0.003440272295847535,
          "task_vector_magnitude_ratio": -0.001680090557783842,
          "singular_value_overlap": -0.0139318173751235,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.005564758088439703,
          "activation_cosine_similarity": -0.003834816161543131,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0017423788085579872,
          "encoder_gradient_cosine_similarity": 0.001090198871679604,
          "encoder_gradient_l2_distance": 0.0,
          "encoder_gradient_dot_product": 0.003739505773410201,
          "input_gradient_cosine_similarity": 0.0021431788336485624,
          "input_gradient_l2_distance": -0.030311817303299904,
          "input_gradient_dot_product": -0.002100628102198243
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7064033441266103,
        "val_r": 0.5681030280308375,
        "n_iterations": 360,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002624868182465434,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.004048763308674097,
          "interaction_matrix_overlap_bottom_k": 0.00411337660625577,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0010704864980652928,
          "stable_rank": -0.001145456568337977,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002924358006566763,
          "layerwise_effective_rank_mergeability_score": 0.002941936021670699,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.007309289183467627,
          "subspace_overlap": 0.003538999240845442,
          "right_subspace_overlap": 0.00597360311076045,
          "activation_l2_distance": -0.012435766868293285,
          "activation_cosine_similarity": 0.0059242453426122665,
          "activation_magnitude_ratio": -0.0033802823163568974,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0016118725761771202,
          "encoder_gradient_l2_distance": -0.02937040664255619,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0016361558809876442,
          "input_gradient_l2_distance": -0.030590400099754333,
          "input_gradient_dot_product": -0.0025904125068336725
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5663052550433917,
        "val_r": 0.3186969441712954,
        "n_iterations": 275,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0033771039452403784,
          "right_subspace_overlap_bottom_k": 0.0013747295597568154,
          "interaction_matrix_overlap_top_k": -0.002161904703825712,
          "interaction_matrix_overlap_bottom_k": 0.020895833149552345,
          "effective_rank": -0.001106521114706993,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0019967155531048775,
          "singular_value_ratio": -0.001879577524960041,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01528088841587305,
          "task_vector_dot_product": -0.0012648776173591614,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004129265435039997,
          "singular_value_overlap": -0.012094134464859962,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002251556608825922,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0010710316710174084,
          "encoder_gradient_l2_distance": -0.005531218834221363,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0010103760287165642,
          "input_gradient_l2_distance": -0.01743323728442192,
          "input_gradient_dot_product": -0.003183686872944236
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 1.0,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  }
}