{
  "aggregate_metrics": {
    "train_r": 0.45407499129750556,
    "train_p": 1.0944677397522091e-163,
    "val_r": 0.044611329527150745,
    "val_p": 0.40003818347787967
  },
  "per_fold_stats": {
    "train_r_mean": 0.5545384121093118,
    "train_r_std": 0.04099603834025219,
    "val_r_mean": 0.4431387291223253,
    "val_r_std": 0.1459124731344027,
    "n_nonzero_mean": 18.7,
    "n_nonzero_std": 3.479942528261063
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0009750762837938964,
    "right_subspace_overlap_bottom_k": 0.004742247052490711,
    "interaction_matrix_overlap_top_k": -0.000578699167817831,
    "interaction_matrix_overlap_bottom_k": 0.02730504237115383,
    "effective_rank": -0.0003203979867976159,
    "effective_rank_mergeability_score": 0.0003351555787958205,
    "stable_rank": -0.0005377558409236372,
    "spectral_gap": 0.0005061282427050173,
    "singular_value_ratio": -0.00046937866136431694,
    "layerwise_effective_rank": -0.0005517587414942682,
    "layerwise_effective_rank_mergeability_score": 0.00043108206591568887,
    "task_vector_cosine_similarity": -0.0002924669242929667,
    "task_vector_l2_distance": -0.01851021498441696,
    "task_vector_dot_product": -0.000510625948663801,
    "weight_space_angle": 0.0011753311846405268,
    "task_vector_magnitude_ratio": -0.004185675643384457,
    "singular_value_overlap": -0.018195267766714096,
    "subspace_overlap": 0.0027204789221286774,
    "right_subspace_overlap": 0.0009801069973036647,
    "activation_l2_distance": -0.00044936599442735314,
    "activation_cosine_similarity": 0.0001255279639735818,
    "activation_magnitude_ratio": -0.0049768188036978245,
    "activation_dot_product": -0.002195653971284628,
    "encoder_gradient_cosine_similarity": 0.00015232068835757673,
    "encoder_gradient_l2_distance": -0.011668307706713676,
    "encoder_gradient_dot_product": 0.0005043993587605655,
    "input_gradient_cosine_similarity": 0.0011440727394074202,
    "input_gradient_l2_distance": -0.02112356200814247,
    "input_gradient_dot_product": -0.004989933222532272
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.0026086147408932447,
    "right_subspace_overlap_bottom_k": 0.004568357020616531,
    "interaction_matrix_overlap_top_k": 0.001916107488796115,
    "interaction_matrix_overlap_bottom_k": 0.007318887393921614,
    "effective_rank": 0.0005613246466964483,
    "effective_rank_mergeability_score": 0.0006856020190753043,
    "stable_rank": 0.0006818942492827773,
    "spectral_gap": 0.0008963276050053537,
    "singular_value_ratio": 0.0009193715522997081,
    "layerwise_effective_rank": 0.0013081200886517763,
    "layerwise_effective_rank_mergeability_score": 0.0009728326695039868,
    "task_vector_cosine_similarity": 0.0011729317484423518,
    "task_vector_l2_distance": 0.007536298595368862,
    "task_vector_dot_product": 0.00265966122969985,
    "weight_space_angle": 0.0019250301411375403,
    "task_vector_magnitude_ratio": 0.001963724149391055,
    "singular_value_overlap": 0.006089130416512489,
    "subspace_overlap": 0.0026353122666478157,
    "right_subspace_overlap": 0.0030862672720104456,
    "activation_l2_distance": 0.0031041877809911966,
    "activation_cosine_similarity": 0.002082545543089509,
    "activation_magnitude_ratio": 0.0020626522600650787,
    "activation_dot_product": 0.004247982520610094,
    "encoder_gradient_cosine_similarity": 0.0017669587396085262,
    "encoder_gradient_l2_distance": 0.004704682622104883,
    "encoder_gradient_dot_product": 0.0014577734982594848,
    "input_gradient_cosine_similarity": 0.0012497496791183949,
    "input_gradient_l2_distance": 0.006714371498674154,
    "input_gradient_dot_product": 0.0032374041620641947
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.45,
    "right_subspace_overlap_bottom_k": 0.8,
    "interaction_matrix_overlap_top_k": 0.4,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.25,
    "effective_rank_mergeability_score": 0.35,
    "stable_rank": 0.4,
    "spectral_gap": 0.45,
    "singular_value_ratio": 0.4,
    "layerwise_effective_rank": 0.2,
    "layerwise_effective_rank_mergeability_score": 0.2,
    "task_vector_cosine_similarity": 0.3,
    "task_vector_l2_distance": 1.0,
    "task_vector_dot_product": 0.6,
    "weight_space_angle": 0.75,
    "task_vector_magnitude_ratio": 1.0,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.8,
    "right_subspace_overlap": 0.55,
    "activation_l2_distance": 0.9,
    "activation_cosine_similarity": 0.6,
    "activation_magnitude_ratio": 0.95,
    "activation_dot_product": 0.8,
    "encoder_gradient_cosine_similarity": 0.5,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.55,
    "input_gradient_cosine_similarity": 0.5,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 1.0
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6069669389747144,
      "val_r": 0.6216906850658248,
      "n_iterations": 209,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.001524151535704732,
        "right_subspace_overlap_bottom_k": 0.005971998907625675,
        "interaction_matrix_overlap_top_k": -0.0024150696117430925,
        "interaction_matrix_overlap_bottom_k": 0.03424370288848877,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0014240657910704613,
        "task_vector_l2_distance": -0.024421220645308495,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.004702414385974407,
        "task_vector_magnitude_ratio": -0.005878467112779617,
        "singular_value_overlap": -0.025676751509308815,
        "subspace_overlap": 0.0069850729778409,
        "right_subspace_overlap": -0.0020423561800271273,
        "activation_l2_distance": 0.001793664414435625,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.007859897799789906,
        "activation_dot_product": -0.005102195776998997,
        "encoder_gradient_cosine_similarity": -0.0020026019774377346,
        "encoder_gradient_l2_distance": -0.012159079313278198,
        "encoder_gradient_dot_product": 0.0012017423287034035,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.019374113529920578,
        "input_gradient_dot_product": -0.005960147362202406
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5427429750133878,
      "val_r": 0.5722878283435049,
      "n_iterations": 285,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004076370969414711,
        "right_subspace_overlap_bottom_k": 0.009004411287605762,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0332949161529541,
        "effective_rank": -0.001061383867636323,
        "effective_rank_mergeability_score": 0.0011477397056296468,
        "stable_rank": 0.0,
        "spectral_gap": 0.0016484237276017666,
        "singular_value_ratio": -0.001763252541422844,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.003885365556925535,
        "task_vector_l2_distance": -0.019061792641878128,
        "task_vector_dot_product": -0.005565094295889139,
        "weight_space_angle": 0.004030839540064335,
        "task_vector_magnitude_ratio": -0.006631467957049608,
        "singular_value_overlap": -0.027768077328801155,
        "subspace_overlap": 0.002981973346322775,
        "right_subspace_overlap": 0.0042241839691996574,
        "activation_l2_distance": -0.003849123604595661,
        "activation_cosine_similarity": 0.004013813566416502,
        "activation_magnitude_ratio": -0.00516230333596468,
        "activation_dot_product": -0.006769961677491665,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.02189590036869049,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03315090760588646,
        "input_gradient_dot_product": -0.009675076231360435
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5436327474745457,
      "val_r": 0.4944656114086446,
      "n_iterations": 360,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.01131760235875845,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.03337346762418747,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0011112620122730732,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02523939125239849,
        "task_vector_dot_product": 0.0019361465238034725,
        "weight_space_angle": 0.0010576883796602488,
        "task_vector_magnitude_ratio": -0.004404345527291298,
        "singular_value_overlap": -0.023091088980436325,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.003449718002229929,
        "activation_cosine_similarity": -0.0011386937694624066,
        "activation_magnitude_ratio": -0.005633268505334854,
        "activation_dot_product": 0.0010728633496910334,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.010564908385276794,
        "encoder_gradient_dot_product": -0.0017121769487857819,
        "input_gradient_cosine_similarity": 0.0020911889150738716,
        "input_gradient_l2_distance": -0.025726240128278732,
        "input_gradient_dot_product": -0.0077710445038974285
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5523244641491509,
      "val_r": 0.4961566155415025,
      "n_iterations": 312,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.003222195664420724,
        "interaction_matrix_overlap_top_k": -0.0011159993009641767,
        "interaction_matrix_overlap_bottom_k": 0.026475343853235245,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0013092323206365108,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010392768308520317,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.017166607081890106,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004562309477478266,
        "singular_value_overlap": -0.018783332780003548,
        "subspace_overlap": 0.005598260089755058,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.0025193211622536182,
        "activation_magnitude_ratio": -0.007717553526163101,
        "activation_dot_product": -0.0029515058267861605,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008273190818727016,
        "encoder_gradient_dot_product": 0.0011292226845398545,
        "input_gradient_cosine_similarity": 0.0027370338793843985,
        "input_gradient_l2_distance": -0.018112044781446457,
        "input_gradient_dot_product": -0.004235783126205206
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5714641337863879,
      "val_r": 0.5433104574757851,
      "n_iterations": 285,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.027806423604488373,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01366439275443554,
        "task_vector_dot_product": -0.005453597754240036,
        "weight_space_angle": 0.0019243372371420264,
        "task_vector_magnitude_ratio": -0.0023501699324697256,
        "singular_value_overlap": -0.01663006842136383,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.003317030146718025,
        "activation_l2_distance": -0.0015805643051862717,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.003356881905347109,
        "activation_dot_product": -0.0034704525023698807,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008563730865716934,
        "encoder_gradient_dot_product": 0.0012573954882100224,
        "input_gradient_cosine_similarity": 0.002073411364108324,
        "input_gradient_l2_distance": -0.01798323169350624,
        "input_gradient_dot_product": -0.005510477814823389
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5564378383511293,
      "val_r": 0.6466885078100408,
      "n_iterations": 765,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0114522660151124,
        "interaction_matrix_overlap_top_k": -0.001710810698568821,
        "interaction_matrix_overlap_bottom_k": 0.033472802489995956,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0011312816059216857,
        "singular_value_ratio": -0.0018455003155395389,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.027337050065398216,
        "task_vector_dot_product": 0.004322591703385115,
        "weight_space_angle": 0.0038204360753297806,
        "task_vector_magnitude_ratio": -0.00638490729033947,
        "singular_value_overlap": -0.021145012229681015,
        "subspace_overlap": -0.0019058939069509506,
        "right_subspace_overlap": -0.003010713029652834,
        "activation_l2_distance": 0.004081739578396082,
        "activation_cosine_similarity": -0.001595612266100943,
        "activation_magnitude_ratio": -0.006089236121624708,
        "activation_dot_product": 0.0013372208923101425,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.012300750240683556,
        "encoder_gradient_dot_product": 0.0022348302882164717,
        "input_gradient_cosine_similarity": 0.0037616384215652943,
        "input_gradient_l2_distance": -0.017388854175806046,
        "input_gradient_dot_product": -0.005182607099413872
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5902396783824847,
      "val_r": 0.29220096697621006,
      "n_iterations": 395,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.00239451602101326,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.024971920996904373,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01178243663161993,
        "task_vector_dot_product": -0.003880639560520649,
        "weight_space_angle": 0.0011536937672644854,
        "task_vector_magnitude_ratio": -0.004681247286498547,
        "singular_value_overlap": -0.012164960615336895,
        "subspace_overlap": 0.0012366395676508546,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.007749900687485933,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.007878783158957958,
        "encoder_gradient_cosine_similarity": 0.0017331610433757305,
        "encoder_gradient_l2_distance": -0.013126324862241745,
        "encoder_gradient_dot_product": 0.0017383486265316606,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.014035208150744438,
        "input_gradient_dot_product": -0.004471853841096163
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5122449608095287,
      "val_r": 0.3374151268819038,
      "n_iterations": 243,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0021791732870042324,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.0011922621633857489,
        "interaction_matrix_overlap_bottom_k": 0.025361433625221252,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0010983586544170976,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.015579388476908207,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004077722318470478,
        "singular_value_overlap": -0.016301028430461884,
        "subspace_overlap": 0.004408565815538168,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0014040053356438875,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0050685470923781395,
        "activation_dot_product": -0.004974489565938711,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.009209288284182549,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.00830375961959362,
        "input_gradient_dot_product": -0.0015971586108207703
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5493423879828563,
      "val_r": 0.45109733930877816,
      "n_iterations": 232,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.011151542887091637,
        "interaction_matrix_overlap_top_k": -0.0026049152947962284,
        "interaction_matrix_overlap_bottom_k": 0.03412509337067604,
        "effective_rank": -0.001292076543904841,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0011578128905966878,
        "spectral_gap": 0.0013079139171168208,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0015961683820933104,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.028163794428110123,
        "task_vector_dot_product": 0.0010001088958233595,
        "weight_space_angle": 0.002746023004874587,
        "task_vector_magnitude_ratio": -0.003284938633441925,
        "singular_value_overlap": -0.02574317529797554,
        "subspace_overlap": 0.002121339552104473,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0011354736052453518,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.008996433578431606,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0017176879337057471,
        "encoder_gradient_l2_distance": -0.010216271504759789,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0325823538005352,
        "input_gradient_dot_product": -0.001331257983110845
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5508031848690376,
      "val_r": 0.06715384739538477,
      "n_iterations": 313,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0015862876316532493,
        "right_subspace_overlap_bottom_k": 0.0075697097927331924,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.031408343464136124,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.022758115082979202,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.002797291148453951,
        "singular_value_overlap": -0.024546215310692787,
        "subspace_overlap": 0.0039932141080498695,
        "right_subspace_overlap": -0.001178162288852036,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.0037631168961524963,
        "activation_magnitude_ratio": -0.00643800338730216,
        "activation_dot_product": -0.005684833973646164,
        "encoder_gradient_cosine_similarity": -0.0012444216990843415,
        "encoder_gradient_l2_distance": -0.011957656592130661,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.024428268894553185,
        "input_gradient_dot_product": -0.001133285346440971
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5207867116157635,
      "val_r": 0.38158294441729423,
      "n_iterations": 250,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004498228896409273,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.02378096804022789,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0011707751546055079,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.014857947826385498,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0013641791883856058,
        "task_vector_magnitude_ratio": -0.0030622310005128384,
        "singular_value_overlap": -0.014363059774041176,
        "subspace_overlap": 0.0013521979562938213,
        "right_subspace_overlap": 0.0016890456900000572,
        "activation_l2_distance": -0.0018602557247504592,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.005566183477640152,
        "activation_dot_product": -0.0033922994043678045,
        "encoder_gradient_cosine_similarity": -0.002531364792957902,
        "encoder_gradient_l2_distance": -0.00836719386279583,
        "encoder_gradient_dot_product": -0.002757422160357237,
        "input_gradient_cosine_similarity": 0.00286948517896235,
        "input_gradient_l2_distance": -0.014766799286007881,
        "input_gradient_dot_product": -0.0025439895689487457
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4989191103229239,
      "val_r": 0.4109307517590827,
      "n_iterations": 434,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002873252145946026,
        "right_subspace_overlap_bottom_k": 0.004442664794623852,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.025784851983189583,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0010592297185212374,
        "singular_value_ratio": -0.0010790824890136719,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.015519039705395699,
        "task_vector_dot_product": -0.0011730091646313667,
        "weight_space_angle": 0.001927834004163742,
        "task_vector_magnitude_ratio": -0.004846005234867334,
        "singular_value_overlap": -0.015634071081876755,
        "subspace_overlap": 0.006941605359315872,
        "right_subspace_overlap": 0.0020716465078294277,
        "activation_l2_distance": -0.004540099762380123,
        "activation_cosine_similarity": 0.004206611774861813,
        "activation_magnitude_ratio": -0.0023550947662442923,
        "activation_dot_product": -0.004065544810146093,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.01053873635828495,
        "encoder_gradient_dot_product": -0.0011821193620562553,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.017835164442658424,
        "input_gradient_dot_product": -0.0048109968192875385
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5233722699895743,
      "val_r": 0.5498429125769141,
      "n_iterations": 290,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0107567785307765,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.03383341059088707,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0012821524869650602,
        "stable_rank": -0.0011420247610658407,
        "spectral_gap": 0.001424700254574418,
        "singular_value_ratio": -0.0014580392744392157,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0017128832405433059,
        "task_vector_l2_distance": -0.028372550383210182,
        "task_vector_dot_product": 0.001766058849170804,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0059733763337135315,
        "singular_value_overlap": -0.024399764835834503,
        "subspace_overlap": 0.0013220380060374737,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0018565452191978693,
        "activation_cosine_similarity": -0.0012813906650990248,
        "activation_magnitude_ratio": -0.006371192168444395,
        "activation_dot_product": -0.0033955180551856756,
        "encoder_gradient_cosine_similarity": 0.0012701674131676555,
        "encoder_gradient_l2_distance": -0.012103792279958725,
        "encoder_gradient_dot_product": 0.0035612762439996004,
        "input_gradient_cosine_similarity": 0.0011294233845546842,
        "input_gradient_l2_distance": -0.027677413076162338,
        "input_gradient_dot_product": -0.005082476418465376
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5041144651738104,
      "val_r": 0.646321400391478,
      "n_iterations": 429,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003290496300905943,
        "right_subspace_overlap_bottom_k": -0.002646005479618907,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.027032697573304176,
        "effective_rank": -0.0011400794610381126,
        "effective_rank_mergeability_score": 0.0011529546463862062,
        "stable_rank": -0.0011741681955754757,
        "spectral_gap": 0.0017073079943656921,
        "singular_value_ratio": -0.0014137664111331105,
        "layerwise_effective_rank": -0.0011874032206833363,
        "layerwise_effective_rank_mergeability_score": 0.0013008976820856333,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009128854610025883,
        "task_vector_dot_product": -0.0023865802213549614,
        "weight_space_angle": 0.0012414141092449427,
        "task_vector_magnitude_ratio": -0.00372564559802413,
        "singular_value_overlap": -0.01447802409529686,
        "subspace_overlap": 0.006005384027957916,
        "right_subspace_overlap": 0.0018590305699035525,
        "activation_l2_distance": -0.00407383730635047,
        "activation_cosine_similarity": 0.0017713172128424048,
        "activation_magnitude_ratio": -0.002142716431990266,
        "activation_dot_product": -0.0036503244191408157,
        "encoder_gradient_cosine_similarity": 0.002177273156121373,
        "encoder_gradient_l2_distance": -0.013312062248587608,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.019395483657717705,
        "input_gradient_dot_product": -0.010785548016428947
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5242619987231514,
      "val_r": 0.5649183417729386,
      "n_iterations": 225,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.02186451479792595,
        "effective_rank": -0.0015350099420174956,
        "effective_rank_mergeability_score": 0.0016513252630829811,
        "stable_rank": -0.0018564281053841114,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01716323010623455,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.002855539321899414,
        "task_vector_magnitude_ratio": -0.004322884138673544,
        "singular_value_overlap": -0.015294932760298252,
        "subspace_overlap": 0.0070470054633915424,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.002003840869292617,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.004908533301204443,
        "activation_dot_product": -0.004647768102586269,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008104262873530388,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01780577003955841,
        "input_gradient_dot_product": -0.0039016446098685265
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5667117284122014,
      "val_r": 0.35328108368180833,
      "n_iterations": 183,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004551155027002096,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.017724795266985893,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.001761134946718812,
        "task_vector_l2_distance": -0.015276627615094185,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0015753747429698706,
        "task_vector_magnitude_ratio": -0.0047744521871209145,
        "singular_value_overlap": -0.00700373575091362,
        "subspace_overlap": 0.0018156659789383411,
        "right_subspace_overlap": 0.002126511186361313,
        "activation_l2_distance": 0.004210122395306826,
        "activation_cosine_similarity": 0.002321334322914481,
        "activation_magnitude_ratio": -0.00409039156511426,
        "activation_dot_product": -0.0029630884528160095,
        "encoder_gradient_cosine_similarity": -0.0013543220702558756,
        "encoder_gradient_l2_distance": -0.009860232472419739,
        "encoder_gradient_dot_product": 0.0022873710840940475,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01297613326460123,
        "input_gradient_dot_product": -0.004677534569054842
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.537329918510123,
      "val_r": 0.351163707356006,
      "n_iterations": 269,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0021509374491870403,
        "right_subspace_overlap_bottom_k": 0.0018643452785909176,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.024103112518787384,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.017252828925848007,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.00219882489182055,
        "singular_value_overlap": -0.016546916216611862,
        "subspace_overlap": 0.00323116360232234,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0020421750377863646,
        "activation_cosine_similarity": -0.0010964109096676111,
        "activation_magnitude_ratio": -0.005013597197830677,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008674830198287964,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0014979124534875154,
        "input_gradient_l2_distance": -0.01757928915321827,
        "input_gradient_dot_product": -0.005983153358101845
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5899216415369546,
      "val_r": 0.25577508889577494,
      "n_iterations": 279,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.005119509529322386,
        "interaction_matrix_overlap_top_k": -0.003921323921531439,
        "interaction_matrix_overlap_bottom_k": 0.033923979848623276,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.001030385261401534,
        "stable_rank": -0.0017580670537427068,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.001090093282982707,
        "layerwise_effective_rank": -0.003051054896786809,
        "layerwise_effective_rank_mergeability_score": 0.0034089256078004837,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02207309380173683,
        "task_vector_dot_product": 0.0015252488665282726,
        "weight_space_angle": -0.0010877965250983834,
        "task_vector_magnitude_ratio": -0.0025957778561860323,
        "singular_value_overlap": -0.012887339107692242,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0028888797387480736,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0032698067370802164,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0033198785968124866,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.002239546738564968,
        "input_gradient_l2_distance": -0.025030171498656273,
        "input_gradient_dot_product": -0.0037472674157470465
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6838945455079937,
      "val_r": 0.5112175347497101,
      "n_iterations": 203,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010056748986244202,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.00546695152297616,
        "interaction_matrix_overlap_bottom_k": 0.00290966616012156,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0016769955400377512,
        "singular_value_ratio": 0.0016369145596399903,
        "layerwise_effective_rank": -0.005200548563152552,
        "layerwise_effective_rank_mergeability_score": 0.002872541779652238,
        "task_vector_cosine_similarity": -0.0019700180273503065,
        "task_vector_l2_distance": 0.0028844575863331556,
        "task_vector_dot_product": 0.002867761068046093,
        "weight_space_angle": 0.003683126997202635,
        "task_vector_magnitude_ratio": 0.0011206995695829391,
        "singular_value_overlap": -0.0064803361892700195,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.01218353770673275,
        "activation_l2_distance": -0.001341237802989781,
        "activation_cosine_similarity": 0.003647384699434042,
        "activation_magnitude_ratio": -0.004091414622962475,
        "activation_dot_product": 0.01262359507381916,
        "encoder_gradient_cosine_similarity": 0.005603737663477659,
        "encoder_gradient_l2_distance": -0.02500222809612751,
        "encoder_gradient_dot_product": 0.002329519484192133,
        "input_gradient_cosine_similarity": 0.0018601412884891033,
        "input_gradient_l2_distance": -0.026760468259453773,
        "input_gradient_dot_product": -0.012541331350803375
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5652565426005156,
      "val_r": 0.31527383063792014,
      "n_iterations": 403,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0020150139462202787,
        "right_subspace_overlap_bottom_k": 0.008963054046034813,
        "interaction_matrix_overlap_top_k": -0.0040805526077747345,
        "interaction_matrix_overlap_bottom_k": 0.030609438195824623,
        "effective_rank": -0.0013794098049402237,
        "effective_rank_mergeability_score": 0.0015369127504527569,
        "stable_rank": -0.001384578994475305,
        "spectral_gap": 0.002211470389738679,
        "singular_value_ratio": -0.002374752424657345,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.001478362362831831,
        "task_vector_l2_distance": -0.02827039733529091,
        "task_vector_dot_product": -0.005171515047550201,
        "weight_space_angle": -0.0016093741869553924,
        "task_vector_magnitude_ratio": -0.00828215479850769,
        "singular_value_overlap": -0.024967461824417114,
        "subspace_overlap": 0.0012753440532833338,
        "right_subspace_overlap": -0.0016376128187403083,
        "activation_l2_distance": -0.0020427724812179804,
        "activation_cosine_similarity": -0.0020553567446768284,
        "activation_magnitude_ratio": -0.00540532311424613,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.0023229029029607773,
        "encoder_gradient_l2_distance": -0.015815820544958115,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0026216718833893538,
        "input_gradient_l2_distance": -0.031559545546770096,
        "input_gradient_dot_product": 0.001143971923738718
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}