{
  "aggregate_metrics": {
    "train_r": 0.5010419584391026,
    "train_p": 2.1049678397900135e-204,
    "val_r": 0.41113439539811647,
    "val_p": 4.922731681055768e-16
  },
  "per_fold_stats": {
    "train_r_mean": 0.752321260744318,
    "train_r_std": 0.08611818002791922,
    "val_r_mean": 0.6339301494701856,
    "val_r_std": 0.15659200054753425,
    "n_nonzero_mean": 20.65,
    "n_nonzero_std": 3.539420856580918
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.016838764771819115,
    "right_subspace_overlap_bottom_k": -0.03344161808490753,
    "interaction_matrix_overlap_top_k": 0.0006631833384744823,
    "interaction_matrix_overlap_bottom_k": 0.0016059704357758164,
    "effective_rank": 0.00019854112179018557,
    "effective_rank_mergeability_score": -2.7453818347566994e-06,
    "stable_rank": -0.00030911111389286816,
    "spectral_gap": -0.0004718953277915716,
    "singular_value_ratio": 0.0001685471652308479,
    "layerwise_effective_rank": -0.0017879221122711897,
    "layerwise_effective_rank_mergeability_score": 0.0015745064010843635,
    "task_vector_cosine_similarity": -0.0009089120430871844,
    "task_vector_l2_distance": -0.0009186530369333923,
    "task_vector_dot_product": -0.0009273619507439435,
    "weight_space_angle": 0.0013329994399100542,
    "task_vector_magnitude_ratio": 5.407524440670386e-05,
    "singular_value_overlap": 0.011035998351871967,
    "subspace_overlap": -0.0033972300589084625,
    "right_subspace_overlap": 0.018766013905405998,
    "activation_l2_distance": -0.0019305748865008354,
    "activation_cosine_similarity": 0.025048842653632164,
    "activation_magnitude_ratio": -0.0037035257555544376,
    "activation_dot_product": 0.0052244109101593494,
    "encoder_gradient_cosine_similarity": 0.004467204678803682,
    "encoder_gradient_l2_distance": -0.045101098716259,
    "encoder_gradient_dot_product": 3.6587203794624656e-05,
    "input_gradient_cosine_similarity": 0.0019958908669650555,
    "input_gradient_l2_distance": -0.025163492187857628,
    "input_gradient_dot_product": -0.003373838495463133
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.007814173586666584,
    "right_subspace_overlap_bottom_k": 0.00837439950555563,
    "interaction_matrix_overlap_top_k": 0.0035862051881849766,
    "interaction_matrix_overlap_bottom_k": 0.005865986924618483,
    "effective_rank": 0.0010545362019911408,
    "effective_rank_mergeability_score": 0.0011886422289535403,
    "stable_rank": 0.0009012783411890268,
    "spectral_gap": 0.0013872174313291907,
    "singular_value_ratio": 0.0016944174421951175,
    "layerwise_effective_rank": 0.002283903071656823,
    "layerwise_effective_rank_mergeability_score": 0.0024355240166187286,
    "task_vector_cosine_similarity": 0.004853693302720785,
    "task_vector_l2_distance": 0.005135438870638609,
    "task_vector_dot_product": 0.0038649989292025566,
    "weight_space_angle": 0.004675930831581354,
    "task_vector_magnitude_ratio": 0.0014355108141899109,
    "singular_value_overlap": 0.008168491534888744,
    "subspace_overlap": 0.00390060106292367,
    "right_subspace_overlap": 0.008578899316489697,
    "activation_l2_distance": 0.005541592836380005,
    "activation_cosine_similarity": 0.010923724621534348,
    "activation_magnitude_ratio": 0.0036924208980053663,
    "activation_dot_product": 0.017628155648708344,
    "encoder_gradient_cosine_similarity": 0.002315024845302105,
    "encoder_gradient_l2_distance": 0.024775903671979904,
    "encoder_gradient_dot_product": 0.0013508412521332502,
    "input_gradient_cosine_similarity": 0.0034671705216169357,
    "input_gradient_l2_distance": 0.01853375881910324,
    "input_gradient_dot_product": 0.002965184859931469
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 1.0,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.6,
    "interaction_matrix_overlap_bottom_k": 0.7,
    "effective_rank": 0.4,
    "effective_rank_mergeability_score": 0.3,
    "stable_rank": 0.25,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.35,
    "layerwise_effective_rank": 0.7,
    "layerwise_effective_rank_mergeability_score": 0.6,
    "task_vector_cosine_similarity": 0.65,
    "task_vector_l2_distance": 0.85,
    "task_vector_dot_product": 0.7,
    "weight_space_angle": 0.7,
    "task_vector_magnitude_ratio": 0.3,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.7,
    "right_subspace_overlap": 0.95,
    "activation_l2_distance": 1.0,
    "activation_cosine_similarity": 0.95,
    "activation_magnitude_ratio": 0.9,
    "activation_dot_product": 0.9,
    "encoder_gradient_cosine_similarity": 0.95,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.4,
    "input_gradient_cosine_similarity": 0.6,
    "input_gradient_l2_distance": 0.95,
    "input_gradient_dot_product": 0.9
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7699896473857593,
      "val_r": 0.5799781924450426,
      "n_iterations": 265,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009458289481699467,
        "right_subspace_overlap_bottom_k": -0.028161603957414627,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.008411013521254063,
        "effective_rank": 0.0010897618485614657,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.00110152130946517,
        "singular_value_ratio": 0.0013218398671597242,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0036956341937184334,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.003327519865706563,
        "weight_space_angle": 0.002803863026201725,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005551824811846018,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.018300892785191536,
        "activation_l2_distance": -0.001755217439495027,
        "activation_cosine_similarity": 0.022714775055646896,
        "activation_magnitude_ratio": -0.006470154505223036,
        "activation_dot_product": -0.0013992944732308388,
        "encoder_gradient_cosine_similarity": 0.0023605653550475836,
        "encoder_gradient_l2_distance": -0.036477409303188324,
        "encoder_gradient_dot_product": -0.0013625819701701403,
        "input_gradient_cosine_similarity": 0.001425337279215455,
        "input_gradient_l2_distance": -0.01933632791042328,
        "input_gradient_dot_product": -0.005019378382712603
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7574870530118776,
      "val_r": 0.7987633220869355,
      "n_iterations": 238,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.018910448998212814,
        "right_subspace_overlap_bottom_k": -0.04376354068517685,
        "interaction_matrix_overlap_top_k": 0.0017886771820485592,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012975451536476612,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0010801150929182768,
        "layerwise_effective_rank_mergeability_score": 0.0014919156674295664,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.008682291023433208,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.012224880047142506,
        "subspace_overlap": 0.0017077355878427625,
        "right_subspace_overlap": 0.031250081956386566,
        "activation_l2_distance": -0.002373032970353961,
        "activation_cosine_similarity": 0.044331181794404984,
        "activation_magnitude_ratio": -0.0067260717041790485,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0016687549650669098,
        "encoder_gradient_l2_distance": -0.07878421992063522,
        "encoder_gradient_dot_product": 0.0017164071323350072,
        "input_gradient_cosine_similarity": 0.0011870920425280929,
        "input_gradient_l2_distance": -0.043496642261743546,
        "input_gradient_dot_product": -0.002694809576496482
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.3853961407627781,
      "val_r": 0.5187495553419181,
      "n_iterations": 334,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003445527981966734,
        "right_subspace_overlap_bottom_k": -0.021755153313279152,
        "interaction_matrix_overlap_top_k": -0.002066396176815033,
        "interaction_matrix_overlap_bottom_k": 0.007947539910674095,
        "effective_rank": -0.0017405026592314243,
        "effective_rank_mergeability_score": 0.002821630798280239,
        "stable_rank": -0.0033020121045410633,
        "spectral_gap": 0.00323827238753438,
        "singular_value_ratio": -0.003761706408113241,
        "layerwise_effective_rank": -0.005884931422770023,
        "layerwise_effective_rank_mergeability_score": 0.007271526847034693,
        "task_vector_cosine_similarity": 0.001942767295986414,
        "task_vector_l2_distance": -0.0035582315176725388,
        "task_vector_dot_product": -0.0017129969783127308,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0033873848151415586,
        "singular_value_overlap": 0.0013192819897085428,
        "subspace_overlap": -0.010041161440312862,
        "right_subspace_overlap": 0.019280163571238518,
        "activation_l2_distance": 0.006053382530808449,
        "activation_cosine_similarity": 0.01895803213119507,
        "activation_magnitude_ratio": -0.0027459925040602684,
        "activation_dot_product": -0.003311010543256998,
        "encoder_gradient_cosine_similarity": 0.0012640038039535284,
        "encoder_gradient_l2_distance": -0.009722634218633175,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010558000765740871,
        "input_gradient_dot_product": -0.004233225714415312
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7481528857964836,
      "val_r": 0.7074417502887235,
      "n_iterations": 237,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01774042472243309,
        "right_subspace_overlap_bottom_k": -0.03539867699146271,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0013218207750469446,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.002483920892700553,
        "singular_value_ratio": 0.0022011350374668837,
        "layerwise_effective_rank": -0.003591397078707814,
        "layerwise_effective_rank_mergeability_score": 0.004399905446916819,
        "task_vector_cosine_similarity": -0.007364509627223015,
        "task_vector_l2_distance": -0.003194466233253479,
        "task_vector_dot_product": -0.002682430436834693,
        "weight_space_angle": 0.003110448829829693,
        "task_vector_magnitude_ratio": 0.0020502840634435415,
        "singular_value_overlap": 0.01635180599987507,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.03279640153050423,
        "activation_l2_distance": -0.0029436710756272078,
        "activation_cosine_similarity": 0.022302042692899704,
        "activation_magnitude_ratio": -0.005385689903050661,
        "activation_dot_product": 0.013732915744185448,
        "encoder_gradient_cosine_similarity": 0.00527321919798851,
        "encoder_gradient_l2_distance": -0.07222457975149155,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.035447895526885986,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7700296953466099,
      "val_r": 0.7702020608264998,
      "n_iterations": 301,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.025250134989619255,
        "right_subspace_overlap_bottom_k": -0.037915438413619995,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0016190198948606849,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.004528526682406664,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.007797308266162872,
        "subspace_overlap": -0.001056171371601522,
        "right_subspace_overlap": 0.01631624810397625,
        "activation_l2_distance": 0.0017123720608651638,
        "activation_cosine_similarity": 0.03802676126360893,
        "activation_magnitude_ratio": -0.0030600139871239662,
        "activation_dot_product": -0.004804419353604317,
        "encoder_gradient_cosine_similarity": 0.0059656379744410515,
        "encoder_gradient_l2_distance": -0.05292496457695961,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.003832542337477207,
        "input_gradient_l2_distance": -0.01567360758781433,
        "input_gradient_dot_product": -0.00411309115588665
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7688812261420489,
      "val_r": 0.7127934638401079,
      "n_iterations": 230,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014735122211277485,
        "right_subspace_overlap_bottom_k": -0.03034292347729206,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0019040919141843915,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003665668424218893,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.009948953054845333,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.009709886275231838,
        "activation_l2_distance": 0.00170164555311203,
        "activation_cosine_similarity": 0.03893569856882095,
        "activation_magnitude_ratio": -0.0015289245638996363,
        "activation_dot_product": -0.0021684470120817423,
        "encoder_gradient_cosine_similarity": 0.0071237413212656975,
        "encoder_gradient_l2_distance": -0.04895995184779167,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0029169730842113495,
        "input_gradient_l2_distance": 0.0,
        "input_gradient_dot_product": -0.004003751557320356
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.777837874977334,
      "val_r": 0.6971400075830951,
      "n_iterations": 332,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01652803272008896,
        "right_subspace_overlap_bottom_k": -0.034826721996068954,
        "interaction_matrix_overlap_top_k": -0.0014636680716648698,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0013163771945983171,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0011134515516459942,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.00540512427687645,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.00922065693885088,
        "subspace_overlap": -0.0031616846099495888,
        "right_subspace_overlap": 0.010241164825856686,
        "activation_l2_distance": -0.004509790800511837,
        "activation_cosine_similarity": 0.023357780650258064,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.006740889977663755,
        "encoder_gradient_cosine_similarity": 0.007190857082605362,
        "encoder_gradient_l2_distance": -0.041836585849523544,
        "encoder_gradient_dot_product": 0.0016327484045177698,
        "input_gradient_cosine_similarity": -0.0012281432282179594,
        "input_gradient_l2_distance": -0.00986893568187952,
        "input_gradient_dot_product": -0.004431502427905798
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7521300998933087,
      "val_r": 0.30633858711265183,
      "n_iterations": 325,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.024706749245524406,
        "right_subspace_overlap_bottom_k": -0.04130015894770622,
        "interaction_matrix_overlap_top_k": 0.004378859885036945,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0016879650065675378,
        "spectral_gap": -0.002276569837704301,
        "singular_value_ratio": 0.0020978753454983234,
        "layerwise_effective_rank": -0.0012999260798096657,
        "layerwise_effective_rank_mergeability_score": 0.003095767227932811,
        "task_vector_cosine_similarity": -0.010330046527087688,
        "task_vector_l2_distance": -0.005766547285020351,
        "task_vector_dot_product": -0.0010093064047396183,
        "weight_space_angle": 0.013612581416964531,
        "task_vector_magnitude_ratio": 0.0016548134153708816,
        "singular_value_overlap": 0.015735667198896408,
        "subspace_overlap": -0.0036057245451956987,
        "right_subspace_overlap": 0.023340782150626183,
        "activation_l2_distance": -0.012665909714996815,
        "activation_cosine_similarity": 0.023121746256947517,
        "activation_magnitude_ratio": -0.004828827455639839,
        "activation_dot_product": 0.010300792753696442,
        "encoder_gradient_cosine_similarity": 0.008952133357524872,
        "encoder_gradient_l2_distance": -0.060683511197566986,
        "encoder_gradient_dot_product": -0.001314123161137104,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.035480331629514694,
        "input_gradient_dot_product": 0.0034090224653482437
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7955667767898834,
      "val_r": 0.3923637846421173,
      "n_iterations": 206,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.016810249537229538,
        "right_subspace_overlap_bottom_k": -0.04246967285871506,
        "interaction_matrix_overlap_top_k": 0.0015013858210295439,
        "interaction_matrix_overlap_bottom_k": 0.002833412028849125,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0062496354803442955,
        "layerwise_effective_rank_mergeability_score": 0.004748047795146704,
        "task_vector_cosine_similarity": -0.004264909774065018,
        "task_vector_l2_distance": 0.00285366945900023,
        "task_vector_dot_product": -0.003675454296171665,
        "weight_space_angle": 0.005386087112128735,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.006119220517575741,
        "subspace_overlap": -0.003088128287345171,
        "right_subspace_overlap": 0.028825024142861366,
        "activation_l2_distance": 0.002221824135631323,
        "activation_cosine_similarity": 0.036967236548662186,
        "activation_magnitude_ratio": -0.0016112590674310923,
        "activation_dot_product": -0.011099272407591343,
        "encoder_gradient_cosine_similarity": 0.004312921315431595,
        "encoder_gradient_l2_distance": -0.04483401030302048,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0030746881384402514,
        "input_gradient_l2_distance": -0.02720894105732441,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7727587499479239,
      "val_r": 0.487065514281008,
      "n_iterations": 272,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.019984371960163116,
        "right_subspace_overlap_bottom_k": -0.04011644050478935,
        "interaction_matrix_overlap_top_k": -0.0023367092944681644,
        "interaction_matrix_overlap_bottom_k": 0.0018517692806199193,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0024628823157399893,
        "layerwise_effective_rank_mergeability_score": 0.002025397727265954,
        "task_vector_cosine_similarity": -0.0012137687299400568,
        "task_vector_l2_distance": 0.0034156842157244682,
        "task_vector_dot_product": -0.002285826951265335,
        "weight_space_angle": 0.0018608069512993097,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005782742984592915,
        "subspace_overlap": -0.003669386263936758,
        "right_subspace_overlap": 0.02758338861167431,
        "activation_l2_distance": -0.002256612293422222,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0023958240635693073,
        "activation_dot_product": -0.011141635477542877,
        "encoder_gradient_cosine_similarity": 0.008709906600415707,
        "encoder_gradient_l2_distance": -0.029338205233216286,
        "encoder_gradient_dot_product": 0.0020928680896759033,
        "input_gradient_cosine_similarity": 0.0028339792042970657,
        "input_gradient_l2_distance": -0.012166459113359451,
        "input_gradient_dot_product": -0.005157559644430876
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7301184331546079,
      "val_r": 0.25862772222240205,
      "n_iterations": 299,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01715259626507759,
        "right_subspace_overlap_bottom_k": -0.039290912449359894,
        "interaction_matrix_overlap_top_k": 0.013889574445784092,
        "interaction_matrix_overlap_bottom_k": -0.015916956588625908,
        "effective_rank": 0.00251792068593204,
        "effective_rank_mergeability_score": -0.0024565281346440315,
        "stable_rank": 0.0012178472243249416,
        "spectral_gap": -0.003962845541536808,
        "singular_value_ratio": 0.005096020642668009,
        "layerwise_effective_rank": 0.0038171173073351383,
        "layerwise_effective_rank_mergeability_score": -0.004018776118755341,
        "task_vector_cosine_similarity": 0.010956551879644394,
        "task_vector_l2_distance": 0.0017388213891535997,
        "task_vector_dot_product": 0.01108989492058754,
        "weight_space_angle": -0.007483424618840218,
        "task_vector_magnitude_ratio": 0.004093156661838293,
        "singular_value_overlap": 0.03578398376703262,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.029772071167826653,
        "activation_l2_distance": -0.013580786995589733,
        "activation_cosine_similarity": 0.03936244174838066,
        "activation_magnitude_ratio": -0.015746166929602623,
        "activation_dot_product": 0.06318000704050064,
        "encoder_gradient_cosine_similarity": 0.0037774285301566124,
        "encoder_gradient_l2_distance": -0.06372082233428955,
        "encoder_gradient_dot_product": -0.0018120144959539175,
        "input_gradient_cosine_similarity": 0.01575412228703499,
        "input_gradient_l2_distance": -0.06607828289270401,
        "input_gradient_dot_product": -0.0029854571912437677
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7902835126372765,
      "val_r": 0.777250283278053,
      "n_iterations": 313,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01937883347272873,
        "right_subspace_overlap_bottom_k": -0.03175074979662895,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.005493140313774347,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.005082754418253899,
        "task_vector_l2_distance": 0.0031673195771872997,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.005415224004536867,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0066698272712528706,
        "subspace_overlap": -0.004569229204207659,
        "right_subspace_overlap": 0.01145471353083849,
        "activation_l2_distance": 0.005708540789783001,
        "activation_cosine_similarity": 0.023651478812098503,
        "activation_magnitude_ratio": -0.0011451388709247112,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0031342064030468464,
        "encoder_gradient_l2_distance": -0.028747960925102234,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0027810262981802225,
        "input_gradient_l2_distance": -0.009198595769703388,
        "input_gradient_dot_product": -0.0031709184404462576
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7813442537646849,
      "val_r": 0.7924472706242145,
      "n_iterations": 256,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00801519863307476,
        "right_subspace_overlap_bottom_k": -0.02952522225677967,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.008381418883800507,
        "effective_rank": 0.0016642697155475616,
        "effective_rank_mergeability_score": -0.0018833121284842491,
        "stable_rank": 0.0,
        "spectral_gap": -0.0011811184231191874,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0020822277292609215,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0052402438595891,
        "task_vector_l2_distance": 0.006571640260517597,
        "task_vector_dot_product": -0.0015809042379260063,
        "weight_space_angle": -0.0028230296447873116,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.006444264203310013,
        "subspace_overlap": -0.008459323085844517,
        "right_subspace_overlap": 0.01198591198772192,
        "activation_l2_distance": 0.005098126363009214,
        "activation_cosine_similarity": 0.02287730947136879,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.006165016908198595,
        "encoder_gradient_cosine_similarity": 0.003597631584852934,
        "encoder_gradient_l2_distance": -0.016167806461453438,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.003022926626726985,
        "input_gradient_l2_distance": -0.013594754971563816,
        "input_gradient_dot_product": -0.0031757564283907413
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7581641910110042,
      "val_r": 0.7471406549191938,
      "n_iterations": 331,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.032977424561977386,
        "right_subspace_overlap_bottom_k": -0.041553813964128494,
        "interaction_matrix_overlap_top_k": -0.004144025035202503,
        "interaction_matrix_overlap_bottom_k": 0.0010645636357367039,
        "effective_rank": -0.001415084581822157,
        "effective_rank_mergeability_score": 0.0019958443008363247,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003334588138386607,
        "layerwise_effective_rank_mergeability_score": 0.003556896699592471,
        "task_vector_cosine_similarity": 0.001034163637086749,
        "task_vector_l2_distance": -0.004824329633265734,
        "task_vector_dot_product": -0.010473182424902916,
        "weight_space_angle": -0.0010060666827484965,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.028279505670070648,
        "subspace_overlap": -0.004485655575990677,
        "right_subspace_overlap": 0.02136920392513275,
        "activation_l2_distance": -0.009927925653755665,
        "activation_cosine_similarity": 0.029602648690342903,
        "activation_magnitude_ratio": -0.003732345998287201,
        "activation_dot_product": 0.03295544162392616,
        "encoder_gradient_cosine_similarity": 0.0036632211413234472,
        "encoder_gradient_l2_distance": -0.11015128344297409,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0023607423063367605,
        "input_gradient_l2_distance": -0.06227148696780205,
        "input_gradient_dot_product": -0.0017406935803592205
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7909086906614332,
      "val_r": 0.7663144715869367,
      "n_iterations": 331,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014456156641244888,
        "right_subspace_overlap_bottom_k": -0.04071410745382309,
        "interaction_matrix_overlap_top_k": -0.001501791994087398,
        "interaction_matrix_overlap_bottom_k": 0.0066762324422597885,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.007213900331407785,
        "task_vector_dot_product": -0.0044606951996684074,
        "weight_space_angle": 0.001412629964761436,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.007375389337539673,
        "subspace_overlap": -0.0038580521941184998,
        "right_subspace_overlap": 0.021209755912423134,
        "activation_l2_distance": -0.0024864748120307922,
        "activation_cosine_similarity": 0.026096312329173088,
        "activation_magnitude_ratio": -0.0024268818087875843,
        "activation_dot_product": -0.0071185571141541,
        "encoder_gradient_cosine_similarity": 0.0053602298721671104,
        "encoder_gradient_l2_distance": -0.03431965410709381,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01037103682756424,
        "input_gradient_dot_product": -0.006339618936181068
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.8122893319572404,
      "val_r": 0.6453293748598998,
      "n_iterations": 415,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0067427316680550575,
        "right_subspace_overlap_bottom_k": -0.02111029252409935,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0036922406870871782,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.00182614685036242,
        "task_vector_dot_product": -0.0014412426389753819,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0011357280891388655,
        "singular_value_overlap": 0.007783778011798859,
        "subspace_overlap": -0.012146273627877235,
        "right_subspace_overlap": 0.020579468458890915,
        "activation_l2_distance": 0.0014891638420522213,
        "activation_cosine_similarity": 0.014592590741813183,
        "activation_magnitude_ratio": -0.0024656709283590317,
        "activation_dot_product": -0.004043205175548792,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.015380941331386566,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.009007161483168602,
        "input_gradient_dot_product": -0.0034401905722916126
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7706920495167346,
      "val_r": 0.6872071147393481,
      "n_iterations": 248,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.024107038974761963,
        "right_subspace_overlap_bottom_k": -0.023981530219316483,
        "interaction_matrix_overlap_top_k": -0.0019114884780719876,
        "interaction_matrix_overlap_bottom_k": 0.010237151756882668,
        "effective_rank": 0.0019708899781107903,
        "effective_rank_mergeability_score": -0.0020813981536775827,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0012688061688095331,
        "task_vector_l2_distance": 0.0014270446263253689,
        "task_vector_dot_product": -0.0019605965353548527,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0030077723786234856,
        "subspace_overlap": -0.010394120588898659,
        "right_subspace_overlap": 0.005891080480068922,
        "activation_l2_distance": 0.003929058089852333,
        "activation_cosine_similarity": 0.01510532945394516,
        "activation_magnitude_ratio": -0.0033655755687505007,
        "activation_dot_product": -0.0013728669146075845,
        "encoder_gradient_cosine_similarity": 0.003101370297372341,
        "encoder_gradient_l2_distance": -0.012691045179963112,
        "encoder_gradient_dot_product": 0.003022804856300354,
        "input_gradient_cosine_similarity": 0.0019565292168408632,
        "input_gradient_l2_distance": -0.011797493323683739,
        "input_gradient_dot_product": -0.004037077073007822
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7626192729885066,
      "val_r": 0.6819787927745028,
      "n_iterations": 316,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.019609056413173676,
        "right_subspace_overlap_bottom_k": -0.0379418283700943,
        "interaction_matrix_overlap_top_k": 0.00298659922555089,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0013872624840587378,
        "layerwise_effective_rank_mergeability_score": 0.0014100667322054505,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.005598884541541338,
        "task_vector_dot_product": 0.0015775234205648303,
        "weight_space_angle": -0.0034674236085265875,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.014646326191723347,
        "subspace_overlap": -0.001117429113946855,
        "right_subspace_overlap": 0.016854288056492805,
        "activation_l2_distance": -0.0026464895345270634,
        "activation_cosine_similarity": 0.033790137618780136,
        "activation_magnitude_ratio": -0.0049504442140460014,
        "activation_dot_product": 0.0022860169410705566,
        "encoder_gradient_cosine_similarity": 0.004753071814775467,
        "encoder_gradient_l2_distance": -0.06017278879880905,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.05234226584434509,
        "input_gradient_dot_product": -0.009859222918748856
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7624767674650563,
      "val_r": 0.6734807086167082,
      "n_iterations": 240,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.025597117841243744,
        "right_subspace_overlap_bottom_k": -0.035206861793994904,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.00221051974222064,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0011125473538413644,
        "spectral_gap": -0.0016702029388397932,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.004095255397260189,
        "layerwise_effective_rank_mergeability_score": 0.001610070699825883,
        "task_vector_cosine_similarity": -0.01009437721222639,
        "task_vector_l2_distance": -0.0030742392409592867,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.00883825495839119,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.01476062461733818,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.018559826537966728,
        "activation_l2_distance": -0.005012974143028259,
        "activation_cosine_similarity": 0.01842840015888214,
        "activation_magnitude_ratio": -0.0022925150115042925,
        "activation_dot_product": 0.014143076725304127,
        "encoder_gradient_cosine_similarity": 0.003390370635315776,
        "encoder_gradient_l2_distance": -0.0586981326341629,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03544384986162186,
        "input_gradient_dot_product": 0.0014320391928777099
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7892985616758073,
      "val_r": 0.6779903573343538,
      "n_iterations": 288,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0011697730515152216,
        "right_subspace_overlap_bottom_k": -0.011706741526722908,
        "interaction_matrix_overlap_top_k": 0.0021426493767648935,
        "interaction_matrix_overlap_bottom_k": -0.008245693519711494,
        "effective_rank": -0.0014382535591721535,
        "effective_rank_mergeability_score": 0.0015488556819036603,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0022678442765027285,
        "layerwise_effective_rank": -0.002822648733854294,
        "layerwise_effective_rank_mergeability_score": 0.004785857629030943,
        "task_vector_cosine_similarity": 0.0034252272453159094,
        "task_vector_l2_distance": -0.013641128316521645,
        "task_vector_dot_product": 0.003395499661564827,
        "weight_space_angle": -0.005528485402464867,
        "task_vector_magnitude_ratio": -0.002193636493757367,
        "singular_value_overlap": 0.005916162393987179,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.006366726942360401,
        "activation_cosine_similarity": 0.008754981681704521,
        "activation_magnitude_ratio": -0.007984671741724014,
        "activation_dot_product": 0.027254583314061165,
        "encoder_gradient_cosine_similarity": 0.005744819529354572,
        "encoder_gradient_l2_distance": -0.02618548832833767,
        "encoder_gradient_dot_product": -0.0032443644013255835,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.023927811533212662,
        "input_gradient_dot_product": -0.007915576919913292
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.3,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}