{
  "aggregate_metrics": {
    "train_r": 0.3911569467644164,
    "train_p": 2.7801838480791395e-118,
    "val_r": -0.05378638247523405,
    "val_p": 0.3101717083869684
  },
  "per_fold_stats": {
    "train_r_mean": 0.6067059645344435,
    "train_r_std": 0.059091197810535755,
    "val_r_mean": 0.47831982843692933,
    "val_r_std": 0.16561817884569371,
    "n_nonzero_mean": 23.15,
    "n_nonzero_std": 3.004579837514723
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.00981130637228489,
    "right_subspace_overlap_bottom_k": -0.013489723205566406,
    "interaction_matrix_overlap_top_k": 0.000632117036730051,
    "interaction_matrix_overlap_bottom_k": 0.05698845908045769,
    "effective_rank": -0.0023472930770367384,
    "effective_rank_mergeability_score": 0.002166495192795992,
    "stable_rank": -0.002921773586422205,
    "spectral_gap": 0.000522012822329998,
    "singular_value_ratio": -0.0006755044450983405,
    "layerwise_effective_rank": -0.00040010566590353847,
    "layerwise_effective_rank_mergeability_score": 0.0007460342603735626,
    "task_vector_cosine_similarity": -0.0022719050757586956,
    "task_vector_l2_distance": -0.04810795933008194,
    "task_vector_dot_product": -0.002098564989864826,
    "weight_space_angle": 0.0023016647901386023,
    "task_vector_magnitude_ratio": -0.011253916658461094,
    "singular_value_overlap": -0.0339774489402771,
    "subspace_overlap": 0.008511914871633053,
    "right_subspace_overlap": 0.010036087594926357,
    "activation_l2_distance": 9.106225479627028e-05,
    "activation_cosine_similarity": 0.009381154552102089,
    "activation_magnitude_ratio": -0.008931493386626244,
    "activation_dot_product": 0.011531488038599491,
    "encoder_gradient_cosine_similarity": 0.005572055000811815,
    "encoder_gradient_l2_distance": -0.06421003490686417,
    "encoder_gradient_dot_product": 0.005697900895029306,
    "input_gradient_cosine_similarity": 0.003183626336976886,
    "input_gradient_l2_distance": -0.06095961481332779,
    "input_gradient_dot_product": -0.02310163527727127
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.013322144746780396,
    "right_subspace_overlap_bottom_k": 0.01761561445891857,
    "interaction_matrix_overlap_top_k": 0.01141596119850874,
    "interaction_matrix_overlap_bottom_k": 0.022986769676208496,
    "effective_rank": 0.0032653133384883404,
    "effective_rank_mergeability_score": 0.0022738156840205193,
    "stable_rank": 0.0036193944979459047,
    "spectral_gap": 0.001850150991231203,
    "singular_value_ratio": 0.001749534043483436,
    "layerwise_effective_rank": 0.004254015628248453,
    "layerwise_effective_rank_mergeability_score": 0.003520891536027193,
    "task_vector_cosine_similarity": 0.009062557481229305,
    "task_vector_l2_distance": 0.024330006912350655,
    "task_vector_dot_product": 0.010543761774897575,
    "weight_space_angle": 0.00911787897348404,
    "task_vector_magnitude_ratio": 0.006031245458871126,
    "singular_value_overlap": 0.0195195022970438,
    "subspace_overlap": 0.008922035805881023,
    "right_subspace_overlap": 0.01286387536674738,
    "activation_l2_distance": 0.010175001807510853,
    "activation_cosine_similarity": 0.011034545488655567,
    "activation_magnitude_ratio": 0.007011127192527056,
    "activation_dot_product": 0.025531131774187088,
    "encoder_gradient_cosine_similarity": 0.00718772504478693,
    "encoder_gradient_l2_distance": 0.038600217550992966,
    "encoder_gradient_dot_product": 0.006412499584257603,
    "input_gradient_cosine_similarity": 0.004397028591483831,
    "input_gradient_l2_distance": 0.03746887668967247,
    "input_gradient_dot_product": 0.020608363673090935
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.9,
    "right_subspace_overlap_bottom_k": 0.95,
    "interaction_matrix_overlap_top_k": 0.7,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.6,
    "effective_rank_mergeability_score": 0.65,
    "stable_rank": 0.6,
    "spectral_gap": 0.65,
    "singular_value_ratio": 0.5,
    "layerwise_effective_rank": 0.3,
    "layerwise_effective_rank_mergeability_score": 0.3,
    "task_vector_cosine_similarity": 0.7,
    "task_vector_l2_distance": 1.0,
    "task_vector_dot_product": 0.85,
    "weight_space_angle": 0.7,
    "task_vector_magnitude_ratio": 0.95,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.7,
    "right_subspace_overlap": 0.95,
    "activation_l2_distance": 0.85,
    "activation_cosine_similarity": 0.95,
    "activation_magnitude_ratio": 0.95,
    "activation_dot_product": 0.9,
    "encoder_gradient_cosine_similarity": 0.85,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.8,
    "input_gradient_cosine_similarity": 0.85,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 1.0
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6398428718802955,
      "val_r": 0.625189258635213,
      "n_iterations": 278,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0011107976315543056,
        "right_subspace_overlap_bottom_k": 0.008589335717260838,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.08726958930492401,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0038268868811428547,
        "stable_rank": 0.0,
        "spectral_gap": 0.0032725450582802296,
        "singular_value_ratio": -0.0032649007625877857,
        "layerwise_effective_rank": 0.012673968449234962,
        "layerwise_effective_rank_mergeability_score": -0.004728790372610092,
        "task_vector_cosine_similarity": -0.003011570777744055,
        "task_vector_l2_distance": -0.07513544708490372,
        "task_vector_dot_product": -0.011218334548175335,
        "weight_space_angle": 0.004182769916951656,
        "task_vector_magnitude_ratio": -0.020300354808568954,
        "singular_value_overlap": -0.059035900980234146,
        "subspace_overlap": 0.02354365773499012,
        "right_subspace_overlap": 0.0038467689882963896,
        "activation_l2_distance": 0.008914357051253319,
        "activation_cosine_similarity": 0.018960287794470787,
        "activation_magnitude_ratio": -0.020969416946172714,
        "activation_dot_product": 0.0023681744933128357,
        "encoder_gradient_cosine_similarity": 0.0010559405200183392,
        "encoder_gradient_l2_distance": -0.0834868848323822,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.06925777345895767,
        "input_gradient_dot_product": -0.026176419109106064
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6062433820910322,
      "val_r": 0.5269652117721659,
      "n_iterations": 214,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0034338454715907574,
        "right_subspace_overlap_bottom_k": -0.016718847677111626,
        "interaction_matrix_overlap_top_k": -0.0013427194207906723,
        "interaction_matrix_overlap_bottom_k": 0.05038980767130852,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0018441778374835849,
        "stable_rank": 0.0,
        "spectral_gap": -0.0017790067940950394,
        "singular_value_ratio": 0.0022365287877619267,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02947762981057167,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.01377051044255495,
        "singular_value_overlap": -0.018689801916480064,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0032757034059613943,
        "activation_l2_distance": 0.004876673221588135,
        "activation_cosine_similarity": 0.0029446410480886698,
        "activation_magnitude_ratio": -0.004253655672073364,
        "activation_dot_product": 0.008281907998025417,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.03605343773961067,
        "encoder_gradient_dot_product": 0.004793229978531599,
        "input_gradient_cosine_similarity": 0.0037995039019733667,
        "input_gradient_l2_distance": -0.028814662247896194,
        "input_gradient_dot_product": -0.00688762916252017
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6125844339039015,
      "val_r": 0.5258198139558772,
      "n_iterations": 376,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004178992006927729,
        "right_subspace_overlap_bottom_k": -0.01773279905319214,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.04536595195531845,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0021585715003311634,
        "singular_value_ratio": 0.0016282895812764764,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.024011921137571335,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.012498323805630207,
        "singular_value_overlap": -0.01799972914159298,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005474657751619816,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0014019202208146453,
        "activation_magnitude_ratio": -0.005678580142557621,
        "activation_dot_product": 0.004334168042987585,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.026540549471974373,
        "encoder_gradient_dot_product": 0.0021663750521838665,
        "input_gradient_cosine_similarity": 0.003697680775076151,
        "input_gradient_l2_distance": -0.02613353729248047,
        "input_gradient_dot_product": -0.00924925971776247
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5996668240326422,
      "val_r": 0.4579671147280855,
      "n_iterations": 258,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0052794599905610085,
        "right_subspace_overlap_bottom_k": -0.0072654676623642445,
        "interaction_matrix_overlap_top_k": -0.0013418326852843165,
        "interaction_matrix_overlap_bottom_k": 0.06921649724245071,
        "effective_rank": -0.0019787787459790707,
        "effective_rank_mergeability_score": 0.0022371397353708744,
        "stable_rank": -0.00125157053116709,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.05275386571884155,
        "task_vector_dot_product": 0.006237474735826254,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.017219865694642067,
        "singular_value_overlap": -0.03906045854091644,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0059138513170182705,
        "activation_l2_distance": 0.00510860001668334,
        "activation_cosine_similarity": 0.0024792838376015425,
        "activation_magnitude_ratio": -0.012976198457181454,
        "activation_dot_product": 0.01441480964422226,
        "encoder_gradient_cosine_similarity": 0.0029159903060644865,
        "encoder_gradient_l2_distance": -0.05195820331573486,
        "encoder_gradient_dot_product": 0.0016664748545736074,
        "input_gradient_cosine_similarity": 0.005915921181440353,
        "input_gradient_l2_distance": -0.04879796504974365,
        "input_gradient_dot_product": -0.016483644023537636
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6106349837778355,
      "val_r": 0.7105157638364187,
      "n_iterations": 458,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.026741672307252884,
        "right_subspace_overlap_bottom_k": -0.028193358331918716,
        "interaction_matrix_overlap_top_k": 0.013435512781143188,
        "interaction_matrix_overlap_bottom_k": 0.07799048721790314,
        "effective_rank": -0.003943503834307194,
        "effective_rank_mergeability_score": 0.002738300245255232,
        "stable_rank": -0.004991042427718639,
        "spectral_gap": 0.004635652527213097,
        "singular_value_ratio": -0.00532064912840724,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.01530864741653204,
        "task_vector_l2_distance": -0.07875968515872955,
        "task_vector_dot_product": -0.02497737482190132,
        "weight_space_angle": 0.015645360574126244,
        "task_vector_magnitude_ratio": -0.009070578962564468,
        "singular_value_overlap": -0.06627552211284637,
        "subspace_overlap": 0.015902256593108177,
        "right_subspace_overlap": 0.026677614077925682,
        "activation_l2_distance": -0.016524767503142357,
        "activation_cosine_similarity": 0.016840150579810143,
        "activation_magnitude_ratio": -0.004844036418944597,
        "activation_dot_product": -0.007376601919531822,
        "encoder_gradient_cosine_similarity": 0.0020709398668259382,
        "encoder_gradient_l2_distance": -0.10089460015296936,
        "encoder_gradient_dot_product": 0.01523846760392189,
        "input_gradient_cosine_similarity": 0.014624240808188915,
        "input_gradient_l2_distance": -0.11439503729343414,
        "input_gradient_dot_product": -0.05392727628350258
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6092990055969375,
      "val_r": 0.6868596364869748,
      "n_iterations": 420,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0034008468501269817,
        "interaction_matrix_overlap_top_k": 0.0021571277175098658,
        "interaction_matrix_overlap_bottom_k": 0.08245660364627838,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0027289472054690123,
        "singular_value_ratio": -0.0020415715407580137,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010568134021013975,
        "task_vector_l2_distance": -0.07655006647109985,
        "task_vector_dot_product": 0.007760824169963598,
        "weight_space_angle": -0.0023801608476787806,
        "task_vector_magnitude_ratio": -0.019951077178120613,
        "singular_value_overlap": -0.04943167790770531,
        "subspace_overlap": 0.0022104063536971807,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0010130270384252071,
        "activation_cosine_similarity": 0.007242802530527115,
        "activation_magnitude_ratio": -0.012894172221422195,
        "activation_dot_product": 0.013103948906064034,
        "encoder_gradient_cosine_similarity": 0.009087005630135536,
        "encoder_gradient_l2_distance": -0.07630158960819244,
        "encoder_gradient_dot_product": 0.0027565956115722656,
        "input_gradient_cosine_similarity": 0.0025834026746451855,
        "input_gradient_l2_distance": -0.04763578623533249,
        "input_gradient_dot_product": -0.023349478840827942
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.60336474064021,
      "val_r": 0.16603965936322065,
      "n_iterations": 309,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007004874292761087,
        "right_subspace_overlap_bottom_k": -0.003321294905617833,
        "interaction_matrix_overlap_top_k": 0.0014224023325368762,
        "interaction_matrix_overlap_bottom_k": 0.06340597569942474,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0018589487299323082,
        "stable_rank": -0.0019852707628160715,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0028577386401593685,
        "task_vector_l2_distance": -0.05382581055164337,
        "task_vector_dot_product": -0.01809101738035679,
        "weight_space_angle": 0.0023538446985185146,
        "task_vector_magnitude_ratio": -0.015321850776672363,
        "singular_value_overlap": -0.03431367501616478,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005979879759252071,
        "activation_l2_distance": -0.00706833228468895,
        "activation_cosine_similarity": 0.00919091422110796,
        "activation_magnitude_ratio": 0.0031077226158231497,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.006592004559934139,
        "encoder_gradient_l2_distance": -0.09211142361164093,
        "encoder_gradient_dot_product": 0.00991649180650711,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.06258735805749893,
        "input_gradient_dot_product": -0.02125726453959942
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5498470859714379,
      "val_r": 0.25550961608451206,
      "n_iterations": 306,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.012976303696632385,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": -0.001471338327974081,
        "interaction_matrix_overlap_bottom_k": 0.08889015763998032,
        "effective_rank": -0.0011192288948222995,
        "effective_rank_mergeability_score": 0.0011211292585358024,
        "stable_rank": 0.0,
        "spectral_gap": 0.0015595178119838238,
        "singular_value_ratio": -0.001632897648960352,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.09230254590511322,
        "task_vector_dot_product": -0.012363167479634285,
        "weight_space_angle": 0.0015733762411400676,
        "task_vector_magnitude_ratio": -0.018510568886995316,
        "singular_value_overlap": -0.054430898278951645,
        "subspace_overlap": 0.01668565720319748,
        "right_subspace_overlap": 0.01026005856692791,
        "activation_l2_distance": 0.005376099143177271,
        "activation_cosine_similarity": 0.01615457981824875,
        "activation_magnitude_ratio": -0.01547282561659813,
        "activation_dot_product": 0.005073400214314461,
        "encoder_gradient_cosine_similarity": 0.010760113596916199,
        "encoder_gradient_l2_distance": -0.09289952367544174,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.008284317329525948,
        "input_gradient_l2_distance": -0.04439061880111694,
        "input_gradient_dot_product": -0.0012164392974227667
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6143524939318445,
      "val_r": 0.35891399497258436,
      "n_iterations": 284,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.001732149627059698,
        "right_subspace_overlap_bottom_k": -0.021865949034690857,
        "interaction_matrix_overlap_top_k": -0.0011141316499561071,
        "interaction_matrix_overlap_bottom_k": 0.06040804460644722,
        "effective_rank": -0.012149283662438393,
        "effective_rank_mergeability_score": 0.0052102431654930115,
        "stable_rank": -0.001934948144480586,
        "spectral_gap": -0.0010021049529314041,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.03728557750582695,
        "task_vector_dot_product": 0.003642738563939929,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.02699718251824379,
        "subspace_overlap": 0.0016683894209563732,
        "right_subspace_overlap": 0.0038043824024498463,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.008993136696517467,
        "activation_magnitude_ratio": -0.007685475051403046,
        "activation_dot_product": 0.0015404806472361088,
        "encoder_gradient_cosine_similarity": 0.006451454944908619,
        "encoder_gradient_l2_distance": -0.03396864980459213,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.001158884959295392,
        "input_gradient_l2_distance": -0.04575560614466667,
        "input_gradient_dot_product": -0.016484055668115616
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.601876379555681,
      "val_r": 0.2590121672205592,
      "n_iterations": 428,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02526537887752056,
        "right_subspace_overlap_bottom_k": -0.01524187158793211,
        "interaction_matrix_overlap_top_k": 0.00195913203060627,
        "interaction_matrix_overlap_bottom_k": 0.06370864063501358,
        "effective_rank": -0.002411983907222748,
        "effective_rank_mergeability_score": 0.002448116894811392,
        "stable_rank": -0.004377003759145737,
        "spectral_gap": 0.0017064145067706704,
        "singular_value_ratio": -0.0016588084399700165,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.014597427099943161,
        "task_vector_l2_distance": -0.06199321523308754,
        "task_vector_dot_product": -0.01794395223259926,
        "weight_space_angle": 0.009931963868439198,
        "task_vector_magnitude_ratio": -0.010486888699233532,
        "singular_value_overlap": -0.05387226864695549,
        "subspace_overlap": 0.02610713243484497,
        "right_subspace_overlap": 0.021433861926198006,
        "activation_l2_distance": -0.02433599904179573,
        "activation_cosine_similarity": -0.020052608102560043,
        "activation_magnitude_ratio": -0.00959934014827013,
        "activation_dot_product": -0.018088290467858315,
        "encoder_gradient_cosine_similarity": 0.010495977476239204,
        "encoder_gradient_l2_distance": -0.08403213322162628,
        "encoder_gradient_dot_product": 0.01923760026693344,
        "input_gradient_cosine_similarity": -0.007466324605047703,
        "input_gradient_l2_distance": -0.0972338393330574,
        "input_gradient_dot_product": -0.027171682566404343
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.47500096919053436,
      "val_r": 0.2585524924171298,
      "n_iterations": 215,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.018023476004600525,
        "interaction_matrix_overlap_top_k": -0.0026581408455967903,
        "interaction_matrix_overlap_bottom_k": 0.03594452887773514,
        "effective_rank": -0.005217256024479866,
        "effective_rank_mergeability_score": 0.0037434077821671963,
        "stable_rank": -0.012658790685236454,
        "spectral_gap": 0.0016286354511976242,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0016768146306276321,
        "task_vector_cosine_similarity": -0.0025359478313475847,
        "task_vector_l2_distance": -0.02039831317961216,
        "task_vector_dot_product": 0.0013341712765395641,
        "weight_space_angle": 0.003936382941901684,
        "task_vector_magnitude_ratio": -0.00706237368285656,
        "singular_value_overlap": -0.016453273594379425,
        "subspace_overlap": 0.0019849601667374372,
        "right_subspace_overlap": 0.0017743106000125408,
        "activation_l2_distance": -0.003076755441725254,
        "activation_cosine_similarity": 0.007587703410536051,
        "activation_magnitude_ratio": -0.0072723859921097755,
        "activation_dot_product": 0.007152827922254801,
        "encoder_gradient_cosine_similarity": 0.002074931049719453,
        "encoder_gradient_l2_distance": -0.02472735196352005,
        "encoder_gradient_dot_product": 0.0027652704156935215,
        "input_gradient_cosine_similarity": 0.0053379167802631855,
        "input_gradient_l2_distance": -0.022810395807027817,
        "input_gradient_dot_product": -0.012545057572424412
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5882665165797416,
      "val_r": 0.4926088523899991,
      "n_iterations": 359,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002080457052215934,
        "right_subspace_overlap_bottom_k": -0.00555296940729022,
        "interaction_matrix_overlap_top_k": 0.004739504307508469,
        "interaction_matrix_overlap_bottom_k": 0.07013123482465744,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.004088812042027712,
        "task_vector_l2_distance": -0.05654565244913101,
        "task_vector_dot_product": 0.0013837250880897045,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.012574865482747555,
        "singular_value_overlap": -0.041550688445568085,
        "subspace_overlap": 0.009631596505641937,
        "right_subspace_overlap": 0.0017074828501790762,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.014673592522740364,
        "activation_magnitude_ratio": -0.014526525512337685,
        "activation_dot_product": 0.00422904547303915,
        "encoder_gradient_cosine_similarity": 0.0011060707038268447,
        "encoder_gradient_l2_distance": -0.07432599365711212,
        "encoder_gradient_dot_product": 0.0023841536603868008,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0680486336350441,
        "input_gradient_dot_product": -0.017847873270511627
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5114904016426023,
      "val_r": 0.534033909096285,
      "n_iterations": 571,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014457223936915398,
        "right_subspace_overlap_bottom_k": -0.031479138880968094,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.05238265544176102,
        "effective_rank": -0.0011614044196903706,
        "effective_rank_mergeability_score": 0.0011085058795288205,
        "stable_rank": -0.0017524058930575848,
        "spectral_gap": -0.0016460366314277053,
        "singular_value_ratio": 0.0014103814028203487,
        "layerwise_effective_rank": -0.0019128703279420733,
        "layerwise_effective_rank_mergeability_score": 0.0011174161918461323,
        "task_vector_cosine_similarity": 0.02992950938642025,
        "task_vector_l2_distance": -0.013590855523943901,
        "task_vector_dot_product": 0.010801976546645164,
        "weight_space_angle": -0.029850659891963005,
        "task_vector_magnitude_ratio": -0.015122683718800545,
        "singular_value_overlap": -0.029834870249032974,
        "subspace_overlap": 0.012292344123125076,
        "right_subspace_overlap": 0.014029677025973797,
        "activation_l2_distance": -0.004342599306255579,
        "activation_cosine_similarity": 0.022684941068291664,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.020044924691319466,
        "encoder_gradient_cosine_similarity": 0.022492483258247375,
        "encoder_gradient_l2_distance": -0.044156499207019806,
        "encoder_gradient_dot_product": 0.01953602209687233,
        "input_gradient_cosine_similarity": 0.006513036787509918,
        "input_gradient_l2_distance": -0.058810461312532425,
        "input_gradient_dot_product": -0.04850469157099724
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5980818461482318,
      "val_r": 0.7417257851836587,
      "n_iterations": 303,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01716560870409012,
        "right_subspace_overlap_bottom_k": 0.0011459961533546448,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.07668864727020264,
        "effective_rank": -0.003160810796543956,
        "effective_rank_mergeability_score": 0.004017347935587168,
        "stable_rank": -0.004798769485205412,
        "spectral_gap": 0.0019097782205790281,
        "singular_value_ratio": -0.002823619870468974,
        "layerwise_effective_rank": -0.001769729540683329,
        "layerwise_effective_rank_mergeability_score": 0.0021860874257981777,
        "task_vector_cosine_similarity": -0.007483283989131451,
        "task_vector_l2_distance": -0.08827012032270432,
        "task_vector_dot_product": 0.001496435608714819,
        "weight_space_angle": 0.006364630069583654,
        "task_vector_magnitude_ratio": -0.01349311601370573,
        "singular_value_overlap": -0.069808728992939,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.020792830735445023,
        "activation_l2_distance": 0.003031593980267644,
        "activation_cosine_similarity": 0.015879681333899498,
        "activation_magnitude_ratio": -0.015187614597380161,
        "activation_dot_product": 0.00881805457174778,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.10542257875204086,
        "encoder_gradient_dot_product": 0.0012868113117292523,
        "input_gradient_cosine_similarity": 0.0037429826334118843,
        "input_gradient_l2_distance": -0.10166376084089279,
        "input_gradient_dot_product": -0.03137421980500221
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5694912503427552,
      "val_r": 0.6259882450917377,
      "n_iterations": 402,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01580440066754818,
        "right_subspace_overlap_bottom_k": -0.022355925291776657,
        "interaction_matrix_overlap_top_k": 0.0019255302613601089,
        "interaction_matrix_overlap_bottom_k": 0.06142405793070793,
        "effective_rank": -0.003067178186029196,
        "effective_rank_mergeability_score": 0.004275206942111254,
        "stable_rank": -0.0061149136163294315,
        "spectral_gap": 0.002137152710929513,
        "singular_value_ratio": -0.0020428416319191456,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.010221735574305058,
        "task_vector_l2_distance": -0.0545949786901474,
        "task_vector_dot_product": -0.015369292348623276,
        "weight_space_angle": 0.013394743204116821,
        "task_vector_magnitude_ratio": -0.010981089435517788,
        "singular_value_overlap": -0.04221964627504349,
        "subspace_overlap": 0.025631308555603027,
        "right_subspace_overlap": 0.014165224507451057,
        "activation_l2_distance": -0.0135352723300457,
        "activation_cosine_similarity": 0.010230723768472672,
        "activation_magnitude_ratio": -0.010379559360444546,
        "activation_dot_product": -0.005848342552781105,
        "encoder_gradient_cosine_similarity": 0.007263366598635912,
        "encoder_gradient_l2_distance": -0.06661257147789001,
        "encoder_gradient_dot_product": 0.0073528168722987175,
        "input_gradient_cosine_similarity": -0.0017617419362068176,
        "input_gradient_l2_distance": -0.07639626413583755,
        "input_gradient_dot_product": -0.01703449711203575
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6349248016447244,
      "val_r": 0.3373369226632869,
      "n_iterations": 296,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009119822643697262,
        "right_subspace_overlap_bottom_k": -0.005601134616881609,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.03843885660171509,
        "effective_rank": -0.0010250138584524393,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0016335448017343879,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0011276446748524904,
        "task_vector_l2_distance": -0.03999275341629982,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0013224183348938823,
        "task_vector_magnitude_ratio": -0.013806847855448723,
        "singular_value_overlap": -0.012539427727460861,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005867294035851955,
        "activation_l2_distance": 0.020368188619613647,
        "activation_cosine_similarity": 0.0181301049888134,
        "activation_magnitude_ratio": -0.00931365042924881,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.0011059476528316736,
        "encoder_gradient_l2_distance": -0.040849827229976654,
        "encoder_gradient_dot_product": 0.004928359761834145,
        "input_gradient_cosine_similarity": 0.00249181198887527,
        "input_gradient_l2_distance": -0.035366181284189224,
        "input_gradient_dot_product": -0.01724444329738617
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6191315343595165,
      "val_r": 0.4995954533471319,
      "n_iterations": 414,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.003992356825619936,
        "right_subspace_overlap_bottom_k": -0.014021914452314377,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.053443361073732376,
        "effective_rank": -0.0018743412801995873,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.006262331269681454,
        "spectral_gap": -0.0025526678655296564,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.002307548886165023,
        "task_vector_l2_distance": -0.03894898667931557,
        "task_vector_dot_product": -0.0012897669803351164,
        "weight_space_angle": 0.005133720580488443,
        "task_vector_magnitude_ratio": -0.005542089696973562,
        "singular_value_overlap": -0.02117946743965149,
        "subspace_overlap": 0.004696819931268692,
        "right_subspace_overlap": 0.005104591138660908,
        "activation_l2_distance": 0.011546609923243523,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.005755561403930187,
        "activation_dot_product": 0.02114071696996689,
        "encoder_gradient_cosine_similarity": 0.004699856974184513,
        "encoder_gradient_l2_distance": -0.030420931056141853,
        "encoder_gradient_dot_product": 0.0025832222308963537,
        "input_gradient_cosine_similarity": 0.005184592213481665,
        "input_gradient_l2_distance": -0.032604608684778214,
        "input_gradient_dot_product": -0.012654099613428116
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6307269821214702,
      "val_r": 0.3936374657579433,
      "n_iterations": 232,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01318141259253025,
        "right_subspace_overlap_bottom_k": -0.005714092403650284,
        "interaction_matrix_overlap_top_k": -0.03360503166913986,
        "interaction_matrix_overlap_bottom_k": 0.044671572744846344,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.006030018907040358,
        "layerwise_effective_rank_mergeability_score": 0.003290654392912984,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02739427238702774,
        "task_vector_dot_product": 0.006722790654748678,
        "weight_space_angle": -0.00101682567037642,
        "task_vector_magnitude_ratio": -0.0019110373686999083,
        "singular_value_overlap": -0.009355245158076286,
        "subspace_overlap": 0.004788586404174566,
        "right_subspace_overlap": 0.010328021831810474,
        "activation_l2_distance": 0.00871803518384695,
        "activation_cosine_similarity": 0.0030371907632797956,
        "activation_magnitude_ratio": -0.0017179199494421482,
        "activation_dot_product": 0.012723029591143131,
        "encoder_gradient_cosine_similarity": 0.001237828517332673,
        "encoder_gradient_l2_distance": -0.0191821102052927,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.005117275286465883,
        "input_gradient_l2_distance": -0.032712869346141815,
        "input_gradient_dot_product": -0.00690149562433362
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7813040628345558,
      "val_r": 0.6834877156845268,
      "n_iterations": 295,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.05009404197335243,
        "right_subspace_overlap_bottom_k": -0.0739716961979866,
        "interaction_matrix_overlap_top_k": 0.03484414890408516,
        "interaction_matrix_overlap_bottom_k": -0.012612705118954182,
        "effective_rank": -0.009837080724537373,
        "effective_rank_mergeability_score": 0.008900491520762444,
        "stable_rank": -0.01066605094820261,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.012597007676959038,
        "layerwise_effective_rank_mergeability_score": 0.01473213266581297,
        "task_vector_cosine_similarity": -0.013892977498471737,
        "task_vector_l2_distance": -0.008146004751324654,
        "task_vector_dot_product": 0.01461591012775898,
        "weight_space_angle": 0.015441731549799442,
        "task_vector_magnitude_ratio": 0.0010814907727763057,
        "singular_value_overlap": -0.003473130986094475,
        "subspace_overlap": 0.01165000256150961,
        "right_subspace_overlap": 0.052488282322883606,
        "activation_l2_distance": -0.007778314873576164,
        "activation_cosine_similarity": 0.03411860391497612,
        "activation_magnitude_ratio": -0.024559319019317627,
        "activation_dot_product": 0.11408679187297821,
        "encoder_gradient_cosine_similarity": 0.025608891621232033,
        "encoder_gradient_l2_distance": -0.17950789630413055,
        "encoder_gradient_dot_product": 0.0157770998775959,
        "input_gradient_cosine_similarity": 0.0011674156412482262,
        "input_gradient_l2_distance": -0.17898070812225342,
        "input_gradient_dot_product": -0.09242300689220428
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6779887244429215,
      "val_r": 0.4266374900512776,
      "n_iterations": 419,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.017392661422491074,
        "right_subspace_overlap_bottom_k": 0.004129296168684959,
        "interaction_matrix_overlap_top_k": -0.006307822186499834,
        "interaction_matrix_overlap_bottom_k": 0.030155297368764877,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0016423675697296858,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010089143179357052,
        "task_vector_l2_distance": -0.03218135982751846,
        "task_vector_dot_product": 0.005285570863634348,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.008535710163414478,
        "singular_value_overlap": -0.013027417473495007,
        "subspace_overlap": 0.01344518456608057,
        "right_subspace_overlap": -0.012202730402350426,
        "activation_l2_distance": 0.009530100971460342,
        "activation_cosine_similarity": -0.002874555066227913,
        "activation_magnitude_ratio": 0.0013486386742442846,
        "activation_dot_product": 0.02463071048259735,
        "encoder_gradient_cosine_similarity": -0.0013658103998750448,
        "encoder_gradient_l2_distance": -0.020748136565089226,
        "encoder_gradient_dot_product": 0.0015690349973738194,
        "input_gradient_cosine_similarity": 0.005599379539489746,
        "input_gradient_l2_distance": -0.02679615095257759,
        "input_gradient_dot_product": -0.0033001680858433247
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}