{
  "aggregate_metrics": {
    "train_r": 0.4076342900004527,
    "train_p": 2.988332951371494e-129,
    "val_r": 0.02161719615394042,
    "val_p": 0.6835425789417914
  },
  "per_fold_stats": {
    "train_r_mean": 0.5605880627094761,
    "train_r_std": 0.06690443177279888,
    "val_r_mean": 0.48507219615164,
    "val_r_std": 0.1431777763376688,
    "n_nonzero_mean": 17.2,
    "n_nonzero_std": 3.4727510708370675
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0024517152924090624,
    "right_subspace_overlap_bottom_k": 0.0011023199185729027,
    "interaction_matrix_overlap_top_k": 0.0005715301958844066,
    "interaction_matrix_overlap_bottom_k": 0.00665674451738596,
    "effective_rank": -0.0003917944268323481,
    "effective_rank_mergeability_score": 0.0006482239114120603,
    "stable_rank": -0.000497723463922739,
    "spectral_gap": 0.0009271434391848743,
    "singular_value_ratio": -0.0005744005320593715,
    "layerwise_effective_rank": -0.0003914072585757822,
    "layerwise_effective_rank_mergeability_score": 0.00028989012935198843,
    "task_vector_cosine_similarity": 6.849004421383142e-07,
    "task_vector_l2_distance": -0.010161987505853176,
    "task_vector_dot_product": 0.0001600960677023977,
    "weight_space_angle": 0.0002686892985366285,
    "task_vector_magnitude_ratio": -0.0011814769823104143,
    "singular_value_overlap": -0.0070360624231398106,
    "subspace_overlap": 0.0006428906926885247,
    "right_subspace_overlap": 0.0022568649146705866,
    "activation_l2_distance": -0.0019223010167479515,
    "activation_cosine_similarity": 0.0023802744690328836,
    "activation_magnitude_ratio": -0.0020703317131847143,
    "activation_dot_product": 0.0019410375971347094,
    "encoder_gradient_cosine_similarity": 0.000936667260248214,
    "encoder_gradient_l2_distance": -0.01443017739802599,
    "encoder_gradient_dot_product": 0.0009406910394318402,
    "input_gradient_cosine_similarity": 0.00030315364710986614,
    "input_gradient_l2_distance": -0.01589168794453144,
    "input_gradient_dot_product": -0.0022949837148189545
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.003450439078733325,
    "right_subspace_overlap_bottom_k": 0.003987317439168692,
    "interaction_matrix_overlap_top_k": 0.0013945965329185128,
    "interaction_matrix_overlap_bottom_k": 0.003686317475512624,
    "effective_rank": 0.0007770971860736609,
    "effective_rank_mergeability_score": 0.001033373293466866,
    "stable_rank": 0.0007990191224962473,
    "spectral_gap": 0.001166299101896584,
    "singular_value_ratio": 0.000983147881925106,
    "layerwise_effective_rank": 0.0007139832014217973,
    "layerwise_effective_rank_mergeability_score": 0.0006005637696944177,
    "task_vector_cosine_similarity": 0.0018047416815534234,
    "task_vector_l2_distance": 0.00466288672760129,
    "task_vector_dot_product": 0.001785371219739318,
    "weight_space_angle": 0.0017509470926597714,
    "task_vector_magnitude_ratio": 0.0009245088440366089,
    "singular_value_overlap": 0.0033157519064843655,
    "subspace_overlap": 0.0017471250612288713,
    "right_subspace_overlap": 0.0024133932311087847,
    "activation_l2_distance": 0.00220052944496274,
    "activation_cosine_similarity": 0.00226463726721704,
    "activation_magnitude_ratio": 0.0017515908693894744,
    "activation_dot_product": 0.003333326196298003,
    "encoder_gradient_cosine_similarity": 0.0014453900512307882,
    "encoder_gradient_l2_distance": 0.005029983352869749,
    "encoder_gradient_dot_product": 0.00113813322968781,
    "input_gradient_cosine_similarity": 0.0010957496706396341,
    "input_gradient_l2_distance": 0.006893472280353308,
    "input_gradient_dot_product": 0.0019585806876420975
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.55,
    "right_subspace_overlap_bottom_k": 0.7,
    "interaction_matrix_overlap_top_k": 0.35,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.35,
    "effective_rank_mergeability_score": 0.35,
    "stable_rank": 0.3,
    "spectral_gap": 0.55,
    "singular_value_ratio": 0.4,
    "layerwise_effective_rank": 0.25,
    "layerwise_effective_rank_mergeability_score": 0.2,
    "task_vector_cosine_similarity": 0.3,
    "task_vector_l2_distance": 0.9,
    "task_vector_dot_product": 0.5,
    "weight_space_angle": 0.5,
    "task_vector_magnitude_ratio": 0.7,
    "singular_value_overlap": 0.95,
    "subspace_overlap": 0.55,
    "right_subspace_overlap": 0.8,
    "activation_l2_distance": 0.7,
    "activation_cosine_similarity": 0.8,
    "activation_magnitude_ratio": 0.75,
    "activation_dot_product": 0.6,
    "encoder_gradient_cosine_similarity": 0.6,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.6,
    "input_gradient_cosine_similarity": 0.3,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.65
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5873199214786576,
      "val_r": 0.6469197090989678,
      "n_iterations": 340,
      "n_nonzero_coefficients": 10,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.013768425211310387,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.011165727861225605,
        "task_vector_dot_product": 0.0017798678018152714,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.007848395965993404,
        "subspace_overlap": 0.002525290008634329,
        "right_subspace_overlap": 0.0018686328548938036,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0027649058029055595,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011905275285243988,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.011340068653225899,
        "input_gradient_dot_product": -0.004528702702373266
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5164957390027166,
      "val_r": 0.5212738097592381,
      "n_iterations": 384,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007465125061571598,
        "right_subspace_overlap_bottom_k": -0.002267077099531889,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.00591712212190032,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.002855525352060795,
        "singular_value_ratio": -0.0010507404804229736,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0017936022486537695,
        "task_vector_l2_distance": -0.00986732728779316,
        "task_vector_dot_product": -0.004076141864061356,
        "weight_space_angle": 0.0022398349829018116,
        "task_vector_magnitude_ratio": -0.0017085947329178452,
        "singular_value_overlap": -0.011377790942788124,
        "subspace_overlap": -0.003499262034893036,
        "right_subspace_overlap": 0.0022040512412786484,
        "activation_l2_distance": -0.003984573297202587,
        "activation_cosine_similarity": 0.006113119889050722,
        "activation_magnitude_ratio": -0.00485537713393569,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.0011986595345661044,
        "encoder_gradient_l2_distance": -0.02789941243827343,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0338900201022625,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.564702564886449,
      "val_r": 0.5404793484185039,
      "n_iterations": 293,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0036848075687885284,
        "right_subspace_overlap_bottom_k": 0.002193686319515109,
        "interaction_matrix_overlap_top_k": 0.0026576484087854624,
        "interaction_matrix_overlap_bottom_k": 0.006104892585426569,
        "effective_rank": -0.0012347509618848562,
        "effective_rank_mergeability_score": 0.001390696270391345,
        "stable_rank": -0.0022632889449596405,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0014813675079494715,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010040554217994213,
        "task_vector_dot_product": -0.0010371205862611532,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0019250897457823157,
        "singular_value_overlap": -0.009513987228274345,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.001571783795952797,
        "activation_l2_distance": -0.003888342995196581,
        "activation_cosine_similarity": 0.001911381259560585,
        "activation_magnitude_ratio": -0.005120354704558849,
        "activation_dot_product": 0.0016503814840689301,
        "encoder_gradient_cosine_similarity": 0.0017462018877267838,
        "encoder_gradient_l2_distance": -0.011465143412351608,
        "encoder_gradient_dot_product": 0.0017742780037224293,
        "input_gradient_cosine_similarity": 0.002087798435240984,
        "input_gradient_l2_distance": -0.013237693347036839,
        "input_gradient_dot_product": -0.0031177345663309097
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5830747535856372,
      "val_r": 0.4988095791707083,
      "n_iterations": 266,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006084047723561525,
        "right_subspace_overlap_bottom_k": 0.004276257008314133,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.00792190432548523,
        "effective_rank": -0.0012014805106446147,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0014958708779886365,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0011044745333492756,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012623465619981289,
        "task_vector_dot_product": 0.0014510734472423792,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001044062664732337,
        "singular_value_overlap": -0.009201682172715664,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.002054906217381358,
        "activation_l2_distance": 0.0011141751892864704,
        "activation_cosine_similarity": 0.002508314559236169,
        "activation_magnitude_ratio": -0.0034801550209522247,
        "activation_dot_product": 0.002027785172685981,
        "encoder_gradient_cosine_similarity": 0.0016397279687225819,
        "encoder_gradient_l2_distance": -0.014073065482079983,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.018065812066197395,
        "input_gradient_dot_product": -0.004868708085268736
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5933284082436407,
      "val_r": 0.48976277040506294,
      "n_iterations": 320,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0019200219539925456,
        "right_subspace_overlap_bottom_k": 0.006012754514813423,
        "interaction_matrix_overlap_top_k": -0.001369044533930719,
        "interaction_matrix_overlap_bottom_k": 0.014687025919556618,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.020057756453752518,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.001723847002722323,
        "task_vector_magnitude_ratio": -0.0016636487562209368,
        "singular_value_overlap": -0.013547364622354507,
        "subspace_overlap": -0.0014261328615248203,
        "right_subspace_overlap": -0.002058687387034297,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.00554652139544487,
        "activation_dot_product": 0.0014314533909782767,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011591996066272259,
        "encoder_gradient_dot_product": 0.002637523226439953,
        "input_gradient_cosine_similarity": 0.0029455730691552162,
        "input_gradient_l2_distance": -0.0193453598767519,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5849186696456639,
      "val_r": 0.7238606087084734,
      "n_iterations": 246,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0028339065611362457,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.009383495897054672,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0013326520565897226,
        "singular_value_ratio": -0.0016376555431634188,
        "layerwise_effective_rank": -0.0014425343833863735,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.014650802128016949,
        "task_vector_dot_product": 0.0019338539568707347,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001100885565392673,
        "singular_value_overlap": -0.010236764326691628,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0030682003125548363,
        "activation_l2_distance": -0.005278217606246471,
        "activation_cosine_similarity": 0.0019160587107762694,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.016366202384233475,
        "encoder_gradient_dot_product": 0.002147065242752433,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.016764679923653603,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.564865782564603,
      "val_r": 0.286499298896675,
      "n_iterations": 301,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.002277478575706482,
        "interaction_matrix_overlap_bottom_k": 0.0072657265700399876,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0012388823088258505,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0017248571384698153,
        "task_vector_l2_distance": -0.006494789384305477,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0014637152198702097,
        "singular_value_overlap": -0.002996477298438549,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0011333914007991552,
        "activation_l2_distance": -0.0013374215923249722,
        "activation_cosine_similarity": 0.0026028817519545555,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0011137713445350528,
        "encoder_gradient_l2_distance": -0.010992911644279957,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.007690551690757275,
        "input_gradient_dot_product": -0.001456861151382327
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4543204630275329,
      "val_r": 0.29625210436222593,
      "n_iterations": 320,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.006601434201002121,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.006429703906178474,
        "effective_rank": 0.001144637819379568,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0010338732972741127,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012374759651720524,
        "task_vector_dot_product": 0.001852322369813919,
        "weight_space_angle": 0.0010183167178183794,
        "task_vector_magnitude_ratio": -0.0011693473206833005,
        "singular_value_overlap": -0.004788472317159176,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0015948107466101646,
        "activation_cosine_similarity": -0.0016025581862777472,
        "activation_magnitude_ratio": -0.0023082029074430466,
        "activation_dot_product": 0.003692477708682418,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.012560774572193623,
        "encoder_gradient_dot_product": 0.0013028817484155297,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005592679139226675,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5733315384742722,
      "val_r": 0.5542828075704419,
      "n_iterations": 248,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0042280880734324455,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.007078502792865038,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0022616686765104532,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012212523259222507,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010921789798885584,
        "task_vector_magnitude_ratio": -0.0010941758519038558,
        "singular_value_overlap": -0.0057786074467003345,
        "subspace_overlap": 0.0012766649015247822,
        "right_subspace_overlap": 0.001687570009380579,
        "activation_l2_distance": -0.002693211892619729,
        "activation_cosine_similarity": 0.0023438623175024986,
        "activation_magnitude_ratio": -0.0016914841253310442,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.011467237025499344,
        "encoder_gradient_dot_product": 0.0017061287071555853,
        "input_gradient_cosine_similarity": 0.001667299889959395,
        "input_gradient_l2_distance": -0.014964237809181213,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5563973412857499,
      "val_r": 0.4481628938128986,
      "n_iterations": 281,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0027557010762393475,
        "right_subspace_overlap_bottom_k": 0.0010383558692410588,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.00681322580203414,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0010617355583235621,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010676106438040733,
        "task_vector_dot_product": -0.002779340837150812,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0014437673380598426,
        "singular_value_overlap": -0.009828702546656132,
        "subspace_overlap": 0.0013421783223748207,
        "right_subspace_overlap": 0.0035419510677456856,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0010780820157378912,
        "activation_magnitude_ratio": -0.0013866735389456153,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.02108681946992874,
        "encoder_gradient_dot_product": 0.0010548296850174665,
        "input_gradient_cosine_similarity": 0.0010276816319674253,
        "input_gradient_l2_distance": -0.026212627068161964,
        "input_gradient_dot_product": -0.0016966145485639572
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.46574721809474734,
      "val_r": 0.2356411157044241,
      "n_iterations": 182,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0028347643092274666,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.006359940394759178,
        "effective_rank": -0.0019187191501259804,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0022496175952255726,
        "singular_value_ratio": -0.001438220962882042,
        "layerwise_effective_rank": -0.0012421014253050089,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.00793678592890501,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010529900901019573,
        "task_vector_magnitude_ratio": -0.001514430157840252,
        "singular_value_overlap": -0.0031352443620562553,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0014916106592863798,
        "activation_l2_distance": -0.003680958179756999,
        "activation_cosine_similarity": 0.0014167793560773134,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0017778455512598157,
        "encoder_gradient_cosine_similarity": -0.0011461273534223437,
        "encoder_gradient_l2_distance": -0.008166652172803879,
        "encoder_gradient_dot_product": 0.0020675905980169773,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.005293450318276882,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5502957500580045,
      "val_r": 0.5046937481153649,
      "n_iterations": 383,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0027888319455087185,
        "right_subspace_overlap_bottom_k": -0.0015926191117614508,
        "interaction_matrix_overlap_top_k": -0.0010699727572500706,
        "interaction_matrix_overlap_bottom_k": 0.0064287325367331505,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0014674321282655,
        "spectral_gap": 0.0021199905313551426,
        "singular_value_ratio": -0.0014083784772083163,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0020560859702527523,
        "task_vector_l2_distance": -0.006613853387534618,
        "task_vector_dot_product": -0.002286122180521488,
        "weight_space_angle": 0.003128283191472292,
        "task_vector_magnitude_ratio": -0.0015112558612599969,
        "singular_value_overlap": -0.006815006956458092,
        "subspace_overlap": 0.004512857645750046,
        "right_subspace_overlap": 0.001353265717625618,
        "activation_l2_distance": -0.0013487073592841625,
        "activation_cosine_similarity": 0.003192978911101818,
        "activation_magnitude_ratio": -0.0011467286385595798,
        "activation_dot_product": 0.0014781320933252573,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.014505538158118725,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.014006896875798702,
        "input_gradient_dot_product": -0.0033537759445607662
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.45220454570206337,
      "val_r": 0.3779973450048288,
      "n_iterations": 234,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0014720647595822811,
        "interaction_matrix_overlap_bottom_k": 0.003175221849232912,
        "effective_rank": -0.001534485025331378,
        "effective_rank_mergeability_score": 0.0038375570438802242,
        "stable_rank": 0.0,
        "spectral_gap": 0.0019733719527721405,
        "singular_value_ratio": -0.002880288753658533,
        "layerwise_effective_rank": -0.0022758152335882187,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.005375674460083246,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0024997477885335684,
        "weight_space_angle": -0.0058027044869959354,
        "task_vector_magnitude_ratio": -0.0033239852637052536,
        "singular_value_overlap": -0.007441715802997351,
        "subspace_overlap": 0.002215270884335041,
        "right_subspace_overlap": 0.003722522174939513,
        "activation_l2_distance": -0.005921541713178158,
        "activation_cosine_similarity": 0.0070512136444449425,
        "activation_magnitude_ratio": -0.0018164190696552396,
        "activation_dot_product": 0.004188144579529762,
        "encoder_gradient_cosine_similarity": 0.004165479447692633,
        "encoder_gradient_l2_distance": -0.017367620021104813,
        "encoder_gradient_dot_product": 0.0024083489552140236,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.018774284049868584,
        "input_gradient_dot_product": -0.005179013591259718
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5763953381915536,
      "val_r": 0.7279711791167848,
      "n_iterations": 292,
      "n_nonzero_coefficients": 11,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0028394286055117846,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.007163072936236858,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012238183990120888,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.001018791226670146,
        "layerwise_effective_rank_mergeability_score": 0.0012049797223880887,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01023052353411913,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.005628833081573248,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.003900852520018816,
        "encoder_gradient_cosine_similarity": 0.002098141238093376,
        "encoder_gradient_l2_distance": -0.011542834341526031,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.011953148059546947,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5124438908853232,
      "val_r": 0.5937393119347972,
      "n_iterations": 250,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0038059097714722157,
        "right_subspace_overlap_bottom_k": -0.0011719728354364634,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.005063754040747881,
        "effective_rank": -0.0013785870978608727,
        "effective_rank_mergeability_score": 0.0019493956351652741,
        "stable_rank": -0.0022022516932338476,
        "spectral_gap": 0.0020132786594331264,
        "singular_value_ratio": -0.0016690475167706609,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.013565653003752232,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.002406755927950144,
        "singular_value_overlap": -0.0076529295183718204,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0028076551388949156,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.00471105333417654,
        "activation_magnitude_ratio": -0.0019074635347351432,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013818087056279182,
        "encoder_gradient_dot_product": 0.0026323425117880106,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01746547222137451,
        "input_gradient_dot_product": -0.004698914475739002
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5457654205902205,
      "val_r": 0.33988524412527676,
      "n_iterations": 267,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011357590556144714,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.004005898255854845,
        "interaction_matrix_overlap_bottom_k": 0.0017089378088712692,
        "effective_rank": -0.0017125033773481846,
        "effective_rank_mergeability_score": 0.001278341980651021,
        "stable_rank": 0.0,
        "spectral_gap": 0.0018580014584586024,
        "singular_value_ratio": -0.00243755173869431,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01010213978588581,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0022598279174417257,
        "singular_value_overlap": -0.0030868700705468655,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.006810326594859362,
        "activation_l2_distance": -0.0016392710385844111,
        "activation_cosine_similarity": 0.004275770392268896,
        "activation_magnitude_ratio": -0.0010565274860709906,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.004173284862190485,
        "encoder_gradient_l2_distance": -0.013950249180197716,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01194679830223322,
        "input_gradient_dot_product": -0.004802321549504995
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.557201682215107,
      "val_r": 0.3590863912756767,
      "n_iterations": 211,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.001235250849276781,
        "right_subspace_overlap_bottom_k": 0.005669973324984312,
        "interaction_matrix_overlap_top_k": 0.0034565303940325975,
        "interaction_matrix_overlap_bottom_k": 0.001392120961099863,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.011323951184749603,
        "task_vector_dot_product": 0.003863781224936247,
        "weight_space_angle": -0.0019522388465702534,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.008655470795929432,
        "subspace_overlap": 0.001963779330253601,
        "right_subspace_overlap": 0.00544344587251544,
        "activation_l2_distance": -0.002442318247631192,
        "activation_cosine_similarity": 0.001610838109627366,
        "activation_magnitude_ratio": -0.0036900269333273172,
        "activation_dot_product": 0.0027053379453718662,
        "encoder_gradient_cosine_similarity": 0.0023907003924250603,
        "encoder_gradient_l2_distance": -0.011878348886966705,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.013555453158915043,
        "input_gradient_dot_product": -0.004454921931028366
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5828547140466014,
      "val_r": 0.3989728569330687,
      "n_iterations": 367,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.010127485729753971,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.001703982474282384,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.00689023407176137,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.003411875804886222,
        "subspace_overlap": 0.0015527609502896667,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0011071815388277173,
        "activation_dot_product": -0.0014217328280210495,
        "encoder_gradient_cosine_similarity": 0.0011261459439992905,
        "encoder_gradient_l2_distance": -0.005775080528110266,
        "encoder_gradient_dot_product": 0.001344044809229672,
        "input_gradient_cosine_similarity": 0.0011158839333802462,
        "input_gradient_l2_distance": -0.011656379327178001,
        "input_gradient_dot_product": -0.002736027119681239
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7753170930563794,
      "val_r": 0.7094007403953708,
      "n_iterations": 197,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.008937631733715534,
        "right_subspace_overlap_bottom_k": -0.012247536331415176,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": -0.001444084569811821,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.001093695405870676,
        "spectral_gap": -0.0013174507766962051,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0018489026697352529,
        "layerwise_effective_rank_mergeability_score": 0.0020069805905222893,
        "task_vector_cosine_similarity": -0.004826750140637159,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0013016783632338047,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0011288031237199903,
        "right_subspace_overlap": 0.008436672389507294,
        "activation_l2_distance": -0.004564887378364801,
        "activation_cosine_similarity": 0.002239333000034094,
        "activation_magnitude_ratio": -0.0035286126658320427,
        "activation_dot_product": 0.01487582828849554,
        "encoder_gradient_cosine_similarity": 0.001352954306639731,
        "encoder_gradient_l2_distance": -0.022100983187556267,
        "encoder_gradient_dot_product": 0.0013398559531196952,
        "input_gradient_cosine_similarity": -0.0027811636682599783,
        "input_gradient_l2_distance": -0.020100565627217293,
        "input_gradient_dot_product": -0.002661824692040682
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6147804191546016,
      "val_r": 0.447753060224011,
      "n_iterations": 341,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.003636380657553673,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.007789672818034887,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.001007936429232359,
        "stable_rank": 0.0,
        "spectral_gap": 0.002900276333093643,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.001589604769833386,
        "task_vector_l2_distance": -0.016412781551480293,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0015716003254055977,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.009775055572390556,
        "subspace_overlap": 0.0035232086665928364,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.004375554155558348,
        "activation_cosine_similarity": 0.006236382760107517,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0025142482481896877,
        "encoder_gradient_cosine_similarity": 0.001271725632250309,
        "encoder_gradient_l2_distance": -0.020089320838451385,
        "encoder_gradient_dot_product": -0.0016010728431865573,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.025977591052651405,
        "input_gradient_dot_product": -0.0023442537058144808
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}