{
  "aggregate_metrics": {
    "train_r": 0.3917477808627931,
    "train_p": 1.1520125729793059e-118,
    "val_r": 0.23694319788887497,
    "val_p": 5.837310361483599e-06
  },
  "per_fold_stats": {
    "train_r_mean": 0.5854898891771219,
    "train_r_std": 0.05817213595727462,
    "val_r_mean": 0.43707050094559075,
    "val_r_std": 0.1592711518811142,
    "n_nonzero_mean": 19.95,
    "n_nonzero_std": 2.71062723368596
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.0037477246951311827,
    "right_subspace_overlap_bottom_k": 0.00231947167776525,
    "interaction_matrix_overlap_top_k": 0.00042551400838419795,
    "interaction_matrix_overlap_bottom_k": 0.015809424221515656,
    "effective_rank": -0.00041394858271814883,
    "effective_rank_mergeability_score": 0.0006149112014099956,
    "stable_rank": -0.0005335566820576787,
    "spectral_gap": 0.00036549632204696536,
    "singular_value_ratio": -0.0007274487870745361,
    "layerwise_effective_rank": 9.0822133643087e-05,
    "layerwise_effective_rank_mergeability_score": -4.189403171039885e-06,
    "task_vector_cosine_similarity": -7.505530811613426e-05,
    "task_vector_l2_distance": -0.01891893334686756,
    "task_vector_dot_product": -0.0022625583223998547,
    "weight_space_angle": 4.8540277930442244e-05,
    "task_vector_magnitude_ratio": -0.0030212069395929575,
    "singular_value_overlap": -0.012787980027496815,
    "subspace_overlap": 0.0018025061581283808,
    "right_subspace_overlap": 0.003992151003330946,
    "activation_l2_distance": -0.0013381324242800474,
    "activation_cosine_similarity": 0.0043684314005076885,
    "activation_magnitude_ratio": -0.002516301814466715,
    "activation_dot_product": 0.002063130959868431,
    "encoder_gradient_cosine_similarity": 0.0012900183210149407,
    "encoder_gradient_l2_distance": -0.02510172687470913,
    "encoder_gradient_dot_product": 0.002183905802667141,
    "input_gradient_cosine_similarity": 0.0009999233298003674,
    "input_gradient_l2_distance": -0.02733195386826992,
    "input_gradient_dot_product": -0.006324085406959057
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.0034218684304505587,
    "right_subspace_overlap_bottom_k": 0.006579133681952953,
    "interaction_matrix_overlap_top_k": 0.0021946250926703215,
    "interaction_matrix_overlap_bottom_k": 0.004869608208537102,
    "effective_rank": 0.0010929524432867765,
    "effective_rank_mergeability_score": 0.001044475706294179,
    "stable_rank": 0.0008320359629578888,
    "spectral_gap": 0.0007504062377847731,
    "singular_value_ratio": 0.0011729621328413486,
    "layerwise_effective_rank": 0.0011065690778195858,
    "layerwise_effective_rank_mergeability_score": 0.0010391226969659328,
    "task_vector_cosine_similarity": 0.0014355223393067718,
    "task_vector_l2_distance": 0.00920858234167099,
    "task_vector_dot_product": 0.0045274836011230946,
    "weight_space_angle": 0.0020014930050820112,
    "task_vector_magnitude_ratio": 0.0015213115839287639,
    "singular_value_overlap": 0.0055632456205785275,
    "subspace_overlap": 0.002767970087006688,
    "right_subspace_overlap": 0.004232888109982014,
    "activation_l2_distance": 0.0027159377932548523,
    "activation_cosine_similarity": 0.004904825706034899,
    "activation_magnitude_ratio": 0.0025467723608016968,
    "activation_dot_product": 0.0031967752147465944,
    "encoder_gradient_cosine_similarity": 0.0012969902018085122,
    "encoder_gradient_l2_distance": 0.01214951928704977,
    "encoder_gradient_dot_product": 0.002279068110510707,
    "input_gradient_cosine_similarity": 0.0017718096496537328,
    "input_gradient_l2_distance": 0.014155802316963673,
    "input_gradient_dot_product": 0.00524390721693635
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.85,
    "right_subspace_overlap_bottom_k": 0.8,
    "interaction_matrix_overlap_top_k": 0.5,
    "interaction_matrix_overlap_bottom_k": 1.0,
    "effective_rank": 0.4,
    "effective_rank_mergeability_score": 0.3,
    "stable_rank": 0.3,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.45,
    "layerwise_effective_rank": 0.35,
    "layerwise_effective_rank_mergeability_score": 0.35,
    "task_vector_cosine_similarity": 0.5,
    "task_vector_l2_distance": 1.0,
    "task_vector_dot_product": 0.7,
    "weight_space_angle": 0.6,
    "task_vector_magnitude_ratio": 0.9,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.65,
    "right_subspace_overlap": 0.85,
    "activation_l2_distance": 0.6,
    "activation_cosine_similarity": 0.85,
    "activation_magnitude_ratio": 0.8,
    "activation_dot_product": 0.85,
    "encoder_gradient_cosine_similarity": 0.6,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.75,
    "input_gradient_cosine_similarity": 0.7,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.95
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6143479166889876,
      "val_r": 0.5609875755689814,
      "n_iterations": 336,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006001337431371212,
        "right_subspace_overlap_bottom_k": 0.0072823623195290565,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.022553149610757828,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0023202747106552124,
        "layerwise_effective_rank_mergeability_score": -0.0020837695337831974,
        "task_vector_cosine_similarity": 0.001982383895665407,
        "task_vector_l2_distance": -0.023881344124674797,
        "task_vector_dot_product": -0.012634214013814926,
        "weight_space_angle": 0.003819542471319437,
        "task_vector_magnitude_ratio": -0.00440277298912406,
        "singular_value_overlap": -0.021546699106693268,
        "subspace_overlap": 0.01163461059331894,
        "right_subspace_overlap": 0.004143170081079006,
        "activation_l2_distance": -0.006451122462749481,
        "activation_cosine_similarity": 0.00997223425656557,
        "activation_magnitude_ratio": -0.005476315971463919,
        "activation_dot_product": -0.004295612685382366,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.03037828765809536,
        "encoder_gradient_dot_product": 0.0011567807523533702,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.033497363328933716,
        "input_gradient_dot_product": -0.0050719729624688625
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5955083594996604,
      "val_r": 0.565573173963452,
      "n_iterations": 270,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0014050654135644436,
        "right_subspace_overlap_bottom_k": -0.004320988897234201,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.014441588893532753,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010848102159798145,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004135867115110159,
        "singular_value_overlap": -0.00669501069933176,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0012636409373953938,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0022548383567482233,
        "activation_dot_product": 0.0015863118460401893,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.013368752785027027,
        "encoder_gradient_dot_product": 0.002134204376488924,
        "input_gradient_cosine_similarity": 0.002462063916027546,
        "input_gradient_l2_distance": -0.012623089365661144,
        "input_gradient_dot_product": -0.0032611945644021034
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.600046781731082,
      "val_r": 0.5381598358829975,
      "n_iterations": 202,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005286942236125469,
        "right_subspace_overlap_bottom_k": 0.003271027933806181,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.017260633409023285,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.00160709407646209,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0017604754539206624,
        "task_vector_l2_distance": -0.02065267786383629,
        "task_vector_dot_product": 0.0023478176444768906,
        "weight_space_angle": 0.001553368871100247,
        "task_vector_magnitude_ratio": -0.0033980871085077524,
        "singular_value_overlap": -0.01295840460807085,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0015739991795271635,
        "activation_cosine_similarity": 0.00249261362478137,
        "activation_magnitude_ratio": -0.0031469373498111963,
        "activation_dot_product": 0.0031513208523392677,
        "encoder_gradient_cosine_similarity": 0.002762575400993228,
        "encoder_gradient_l2_distance": -0.02005116268992424,
        "encoder_gradient_dot_product": 0.0021761844400316477,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.019813772290945053,
        "input_gradient_dot_product": -0.0032289838418364525
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5643528886412661,
      "val_r": 0.43299689538171304,
      "n_iterations": 224,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006751570850610733,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.004994284361600876,
        "interaction_matrix_overlap_bottom_k": 0.01674238033592701,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0018838879186660051,
        "spectral_gap": 0.001684723305515945,
        "singular_value_ratio": -0.0010123836109414697,
        "layerwise_effective_rank": -0.0019786532502621412,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0013127194251865149,
        "task_vector_l2_distance": -0.013158908113837242,
        "task_vector_dot_product": -0.005201490595936775,
        "weight_space_angle": -0.0010413186391815543,
        "task_vector_magnitude_ratio": -0.003590442705899477,
        "singular_value_overlap": -0.019456403329968452,
        "subspace_overlap": 0.004292978905141354,
        "right_subspace_overlap": 0.011696082539856434,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.008719360455870628,
        "activation_magnitude_ratio": -0.009087461046874523,
        "activation_dot_product": 0.005087993107736111,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.029946917667984962,
        "encoder_gradient_dot_product": 0.004221505485475063,
        "input_gradient_cosine_similarity": 0.004258722998201847,
        "input_gradient_l2_distance": -0.0376499742269516,
        "input_gradient_dot_product": -0.020137852057814598
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5255219130626367,
      "val_r": 0.4688773700385776,
      "n_iterations": 341,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002079365309327841,
        "right_subspace_overlap_bottom_k": -0.005364381242543459,
        "interaction_matrix_overlap_top_k": -0.0012517963768914342,
        "interaction_matrix_overlap_bottom_k": 0.017321588471531868,
        "effective_rank": -0.0013437094166874886,
        "effective_rank_mergeability_score": 0.0010686407331377268,
        "stable_rank": 0.0,
        "spectral_gap": 0.0012119067832827568,
        "singular_value_ratio": -0.0014838362112641335,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0013215196086093783,
        "task_vector_cosine_similarity": 0.0010243345750495791,
        "task_vector_l2_distance": -0.012014921754598618,
        "task_vector_dot_product": -0.0028301835991442204,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0033566360361874104,
        "singular_value_overlap": -0.007190175354480743,
        "subspace_overlap": -0.0017294615972787142,
        "right_subspace_overlap": 0.0015610397094860673,
        "activation_l2_distance": -0.0015982537297531962,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0010917941108345985,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0012938189320266247,
        "encoder_gradient_l2_distance": -0.008681881241500378,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.001255725510418415,
        "input_gradient_l2_distance": -0.010952974669635296,
        "input_gradient_dot_product": -0.002619992708787322
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6080196256463744,
      "val_r": 0.6696168792433892,
      "n_iterations": 451,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.002646534238010645,
        "interaction_matrix_overlap_top_k": -0.0012061818270012736,
        "interaction_matrix_overlap_bottom_k": 0.018814561888575554,
        "effective_rank": -0.0017118076793849468,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.014849032275378704,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.005085091572254896,
        "singular_value_overlap": -0.010280579328536987,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0011512292549014091,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002457163529470563,
        "activation_dot_product": 0.0030722194351255894,
        "encoder_gradient_cosine_similarity": 0.0011984339216724038,
        "encoder_gradient_l2_distance": -0.016294613480567932,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.001088212593458593,
        "input_gradient_l2_distance": -0.00872272253036499,
        "input_gradient_dot_product": -0.0026217729318886995
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5872450340183619,
      "val_r": 0.03113228533760047,
      "n_iterations": 238,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0027311667799949646,
        "right_subspace_overlap_bottom_k": 0.014757857657968998,
        "interaction_matrix_overlap_top_k": -0.0020412292797118425,
        "interaction_matrix_overlap_bottom_k": 0.01672905869781971,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.002718151779845357,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.002061616163700819,
        "task_vector_l2_distance": -0.028109848499298096,
        "task_vector_dot_product": -0.00859706848859787,
        "weight_space_angle": 0.002298615174368024,
        "task_vector_magnitude_ratio": -0.004029236733913422,
        "singular_value_overlap": -0.020579423755407333,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.004239249974489212,
        "activation_l2_distance": -0.00880699884146452,
        "activation_cosine_similarity": 0.00520547479391098,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.0011602581944316626,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.048338718712329865,
        "encoder_gradient_dot_product": 0.00797776784747839,
        "input_gradient_cosine_similarity": -0.003305700607597828,
        "input_gradient_l2_distance": -0.04828806594014168,
        "input_gradient_dot_product": -0.00886137131601572
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5297283543925406,
      "val_r": 0.17191839112426313,
      "n_iterations": 285,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00391112407669425,
        "right_subspace_overlap_bottom_k": -0.001082785427570343,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.019858554005622864,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0016380607848986983,
        "spectral_gap": 0.001387589843943715,
        "singular_value_ratio": -0.0015183226205408573,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0011900601675733924,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.021600717678666115,
        "task_vector_dot_product": -0.0066514769569039345,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.005012219306081533,
        "singular_value_overlap": -0.01680549420416355,
        "subspace_overlap": 0.0012697562342509627,
        "right_subspace_overlap": 0.0066964938305318356,
        "activation_l2_distance": 0.0015065206680446863,
        "activation_cosine_similarity": 0.006225673481822014,
        "activation_magnitude_ratio": -0.005812576971948147,
        "activation_dot_product": -0.0019264915026724339,
        "encoder_gradient_cosine_similarity": 0.003800485050305724,
        "encoder_gradient_l2_distance": -0.02047933079302311,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0012178975157439709,
        "input_gradient_l2_distance": -0.01667434349656105,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6040893379232214,
      "val_r": 0.32960758693120196,
      "n_iterations": 335,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002040610183030367,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.016801344230771065,
        "effective_rank": -0.0033226462546736,
        "effective_rank_mergeability_score": 0.002692684531211853,
        "stable_rank": -0.002117505995556712,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01609487272799015,
        "task_vector_dot_product": 0.0010292488150298595,
        "weight_space_angle": 0.0013337660348042846,
        "task_vector_magnitude_ratio": -0.001242933445610106,
        "singular_value_overlap": -0.011750640347599983,
        "subspace_overlap": 0.0011252242838963866,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0032730726525187492,
        "activation_magnitude_ratio": -0.0035790614783763885,
        "activation_dot_product": 0.0017591926734894514,
        "encoder_gradient_cosine_similarity": 0.0017365238163620234,
        "encoder_gradient_l2_distance": -0.014900073409080505,
        "encoder_gradient_dot_product": 0.0017573091899976134,
        "input_gradient_cosine_similarity": 0.0012329955352470279,
        "input_gradient_l2_distance": -0.024914072826504707,
        "input_gradient_dot_product": -0.006694899871945381
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5961953881601751,
      "val_r": 0.31480248275270645,
      "n_iterations": 254,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004702517297118902,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.017940649762749672,
        "effective_rank": -0.001282256911508739,
        "effective_rank_mergeability_score": 0.0012809657491743565,
        "stable_rank": -0.0016262829303741455,
        "spectral_gap": 0.0010434488067403436,
        "singular_value_ratio": -0.001195718883536756,
        "layerwise_effective_rank": -0.0015139831230044365,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.001354625215753913,
        "task_vector_l2_distance": -0.024351587519049644,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0022061909548938274,
        "task_vector_magnitude_ratio": -0.001734578050673008,
        "singular_value_overlap": -0.015863962471485138,
        "subspace_overlap": 0.002135483082383871,
        "right_subspace_overlap": 0.0018465875182300806,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.004040937405079603,
        "activation_magnitude_ratio": -0.0033056950196623802,
        "activation_dot_product": 0.0010666290763765574,
        "encoder_gradient_cosine_similarity": 0.001432984136044979,
        "encoder_gradient_l2_distance": -0.02136397361755371,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.026178620755672455,
        "input_gradient_dot_product": -0.004274875856935978
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5461344038035788,
      "val_r": 0.2709568529107788,
      "n_iterations": 377,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0037055877037346363,
        "right_subspace_overlap_bottom_k": 0.0035785783547908068,
        "interaction_matrix_overlap_top_k": 0.002625243505463004,
        "interaction_matrix_overlap_bottom_k": 0.013638935983181,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012667701812461019,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0017742516938596964,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0021819504909217358,
        "task_vector_l2_distance": -0.014322448521852493,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001265105907805264,
        "singular_value_overlap": -0.009690160863101482,
        "subspace_overlap": 0.001956482417881489,
        "right_subspace_overlap": 0.003698175773024559,
        "activation_l2_distance": -0.004040465224534273,
        "activation_cosine_similarity": 0.004556019324809313,
        "activation_magnitude_ratio": -0.0028170605655759573,
        "activation_dot_product": 0.002691203262656927,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.01794685795903206,
        "encoder_gradient_dot_product": 0.004246450029313564,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01706293225288391,
        "input_gradient_dot_product": -0.001773824100382626
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5795264454152953,
      "val_r": 0.4680056188894389,
      "n_iterations": 178,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0035965186543762684,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.016495058313012123,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.002055831253528595,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.001112542231567204,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.022003673017024994,
        "task_vector_dot_product": 0.002876266371458769,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0034896060824394226,
        "singular_value_overlap": -0.014306040480732918,
        "subspace_overlap": 0.0028346404433250427,
        "right_subspace_overlap": 0.0017673526890575886,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0019129316788166761,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0036291200667619705,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.02361343242228031,
        "encoder_gradient_dot_product": 0.0010216457303613424,
        "input_gradient_cosine_similarity": 0.0015405694721266627,
        "input_gradient_l2_distance": -0.023950790986418724,
        "input_gradient_dot_product": -0.009077141992747784
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5418108524642083,
      "val_r": 0.5238460829200023,
      "n_iterations": 237,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0036026393063366413,
        "right_subspace_overlap_bottom_k": -0.0019635299686342478,
        "interaction_matrix_overlap_top_k": 0.002461619907990098,
        "interaction_matrix_overlap_bottom_k": 0.01766391657292843,
        "effective_rank": 0.0016480219783261418,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.003206238616257906,
        "task_vector_l2_distance": -0.01020384393632412,
        "task_vector_dot_product": 0.0011630418011918664,
        "weight_space_angle": -0.005498719867318869,
        "task_vector_magnitude_ratio": -0.0025332451332360506,
        "singular_value_overlap": -0.011788487434387207,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.003939618356525898,
        "activation_l2_distance": -0.0011079998221248388,
        "activation_cosine_similarity": 0.003757753875106573,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0016844046767801046,
        "encoder_gradient_cosine_similarity": 0.003600247437134385,
        "encoder_gradient_l2_distance": -0.017178140580654144,
        "encoder_gradient_dot_product": 0.0046065328642725945,
        "input_gradient_cosine_similarity": 0.0025211432948708534,
        "input_gradient_l2_distance": -0.02259150519967079,
        "input_gradient_dot_product": -0.011916015297174454
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5566578066090138,
      "val_r": 0.653765625492652,
      "n_iterations": 409,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010913925245404243,
        "right_subspace_overlap_bottom_k": -0.0010923980735242367,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.013522780500352383,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01428250502794981,
        "task_vector_dot_product": -0.0026794308796525,
        "weight_space_angle": 0.0010903485817834735,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.013837171718478203,
        "subspace_overlap": 0.004963553510606289,
        "right_subspace_overlap": 0.004799004644155502,
        "activation_l2_distance": -0.0028786342591047287,
        "activation_cosine_similarity": 0.004038674291223288,
        "activation_magnitude_ratio": -0.001328629208728671,
        "activation_dot_product": 0.004570980556309223,
        "encoder_gradient_cosine_similarity": 0.0016839106101542711,
        "encoder_gradient_l2_distance": -0.027324683964252472,
        "encoder_gradient_dot_product": 0.0019627725705504417,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0300824586302042,
        "input_gradient_dot_product": -0.013487393036484718
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4737746351840928,
      "val_r": 0.5346348592393161,
      "n_iterations": 258,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0029197006952017546,
        "right_subspace_overlap_bottom_k": -0.008092103525996208,
        "interaction_matrix_overlap_top_k": 0.0033009222242981195,
        "interaction_matrix_overlap_bottom_k": 0.013408706523478031,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0012190408306196332,
        "singular_value_ratio": 0.00131707894615829,
        "layerwise_effective_rank": 0.0018680939683690667,
        "layerwise_effective_rank_mergeability_score": -0.002280952874571085,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.008452759124338627,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0014849158469587564,
        "task_vector_magnitude_ratio": -0.0020250107627362013,
        "singular_value_overlap": -0.0095598129555583,
        "subspace_overlap": 0.0033988915383815765,
        "right_subspace_overlap": 0.004029364325106144,
        "activation_l2_distance": -0.0015763535629957914,
        "activation_cosine_similarity": 0.0018949196673929691,
        "activation_magnitude_ratio": -0.003388145938515663,
        "activation_dot_product": 0.003330143168568611,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.016652334481477737,
        "encoder_gradient_dot_product": 0.0021369201131165028,
        "input_gradient_cosine_similarity": 0.002102028112858534,
        "input_gradient_l2_distance": -0.018322225660085678,
        "input_gradient_dot_product": -0.006516754627227783
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6053682792641365,
      "val_r": 0.29852158361405345,
      "n_iterations": 228,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00563546409830451,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.011568245477974415,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0014357115142047405,
        "layerwise_effective_rank_mergeability_score": -0.001599665149115026,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.016251124441623688,
        "task_vector_dot_product": -0.0015062256716191769,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0030970843508839607,
        "singular_value_overlap": -0.003944288939237595,
        "subspace_overlap": 0.001127411494962871,
        "right_subspace_overlap": 0.006276421248912811,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.003395003965124488,
        "activation_magnitude_ratio": -0.0050366525538265705,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.00132596748881042,
        "encoder_gradient_l2_distance": -0.01752462610602379,
        "encoder_gradient_dot_product": 0.003833622904494405,
        "input_gradient_cosine_similarity": 0.001754753990098834,
        "input_gradient_l2_distance": -0.020063651725649834,
        "input_gradient_dot_product": -0.009425045922398567
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5690671195780511,
      "val_r": 0.4553732691093383,
      "n_iterations": 271,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011003748513758183,
        "right_subspace_overlap_bottom_k": 0.020254001021385193,
        "interaction_matrix_overlap_top_k": 0.0012292080791667104,
        "interaction_matrix_overlap_bottom_k": 0.01591314747929573,
        "effective_rank": 0.0010483741061761975,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0027081426233053207,
        "task_vector_l2_distance": -0.04501861333847046,
        "task_vector_dot_product": -0.0047156186774373055,
        "weight_space_angle": -0.0018827146850526333,
        "task_vector_magnitude_ratio": -0.0026847815606743097,
        "singular_value_overlap": -0.02383860945701599,
        "subspace_overlap": 0.0016690564807504416,
        "right_subspace_overlap": 0.01656733639538288,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.011573988012969494,
        "activation_magnitude_ratio": -0.002446881029754877,
        "activation_dot_product": 0.0015184355434030294,
        "encoder_gradient_cosine_similarity": 0.0036794834304600954,
        "encoder_gradient_l2_distance": -0.05178828537464142,
        "encoder_gradient_dot_product": 0.005936973262578249,
        "input_gradient_cosine_similarity": 0.004086918197572231,
        "input_gradient_l2_distance": -0.059805143624544144,
        "input_gradient_dot_product": 0.002756645670160651
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.581440839400873,
      "val_r": 0.39568610550459604,
      "n_iterations": 224,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007480908185243607,
        "right_subspace_overlap_bottom_k": 0.009608354419469833,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.021779458969831467,
        "effective_rank": -0.0021999054588377476,
        "effective_rank_mergeability_score": 0.0021880045533180237,
        "stable_rank": -0.002138625830411911,
        "spectral_gap": 0.0016361776506528258,
        "singular_value_ratio": -0.003436567261815071,
        "layerwise_effective_rank": -0.002089252695441246,
        "layerwise_effective_rank_mergeability_score": 0.0022564774844795465,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.03326628729701042,
        "task_vector_dot_product": -0.011697567999362946,
        "weight_space_angle": 0.0017340548802167177,
        "task_vector_magnitude_ratio": -0.004396360367536545,
        "singular_value_overlap": -0.009520945139229298,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.00475994311273098,
        "activation_l2_distance": -0.00463142991065979,
        "activation_cosine_similarity": 0.007860549725592136,
        "activation_magnitude_ratio": 0.002807473298162222,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0013437001034617424,
        "encoder_gradient_l2_distance": -0.045131929218769073,
        "encoder_gradient_dot_product": -0.0013731473591178656,
        "input_gradient_cosine_similarity": -0.0022225226275622845,
        "input_gradient_l2_distance": -0.06016825884580612,
        "input_gradient_dot_product": -0.012743180617690086
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7751925077810964,
      "val_r": 0.6234852625164171,
      "n_iterations": 252,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0018683098023757339,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0037365099415183067,
        "interaction_matrix_overlap_bottom_k": -0.001983589492738247,
        "effective_rank": -0.0011150416685268283,
        "effective_rank_mergeability_score": 0.0034608340356498957,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0017508193850517273,
        "task_vector_l2_distance": -0.004360782448202372,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0031574112363159657,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0027926466427743435,
        "subspace_overlap": 0.0013714900705963373,
        "right_subspace_overlap": 0.005833922419697046,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.017906030640006065,
        "activation_magnitude_ratio": -0.0019042917992919683,
        "activation_dot_product": 0.0034833436366170645,
        "encoder_gradient_cosine_similarity": 0.0019422362092882395,
        "encoder_gradient_l2_distance": -0.04255228489637375,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.02865055575966835,
        "input_gradient_dot_product": -0.005012887064367533
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6557692942777847,
      "val_r": 0.4334622824903392,
      "n_iterations": 277,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.002382962964475155,
        "right_subspace_overlap_bottom_k": 0.003900937968865037,
        "interaction_matrix_overlap_top_k": -0.00533830001950264,
        "interaction_matrix_overlap_bottom_k": 0.015718279406428337,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0015651208814233541,
        "singular_value_ratio": -0.002445243764668703,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.02465463988482952,
        "task_vector_dot_product": 0.003845734754577279,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.004945079330354929,
        "singular_value_overlap": -0.013354637660086155,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.003274380462244153,
        "activation_l2_distance": 0.0023993155919015408,
        "activation_cosine_similarity": -0.0013747317716479301,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.01201368123292923,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.018518254160881042,
        "encoder_gradient_dot_product": 0.001882591051980853,
        "input_gradient_cosine_similarity": 0.002005660906434059,
        "input_gradient_l2_distance": -0.026626506820321083,
        "input_gradient_dot_product": -0.0025132112205028534
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}