{
  "aggregate_metrics": {
    "train_r": 0.47193871532745885,
    "train_p": 1.9854288769797865e-178,
    "val_r": 0.4105078773143099,
    "val_p": 5.504553976319951e-16
  },
  "per_fold_stats": {
    "train_r_mean": 0.76364070611366,
    "train_r_std": 0.026339148561237972,
    "val_r_mean": 0.6524865616112956,
    "val_r_std": 0.15920835421146798,
    "n_nonzero_mean": 19.5,
    "n_nonzero_std": 2.692582403567252
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.01039185468107462,
    "right_subspace_overlap_bottom_k": -0.023234279826283455,
    "interaction_matrix_overlap_top_k": 0.0010229663457721472,
    "interaction_matrix_overlap_bottom_k": 0.0005268526147119701,
    "effective_rank": -6.643246888415888e-05,
    "effective_rank_mergeability_score": -9.291296009905636e-05,
    "stable_rank": -0.0003020542790181935,
    "spectral_gap": -0.00019181423704139888,
    "singular_value_ratio": 0.00019192098989151418,
    "layerwise_effective_rank": -0.0009774146601557732,
    "layerwise_effective_rank_mergeability_score": 0.000781026144977659,
    "task_vector_cosine_similarity": -0.0008694689022377133,
    "task_vector_l2_distance": -0.002294618869200349,
    "task_vector_dot_product": -0.0009608825785107911,
    "weight_space_angle": 0.001601977040991187,
    "task_vector_magnitude_ratio": -4.4909487769473344e-05,
    "singular_value_overlap": 0.008445673622190952,
    "subspace_overlap": -0.0014024314004927874,
    "right_subspace_overlap": 0.011210983619093895,
    "activation_l2_distance": -0.0016580860828980803,
    "activation_cosine_similarity": 0.015191597864031792,
    "activation_magnitude_ratio": -0.0020339174661785364,
    "activation_dot_product": 0.007064687553793192,
    "encoder_gradient_cosine_similarity": 0.002147587016224861,
    "encoder_gradient_l2_distance": -0.03285149484872818,
    "encoder_gradient_dot_product": 0.0003085916396230459,
    "input_gradient_cosine_similarity": 0.0014924760907888412,
    "input_gradient_l2_distance": -0.020349230617284775,
    "input_gradient_dot_product": -0.0030782923568040133
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.00525326281785965,
    "right_subspace_overlap_bottom_k": 0.006289131008088589,
    "interaction_matrix_overlap_top_k": 0.0028389038052409887,
    "interaction_matrix_overlap_bottom_k": 0.0034924007486552,
    "effective_rank": 0.0008330994169227779,
    "effective_rank_mergeability_score": 0.0007454389124177396,
    "stable_rank": 0.00087262800661847,
    "spectral_gap": 0.0007419059984385967,
    "singular_value_ratio": 0.000810161407571286,
    "layerwise_effective_rank": 0.0014038217486813664,
    "layerwise_effective_rank_mergeability_score": 0.0012354424688965082,
    "task_vector_cosine_similarity": 0.003715971251949668,
    "task_vector_l2_distance": 0.004872738383710384,
    "task_vector_dot_product": 0.0021193912252783775,
    "weight_space_angle": 0.0022354410029947758,
    "task_vector_magnitude_ratio": 0.0007130084559321404,
    "singular_value_overlap": 0.005613329820334911,
    "subspace_overlap": 0.001869942876510322,
    "right_subspace_overlap": 0.005387477111071348,
    "activation_l2_distance": 0.0039334590546786785,
    "activation_cosine_similarity": 0.005800665356218815,
    "activation_magnitude_ratio": 0.0018591417465358973,
    "activation_dot_product": 0.011777758598327637,
    "encoder_gradient_cosine_similarity": 0.0012069897493347526,
    "encoder_gradient_l2_distance": 0.017338348552584648,
    "encoder_gradient_dot_product": 0.001695265294983983,
    "input_gradient_cosine_similarity": 0.0019309911876916885,
    "input_gradient_l2_distance": 0.01589168980717659,
    "input_gradient_dot_product": 0.002548891818150878
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 1.0,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.55,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 0.25,
    "effective_rank_mergeability_score": 0.25,
    "stable_rank": 0.25,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.35,
    "layerwise_effective_rank": 0.5,
    "layerwise_effective_rank_mergeability_score": 0.35,
    "task_vector_cosine_similarity": 0.6,
    "task_vector_l2_distance": 0.65,
    "task_vector_dot_product": 0.5,
    "weight_space_angle": 0.7,
    "task_vector_magnitude_ratio": 0.25,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.7,
    "right_subspace_overlap": 1.0,
    "activation_l2_distance": 0.75,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.7,
    "activation_dot_product": 0.9,
    "encoder_gradient_cosine_similarity": 0.85,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.65,
    "input_gradient_cosine_similarity": 0.55,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.9
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7605072750323043,
      "val_r": 0.5505701537713538,
      "n_iterations": 360,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011279534548521042,
        "right_subspace_overlap_bottom_k": -0.016956757754087448,
        "interaction_matrix_overlap_top_k": 0.002775129396468401,
        "interaction_matrix_overlap_bottom_k": 0.003477186895906925,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0010068779811263084,
        "task_vector_dot_product": -0.001079390523955226,
        "weight_space_angle": 0.0010632809717208147,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.00430840440094471,
        "subspace_overlap": 0.0012780365068465471,
        "right_subspace_overlap": 0.008646040223538876,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.01612822152674198,
        "activation_magnitude_ratio": -0.004243497271090746,
        "activation_dot_product": 0.0018759852973744273,
        "encoder_gradient_cosine_similarity": 0.0015677365008741617,
        "encoder_gradient_l2_distance": -0.025088081136345863,
        "encoder_gradient_dot_product": -0.0013096884358674288,
        "input_gradient_cosine_similarity": 0.0015351837500929832,
        "input_gradient_l2_distance": -0.016836825758218765,
        "input_gradient_dot_product": -0.005277296062558889
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7440066987745588,
      "val_r": 0.7746330397879727,
      "n_iterations": 394,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005723155569285154,
        "right_subspace_overlap_bottom_k": -0.019587988033890724,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.004545197822153568,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0012048811186105013,
        "singular_value_ratio": 0.0015569995157420635,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.00591505179181695,
        "subspace_overlap": -0.0017176385736092925,
        "right_subspace_overlap": 0.015010873787105083,
        "activation_l2_distance": 0.0013545204419642687,
        "activation_cosine_similarity": 0.012110763229429722,
        "activation_magnitude_ratio": -0.002098198514431715,
        "activation_dot_product": 0.0041094934567809105,
        "encoder_gradient_cosine_similarity": 0.0019204916898161173,
        "encoder_gradient_l2_distance": -0.018757550045847893,
        "encoder_gradient_dot_product": 0.001302910503000021,
        "input_gradient_cosine_similarity": 0.00106775329913944,
        "input_gradient_l2_distance": -0.01518365927040577,
        "input_gradient_dot_product": -0.002268670592457056
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7755225959542899,
      "val_r": 0.8392711213720558,
      "n_iterations": 391,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01290604006499052,
        "right_subspace_overlap_bottom_k": -0.01757785864174366,
        "interaction_matrix_overlap_top_k": -0.0022654018830507994,
        "interaction_matrix_overlap_bottom_k": 0.0015352494083344936,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003120811888948083,
        "layerwise_effective_rank_mergeability_score": 0.002063373802229762,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.001689832890406251,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.001809729845263064,
        "subspace_overlap": -0.0031204097904264927,
        "right_subspace_overlap": 0.007481016684323549,
        "activation_l2_distance": 0.0012074918486177921,
        "activation_cosine_similarity": 0.013488546945154667,
        "activation_magnitude_ratio": -0.0029473337344825268,
        "activation_dot_product": -0.0011872007744386792,
        "encoder_gradient_cosine_similarity": 0.001881023170426488,
        "encoder_gradient_l2_distance": -0.020930826663970947,
        "encoder_gradient_dot_product": -0.0019620435778051615,
        "input_gradient_cosine_similarity": 0.0034199801739305258,
        "input_gradient_l2_distance": -0.006312255747616291,
        "input_gradient_dot_product": -0.002530083991587162
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7647306673104068,
      "val_r": 0.7240061695166632,
      "n_iterations": 299,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004994068294763565,
        "right_subspace_overlap_bottom_k": -0.023908359929919243,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0011087254388257861,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0038672201335430145,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.003315966110676527,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.006081376690417528,
        "subspace_overlap": -0.0011889039305970073,
        "right_subspace_overlap": 0.017194343730807304,
        "activation_l2_distance": 0.003646780736744404,
        "activation_cosine_similarity": 0.020680950954556465,
        "activation_magnitude_ratio": -0.0015463994350284338,
        "activation_dot_product": -0.0039402786642313,
        "encoder_gradient_cosine_similarity": 0.0029657480772584677,
        "encoder_gradient_l2_distance": -0.025155767798423767,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.003544297767803073,
        "input_gradient_dot_product": -0.005507552530616522
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7656315364861824,
      "val_r": 0.7472895003256594,
      "n_iterations": 437,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014049637131392956,
        "right_subspace_overlap_bottom_k": -0.02564697153866291,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0027756551280617714,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.001435547135770321,
        "task_vector_magnitude_ratio": -0.0012113124830648303,
        "singular_value_overlap": 0.005397249944508076,
        "subspace_overlap": -0.0018222004873678088,
        "right_subspace_overlap": 0.009799395687878132,
        "activation_l2_distance": 0.0021184992510825396,
        "activation_cosine_similarity": 0.01923413760960102,
        "activation_magnitude_ratio": -0.0013707939069718122,
        "activation_dot_product": -0.0028390607330948114,
        "encoder_gradient_cosine_similarity": 0.0024015421513468027,
        "encoder_gradient_l2_distance": -0.027403265237808228,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0030479026027023792,
        "input_gradient_l2_distance": -0.004370464477688074,
        "input_gradient_dot_product": -0.0020416155457496643
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7299534724663884,
      "val_r": 0.7338795846776529,
      "n_iterations": 273,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014973548240959644,
        "right_subspace_overlap_bottom_k": -0.04074452444911003,
        "interaction_matrix_overlap_top_k": 0.005485143978148699,
        "interaction_matrix_overlap_bottom_k": -0.0014797199983149767,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0017497187945991755,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.010279703885316849,
        "task_vector_l2_distance": -0.007582205347716808,
        "task_vector_dot_product": -0.006276184692978859,
        "weight_space_angle": 0.00736887427046895,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.02170000784099102,
        "subspace_overlap": -0.0032580541446805,
        "right_subspace_overlap": 0.01202761847525835,
        "activation_l2_distance": -0.010857366025447845,
        "activation_cosine_similarity": 0.026225818321108818,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.04006562754511833,
        "encoder_gradient_cosine_similarity": 0.0033371662721037865,
        "encoder_gradient_l2_distance": -0.0872500091791153,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.05878182500600815,
        "input_gradient_dot_product": -0.0029991932678967714
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7486886849809424,
      "val_r": 0.6860847163556371,
      "n_iterations": 466,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.007677366025745869,
        "right_subspace_overlap_bottom_k": -0.02394814044237137,
        "interaction_matrix_overlap_top_k": 0.0030758632346987724,
        "interaction_matrix_overlap_bottom_k": 0.005710020661354065,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005900510586798191,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.00273787509649992,
        "activation_l2_distance": -0.0017843247624114156,
        "activation_cosine_similarity": 0.008397962898015976,
        "activation_magnitude_ratio": -0.0016290000639855862,
        "activation_dot_product": 0.006313705816864967,
        "encoder_gradient_cosine_similarity": 0.0011863907566294074,
        "encoder_gradient_l2_distance": -0.02025531977415085,
        "encoder_gradient_dot_product": 0.0019180051749572158,
        "input_gradient_cosine_similarity": 0.0039000262040644884,
        "input_gradient_l2_distance": -0.018874499946832657,
        "input_gradient_dot_product": -0.006004870869219303
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7683721621891719,
      "val_r": 0.3869198832301105,
      "n_iterations": 345,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.020918821915984154,
        "right_subspace_overlap_bottom_k": -0.02194349840283394,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0010184048442170024,
        "layerwise_effective_rank_mergeability_score": 0.0012724248226732016,
        "task_vector_cosine_similarity": -0.005791707895696163,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0045347390696406364,
        "weight_space_angle": 0.0027609155513346195,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0025309198535978794,
        "subspace_overlap": 0.0011412312742322683,
        "right_subspace_overlap": 0.008647488430142403,
        "activation_l2_distance": -0.006928625050932169,
        "activation_cosine_similarity": 0.01685091108083725,
        "activation_magnitude_ratio": -0.003886663820594549,
        "activation_dot_product": -0.0014185280306264758,
        "encoder_gradient_cosine_similarity": 0.004027705639600754,
        "encoder_gradient_l2_distance": -0.02669108472764492,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.011399266310036182,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7916270459486785,
      "val_r": 0.5606677271816939,
      "n_iterations": 286,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.008488948456943035,
        "right_subspace_overlap_bottom_k": -0.025246407836675644,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.002575280610471964,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.001120055909268558,
        "singular_value_ratio": 0.0010814610868692398,
        "layerwise_effective_rank": -0.002795466687530279,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0023053856566548347,
        "task_vector_l2_distance": 0.0015516034327447414,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.003200617851689458,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.006258614361286163,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.020490583032369614,
        "activation_l2_distance": 0.0029500515665858984,
        "activation_cosine_similarity": 0.01903063803911209,
        "activation_magnitude_ratio": -0.0019538269843906164,
        "activation_dot_product": -0.00407018419355154,
        "encoder_gradient_cosine_similarity": 0.0037245163694024086,
        "encoder_gradient_l2_distance": -0.024991579353809357,
        "encoder_gradient_dot_product": 0.004020919091999531,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.012454988434910774,
        "input_gradient_dot_product": -0.0016113759484142065
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7277840219375449,
      "val_r": 0.402159423879808,
      "n_iterations": 282,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010327713564038277,
        "right_subspace_overlap_bottom_k": -0.02147228829562664,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.004437221214175224,
        "effective_rank": -0.001165024470537901,
        "effective_rank_mergeability_score": 0.0010241720592603087,
        "stable_rank": -0.0018557531293481588,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0032533123157918453,
        "layerwise_effective_rank_mergeability_score": 0.0031466828659176826,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0031719491817057133,
        "task_vector_dot_product": -0.0017682032193988562,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005135305225849152,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.00977794174104929,
        "activation_l2_distance": -0.0012438071426004171,
        "activation_cosine_similarity": -0.0017164587043225765,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.0017593302763998508,
        "encoder_gradient_cosine_similarity": 0.003831550944596529,
        "encoder_gradient_l2_distance": -0.015016790479421616,
        "encoder_gradient_dot_product": -0.0015746428398415446,
        "input_gradient_cosine_similarity": 0.0036741946823894978,
        "input_gradient_l2_distance": -0.013926757499575615,
        "input_gradient_dot_product": -0.0017162543954327703
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7925714797826183,
      "val_r": 0.17632662333784133,
      "n_iterations": 198,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.016474906355142593,
        "right_subspace_overlap_bottom_k": -0.022344287484884262,
        "interaction_matrix_overlap_top_k": -0.00114294677041471,
        "interaction_matrix_overlap_bottom_k": -0.0016673888312652707,
        "effective_rank": -0.0019757940899580717,
        "effective_rank_mergeability_score": 0.0017073567723855376,
        "stable_rank": -0.0011342098005115986,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0013755521504208446,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.002504173666238785,
        "task_vector_l2_distance": -0.0024435720406472683,
        "task_vector_dot_product": -0.004616455174982548,
        "weight_space_angle": 0.00364964478649199,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.016335666179656982,
        "subspace_overlap": -0.004269873257726431,
        "right_subspace_overlap": 0.007169612683355808,
        "activation_l2_distance": -0.007307027466595173,
        "activation_cosine_similarity": 0.01952088624238968,
        "activation_magnitude_ratio": -0.003779035061597824,
        "activation_dot_product": 0.0117418197914958,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.04022065922617912,
        "encoder_gradient_dot_product": -0.0020927165169268847,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.015976902097463608,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7651211540789623,
      "val_r": 0.7349544037647776,
      "n_iterations": 232,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009406491182744503,
        "right_subspace_overlap_bottom_k": -0.019022492691874504,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0016355746192857623,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0013455834705382586,
        "singular_value_ratio": -0.0013342146994546056,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.003125191433355212,
        "task_vector_l2_distance": 0.0018896044930443168,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0029780957847833633,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.002907977905124426,
        "subspace_overlap": -0.003228006884455681,
        "right_subspace_overlap": 0.011431070044636726,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.010472480207681656,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0028725024312734604,
        "encoder_gradient_cosine_similarity": 0.002216352615505457,
        "encoder_gradient_l2_distance": -0.020108316093683243,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.0019841715693473816,
        "input_gradient_l2_distance": -0.0046949852257966995,
        "input_gradient_dot_product": -0.001459138235077262
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7359434448055462,
      "val_r": 0.7137428510828359,
      "n_iterations": 409,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.013682922348380089,
        "right_subspace_overlap_bottom_k": -0.03012780286371708,
        "interaction_matrix_overlap_top_k": 0.0018480441067367792,
        "interaction_matrix_overlap_bottom_k": -0.006973499432206154,
        "effective_rank": 0.0016161950770765543,
        "effective_rank_mergeability_score": -0.001972475554794073,
        "stable_rank": 0.001250073197297752,
        "spectral_gap": -0.0015385511796921492,
        "singular_value_ratio": 0.0019444352947175503,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.00871219765394926,
        "task_vector_l2_distance": -0.001186045934446156,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.016496190801262856,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.010623179376125336,
        "activation_l2_distance": -0.0027231902349740267,
        "activation_cosine_similarity": 0.016176259145140648,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.022464606910943985,
        "encoder_gradient_cosine_similarity": 0.0024915789254009724,
        "encoder_gradient_l2_distance": -0.04979262873530388,
        "encoder_gradient_dot_product": -0.0010443704668432474,
        "input_gradient_cosine_similarity": 0.004663615021854639,
        "input_gradient_l2_distance": -0.03470746427774429,
        "input_gradient_dot_product": -0.0032492876052856445
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7728701274275775,
      "val_r": 0.7454163692123964,
      "n_iterations": 259,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005594575311988592,
        "right_subspace_overlap_bottom_k": -0.01489097997546196,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.001642466988414526,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0013653134228661656,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0050249407067894936,
        "task_vector_l2_distance": 0.003217422403395176,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.004388502333313227,
        "subspace_overlap": -0.0017839110223576427,
        "right_subspace_overlap": 0.013215694576501846,
        "activation_l2_distance": 0.003046841360628605,
        "activation_cosine_similarity": 0.013804864138364792,
        "activation_magnitude_ratio": -0.0010642834240570664,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0015434627421200275,
        "encoder_gradient_l2_distance": -0.01740739867091179,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.006026380229741335,
        "input_gradient_dot_product": -0.003746457863599062
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7427707954175713,
      "val_r": 0.7519253866781546,
      "n_iterations": 241,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010393500328063965,
        "right_subspace_overlap_bottom_k": -0.02685997448861599,
        "interaction_matrix_overlap_top_k": 0.006351139862090349,
        "interaction_matrix_overlap_bottom_k": -0.002924423897638917,
        "effective_rank": 0.0018411200726404786,
        "effective_rank_mergeability_score": -0.0012519990559667349,
        "stable_rank": 0.0,
        "spectral_gap": -0.0013890379341319203,
        "singular_value_ratio": 0.0010564371477812529,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0022435064893215895,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010026635136455297,
        "task_vector_magnitude_ratio": 0.001395947067067027,
        "singular_value_overlap": 0.010595962405204773,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.018772851675748825,
        "activation_l2_distance": -0.0059678805992007256,
        "activation_cosine_similarity": 0.017151013016700745,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.005371175706386566,
        "encoder_gradient_cosine_similarity": 0.002383455168455839,
        "encoder_gradient_l2_distance": -0.03810879960656166,
        "encoder_gradient_dot_product": 0.001435756916180253,
        "input_gradient_cosine_similarity": 0.004854185972362757,
        "input_gradient_l2_distance": -0.026896633207798004,
        "input_gradient_dot_product": -0.003939148969948292
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7956247397726592,
      "val_r": 0.7446621147708151,
      "n_iterations": 227,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.012487822212278843,
        "right_subspace_overlap_bottom_k": -0.027465885505080223,
        "interaction_matrix_overlap_top_k": 0.001480477163568139,
        "interaction_matrix_overlap_bottom_k": 0.001503401785157621,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0028159539215266705,
        "task_vector_l2_distance": -0.008648897521197796,
        "task_vector_dot_product": 0.0016758847050368786,
        "weight_space_angle": 0.0010538893984630704,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.012045689858496189,
        "subspace_overlap": -0.0048063769936561584,
        "right_subspace_overlap": 0.017619961872696877,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.02233990654349327,
        "activation_magnitude_ratio": -0.005951200611889362,
        "activation_dot_product": -0.001565081300213933,
        "encoder_gradient_cosine_similarity": 0.002529281424358487,
        "encoder_gradient_l2_distance": -0.05339976027607918,
        "encoder_gradient_dot_product": 0.0014937825035303831,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.016979947686195374,
        "input_gradient_dot_product": -0.009070808067917824
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7740638658055193,
      "val_r": 0.7857705247792569,
      "n_iterations": 316,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002798784291371703,
        "right_subspace_overlap_bottom_k": -0.01705768331885338,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.003015739843249321,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0013786975760012865,
        "layerwise_effective_rank_mergeability_score": 0.001139903673902154,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0018089249497279525,
        "weight_space_angle": 0.0016415781574323773,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.004015233367681503,
        "subspace_overlap": -0.0033668610267341137,
        "right_subspace_overlap": 0.014815614558756351,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.01149412989616394,
        "activation_magnitude_ratio": -0.0021870480850338936,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.003474715631455183,
        "encoder_gradient_l2_distance": -0.013635251671075821,
        "encoder_gradient_dot_product": -0.0017685218481346965,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.008968002162873745,
        "input_gradient_dot_product": -0.002765445038676262
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7457279379953815,
      "val_r": 0.6523384392021477,
      "n_iterations": 271,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.015205107629299164,
        "right_subspace_overlap_bottom_k": -0.02714559994637966,
        "interaction_matrix_overlap_top_k": 0.005057595204561949,
        "interaction_matrix_overlap_bottom_k": -0.001162748783826828,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012813315261155367,
        "spectral_gap": -0.0011747176758944988,
        "singular_value_ratio": 0.0010865326039493084,
        "layerwise_effective_rank": -0.0019385417690500617,
        "layerwise_effective_rank_mergeability_score": 0.0013222681591287255,
        "task_vector_cosine_similarity": 0.0026931308675557375,
        "task_vector_l2_distance": -0.006867572665214539,
        "task_vector_dot_product": 0.0030305555555969477,
        "weight_space_angle": -0.001204392989166081,
        "task_vector_magnitude_ratio": 0.0016970597207546234,
        "singular_value_overlap": 0.018111400306224823,
        "subspace_overlap": 0.0013067257823422551,
        "right_subspace_overlap": 0.009014850482344627,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0157439224421978,
        "activation_magnitude_ratio": -0.005899697542190552,
        "activation_dot_product": 0.02050957828760147,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.03963863477110863,
        "encoder_gradient_dot_product": 0.0024527637287974358,
        "input_gradient_cosine_similarity": 0.0022864225320518017,
        "input_gradient_l2_distance": -0.045430682599544525,
        "input_gradient_dot_product": -0.0041196937672793865
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7339981743717914,
      "val_r": 0.6518770823840464,
      "n_iterations": 343,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.013206004165112972,
        "right_subspace_overlap_bottom_k": -0.030229942873120308,
        "interaction_matrix_overlap_top_k": 0.004116016905754805,
        "interaction_matrix_overlap_bottom_k": -0.0011576219694688916,
        "effective_rank": -0.0016451459378004074,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.003019864670932293,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0015532312681898475,
        "layerwise_effective_rank": -0.003988835960626602,
        "layerwise_effective_rank_mergeability_score": 0.004237051587551832,
        "task_vector_cosine_similarity": -0.002323820721358061,
        "task_vector_l2_distance": -0.009179670363664627,
        "task_vector_dot_product": -0.0021503600291907787,
        "weight_space_angle": 0.00571716483682394,
        "task_vector_magnitude_ratio": -0.0015450587961822748,
        "singular_value_overlap": 0.011472200974822044,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.012726440094411373,
        "activation_l2_distance": -0.004513949155807495,
        "activation_cosine_similarity": 0.016688821837306023,
        "activation_magnitude_ratio": -0.0021213688887655735,
        "activation_dot_product": 0.01669168472290039,
        "encoder_gradient_cosine_similarity": 0.001469018287025392,
        "encoder_gradient_l2_distance": -0.045609042048454285,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.003384430892765522,
        "input_gradient_l2_distance": -0.03516083583235741,
        "input_gradient_dot_product": -0.0061300466768443584
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.837298241735103,
      "val_r": 0.6872361169150321,
      "n_iterations": 235,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.002751868451014161,
        "right_subspace_overlap_bottom_k": -0.01250816322863102,
        "interaction_matrix_overlap_top_k": -0.0063217333517968655,
        "interaction_matrix_overlap_bottom_k": -0.008059263229370117,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.001245375256985426,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0016800565645098686,
        "layerwise_effective_rank_mergeability_score": 0.0024388178717345,
        "task_vector_cosine_similarity": 0.0019877683371305466,
        "task_vector_l2_distance": -0.01633143611252308,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0019443046767264605,
        "task_vector_magnitude_ratio": -0.0012348252348601818,
        "singular_value_overlap": 0.007507462054491043,
        "subspace_overlap": -0.0032123855780810118,
        "right_subspace_overlap": -0.002982762409374118,
        "activation_l2_distance": -0.006159732583910227,
        "activation_cosine_similarity": 0.010008213110268116,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.02605723962187767,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0475691594183445,
        "encoder_gradient_dot_product": 0.0032996786758303642,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0504579022526741,
        "input_gradient_dot_product": 0.0028710952028632164
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}