{
  "aggregate_metrics": {
    "train_r": 0.4139693561553167,
    "train_p": 1.2316343061628566e-133,
    "val_r": 0.4144841581795257,
    "val_p": 2.698218315867555e-16
  },
  "per_fold_stats": {
    "train_r_mean": 0.71262920818384,
    "train_r_std": 0.051609657958610715,
    "val_r_mean": 0.595483812621085,
    "val_r_std": 0.18542750329522736,
    "n_nonzero_mean": 19.35,
    "n_nonzero_std": 4.162631379308045
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.00858012679964304,
    "right_subspace_overlap_bottom_k": -0.012563901953399181,
    "interaction_matrix_overlap_top_k": 0.002696602139621973,
    "interaction_matrix_overlap_bottom_k": 0.00020185155153740197,
    "effective_rank": 3.664487667265348e-05,
    "effective_rank_mergeability_score": 1.478957710787654e-05,
    "stable_rank": -0.00018095248378813267,
    "spectral_gap": -0.000471137638669461,
    "singular_value_ratio": 0.00027577500441111624,
    "layerwise_effective_rank": -0.0005265657091513276,
    "layerwise_effective_rank_mergeability_score": 0.0007482047658413649,
    "task_vector_cosine_similarity": 0.0004935021861456335,
    "task_vector_l2_distance": -0.00489855045452714,
    "task_vector_dot_product": 0.00019358753343112767,
    "weight_space_angle": -0.00048789745778776705,
    "task_vector_magnitude_ratio": 0.0003288144653197378,
    "singular_value_overlap": 0.0010773919057101011,
    "subspace_overlap": 0.0009013173985294998,
    "right_subspace_overlap": 0.009669145569205284,
    "activation_l2_distance": -0.0023624952882528305,
    "activation_cosine_similarity": 0.015026758424937725,
    "activation_magnitude_ratio": -0.0024465317837893963,
    "activation_dot_product": 0.005946378223598003,
    "encoder_gradient_cosine_similarity": 0.0031095880549401045,
    "encoder_gradient_l2_distance": -0.033981747925281525,
    "encoder_gradient_dot_product": 0.0008441272075287998,
    "input_gradient_cosine_similarity": 0.0011626684572547674,
    "input_gradient_l2_distance": -0.02484271302819252,
    "input_gradient_dot_product": -0.0052782222628593445
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.004710078705102205,
    "right_subspace_overlap_bottom_k": 0.006615567021071911,
    "interaction_matrix_overlap_top_k": 0.003841655794531107,
    "interaction_matrix_overlap_bottom_k": 0.001885278383269906,
    "effective_rank": 0.0005270194378681481,
    "effective_rank_mergeability_score": 0.0007184629794210196,
    "stable_rank": 0.0008367974078282714,
    "spectral_gap": 0.001043274300172925,
    "singular_value_ratio": 0.0010521847289055586,
    "layerwise_effective_rank": 0.0010860032634809613,
    "layerwise_effective_rank_mergeability_score": 0.0012306462740525603,
    "task_vector_cosine_similarity": 0.0036292385775595903,
    "task_vector_l2_distance": 0.005006685387343168,
    "task_vector_dot_product": 0.0028741878923028708,
    "weight_space_angle": 0.004280199762433767,
    "task_vector_magnitude_ratio": 0.0007648772443644702,
    "singular_value_overlap": 0.0025878509040921926,
    "subspace_overlap": 0.0032235325779765844,
    "right_subspace_overlap": 0.00465243449434638,
    "activation_l2_distance": 0.006227007135748863,
    "activation_cosine_similarity": 0.004757098853588104,
    "activation_magnitude_ratio": 0.002545519033446908,
    "activation_dot_product": 0.012129505164921284,
    "encoder_gradient_cosine_similarity": 0.002321737352758646,
    "encoder_gradient_l2_distance": 0.01684023253619671,
    "encoder_gradient_dot_product": 0.0025946851819753647,
    "input_gradient_cosine_similarity": 0.0015118563314899802,
    "input_gradient_l2_distance": 0.022423435002565384,
    "input_gradient_dot_product": 0.003320841584354639
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 1.0,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.7,
    "interaction_matrix_overlap_bottom_k": 0.6,
    "effective_rank": 0.15,
    "effective_rank_mergeability_score": 0.3,
    "stable_rank": 0.3,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.25,
    "layerwise_effective_rank": 0.5,
    "layerwise_effective_rank_mergeability_score": 0.45,
    "task_vector_cosine_similarity": 0.55,
    "task_vector_l2_distance": 0.75,
    "task_vector_dot_product": 0.65,
    "weight_space_angle": 0.5,
    "task_vector_magnitude_ratio": 0.3,
    "singular_value_overlap": 0.7,
    "subspace_overlap": 0.55,
    "right_subspace_overlap": 1.0,
    "activation_l2_distance": 0.85,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.8,
    "activation_dot_product": 0.65,
    "encoder_gradient_cosine_similarity": 1.0,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.8,
    "input_gradient_cosine_similarity": 0.75,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.9
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7465736634947071,
      "val_r": 0.6141580660679975,
      "n_iterations": 259,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004757261835038662,
        "right_subspace_overlap_bottom_k": -0.004554815124720335,
        "interaction_matrix_overlap_top_k": 0.002013747813180089,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.005029598716646433,
        "task_vector_dot_product": -0.0021364183630794287,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0012315702624619007,
        "singular_value_overlap": -0.001471254974603653,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0052145496010780334,
        "activation_l2_distance": 0.0018119974993169308,
        "activation_cosine_similarity": 0.017490744590759277,
        "activation_magnitude_ratio": -0.0031180281657725573,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.002332049421966076,
        "encoder_gradient_l2_distance": -0.03265007585287094,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.00237054331228137,
        "input_gradient_l2_distance": -0.008360089734196663,
        "input_gradient_dot_product": -0.008117591962218285
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.721693121202641,
      "val_r": 0.7971717822663296,
      "n_iterations": 279,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01254858635365963,
        "right_subspace_overlap_bottom_k": -0.016628947108983994,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0019401079043745995,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0017243518959730864,
        "spectral_gap": 0.0016037551686167717,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.001737657468765974,
        "task_vector_cosine_similarity": 0.0014840804506093264,
        "task_vector_l2_distance": -0.011820260435342789,
        "task_vector_dot_product": -0.0026118895038962364,
        "weight_space_angle": -0.0013674618676304817,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0012007259065285325,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.017603930085897446,
        "activation_l2_distance": -0.00937139242887497,
        "activation_cosine_similarity": 0.02025172859430313,
        "activation_magnitude_ratio": -0.002689594868570566,
        "activation_dot_product": 0.0012287237914279103,
        "encoder_gradient_cosine_similarity": 0.002711603883653879,
        "encoder_gradient_l2_distance": -0.051120657473802567,
        "encoder_gradient_dot_product": 0.0011759751942008734,
        "input_gradient_cosine_similarity": 0.001682164380326867,
        "input_gradient_l2_distance": -0.051050350069999695,
        "input_gradient_dot_product": -0.0029302197508513927
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.649006961343899,
      "val_r": 0.6114716677237888,
      "n_iterations": 305,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005502097774296999,
        "right_subspace_overlap_bottom_k": -0.00810432992875576,
        "interaction_matrix_overlap_top_k": 0.0011835845652967691,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.001171924639493227,
        "stable_rank": 0.0014155787648633122,
        "spectral_gap": -0.0014209793880581856,
        "singular_value_ratio": 0.0016537961782887578,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0019385823979973793,
        "subspace_overlap": -0.003010181710124016,
        "right_subspace_overlap": 0.009785669855773449,
        "activation_l2_distance": 0.005364277400076389,
        "activation_cosine_similarity": 0.01197126042097807,
        "activation_magnitude_ratio": -0.0026862905360758305,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0016738760750740767,
        "encoder_gradient_l2_distance": -0.01732007972896099,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0020953055936843157,
        "input_gradient_l2_distance": -0.006811793893575668,
        "input_gradient_dot_product": -0.0024355859495699406
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7399976509252302,
      "val_r": 0.6711635739586465,
      "n_iterations": 191,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0016396398423239589,
        "right_subspace_overlap_bottom_k": -0.010377462022006512,
        "interaction_matrix_overlap_top_k": 0.0019974419847130775,
        "interaction_matrix_overlap_bottom_k": 0.002164271892979741,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.002555245067924261,
        "task_vector_l2_distance": -0.0024325656704604626,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.012010814622044563,
        "activation_l2_distance": 0.0019184676930308342,
        "activation_cosine_similarity": 0.011676578782498837,
        "activation_magnitude_ratio": -0.002954744966700673,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.00347074493765831,
        "encoder_gradient_l2_distance": -0.01645175740122795,
        "encoder_gradient_dot_product": 0.0012794072972610593,
        "input_gradient_cosine_similarity": 0.0015253486344590783,
        "input_gradient_l2_distance": -0.012195615097880363,
        "input_gradient_dot_product": -0.004201535601168871
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7297176848576753,
      "val_r": 0.8053170210104545,
      "n_iterations": 244,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006371607072651386,
        "right_subspace_overlap_bottom_k": -0.009151935577392578,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.007907296530902386,
        "task_vector_dot_product": -0.0016062816139310598,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.007512927986681461,
        "activation_l2_distance": -0.0045299953781068325,
        "activation_cosine_similarity": 0.019635336473584175,
        "activation_magnitude_ratio": -0.007288071326911449,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.002771900501102209,
        "encoder_gradient_l2_distance": -0.045006535947322845,
        "encoder_gradient_dot_product": 0.0013511438155546784,
        "input_gradient_cosine_similarity": 0.0023659535218030214,
        "input_gradient_l2_distance": -0.028143260627985,
        "input_gradient_dot_product": -0.003174177836626768
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7403690112239814,
      "val_r": 0.6835814544565345,
      "n_iterations": 246,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0033870916813611984,
        "right_subspace_overlap_bottom_k": -0.004395840689539909,
        "interaction_matrix_overlap_top_k": 0.004238399676978588,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": -0.001651154481805861,
        "effective_rank_mergeability_score": 0.0016336794942617416,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.002586937742307782,
        "layerwise_effective_rank": -0.0012308716541156173,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0010972920572385192,
        "task_vector_l2_distance": -0.010436475276947021,
        "task_vector_dot_product": 0.001261943019926548,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.001252556685358286,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0033173987176269293,
        "activation_l2_distance": -0.00625475961714983,
        "activation_cosine_similarity": 0.023190177977085114,
        "activation_magnitude_ratio": -0.005916287191212177,
        "activation_dot_product": 0.0020409298595041037,
        "encoder_gradient_cosine_similarity": 0.00479262787848711,
        "encoder_gradient_l2_distance": -0.056392744183540344,
        "encoder_gradient_dot_product": -0.00127077242359519,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0012757759541273117,
        "input_gradient_dot_product": -0.0025742454454302788
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7334035710734469,
      "val_r": 0.43174553106619584,
      "n_iterations": 189,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.00519327400252223,
        "right_subspace_overlap_bottom_k": -0.01230807788670063,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0011137435212731361,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.001010395586490631,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0032243956811726093,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0013594881165772676,
        "right_subspace_overlap": 0.008992563001811504,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.014719528146088123,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0054337927140295506,
        "encoder_gradient_l2_distance": -0.024616746231913567,
        "encoder_gradient_dot_product": 0.006936129182577133,
        "input_gradient_cosine_similarity": -0.0010443413630127907,
        "input_gradient_l2_distance": -0.021321211010217667,
        "input_gradient_dot_product": -0.0030932780355215073
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6886325362281189,
      "val_r": 0.3614958986914594,
      "n_iterations": 435,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005700204521417618,
        "right_subspace_overlap_bottom_k": -0.011198272928595543,
        "interaction_matrix_overlap_top_k": -0.001613835571333766,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0011156853288412094,
        "layerwise_effective_rank_mergeability_score": 0.0012379125691950321,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.004158291034400463,
        "weight_space_angle": 0.002061766805127263,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0010123095707967877,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.006263066083192825,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.00948380958288908,
        "activation_magnitude_ratio": -0.002739682560786605,
        "activation_dot_product": -0.001038963906466961,
        "encoder_gradient_cosine_similarity": 0.00378204882144928,
        "encoder_gradient_l2_distance": -0.016869351267814636,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0019418663578107953,
        "input_gradient_l2_distance": -0.004722507204860449,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7558277662790652,
      "val_r": 0.5221119528714532,
      "n_iterations": 301,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010770456865429878,
        "right_subspace_overlap_bottom_k": -0.019477369263768196,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0013527318369597197,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002632678486406803,
        "layerwise_effective_rank_mergeability_score": 0.004150463733822107,
        "task_vector_cosine_similarity": -0.001829257933422923,
        "task_vector_l2_distance": -0.0022958810441195965,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0014358953339979053,
        "right_subspace_overlap": 0.009320396929979324,
        "activation_l2_distance": -0.01129004918038845,
        "activation_cosine_similarity": 0.01754843257367611,
        "activation_magnitude_ratio": -0.005655823275446892,
        "activation_dot_product": -0.0024859260302037,
        "encoder_gradient_cosine_similarity": 0.0014960987027734518,
        "encoder_gradient_l2_distance": -0.0384446419775486,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.03454756364226341,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7179296377948734,
      "val_r": 0.7935827155691875,
      "n_iterations": 270,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.013793205842375755,
        "right_subspace_overlap_bottom_k": -0.01506218034774065,
        "interaction_matrix_overlap_top_k": 0.005085535813122988,
        "interaction_matrix_overlap_bottom_k": 0.002679120283573866,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.001813225564546883,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0014348509721457958,
        "layerwise_effective_rank_mergeability_score": 0.001959211193025112,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.013902842067182064,
        "task_vector_dot_product": 0.0015851211501285434,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0014057322405278683,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.01165725663304329,
        "activation_l2_distance": -0.0016483785584568977,
        "activation_cosine_similarity": 0.0028296986129134893,
        "activation_magnitude_ratio": -0.004515659064054489,
        "activation_dot_product": -0.007086532656103373,
        "encoder_gradient_cosine_similarity": 0.0020082546398043633,
        "encoder_gradient_l2_distance": -0.05624326318502426,
        "encoder_gradient_dot_product": -0.002433165442198515,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0563192181289196,
        "input_gradient_dot_product": -0.008123164065182209
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7478055809545225,
      "val_r": 0.09587698741440052,
      "n_iterations": 332,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0012163660721853375,
        "right_subspace_overlap_bottom_k": -0.007892929017543793,
        "interaction_matrix_overlap_top_k": -0.001159133855253458,
        "interaction_matrix_overlap_bottom_k": -0.0011823063250631094,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.001146239461377263,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0013567920541390777,
        "task_vector_dot_product": 0.0018829198088496923,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0025483337230980396,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.002806657925248146,
        "activation_l2_distance": -0.0020051333121955395,
        "activation_cosine_similarity": 0.017408723011612892,
        "activation_magnitude_ratio": -0.0016602614196017385,
        "activation_dot_product": 0.0031590473372489214,
        "encoder_gradient_cosine_similarity": 0.0013532901648432016,
        "encoder_gradient_l2_distance": -0.030656132847070694,
        "encoder_gradient_dot_product": 0.0013022113125771284,
        "input_gradient_cosine_similarity": 0.0017991071799769998,
        "input_gradient_l2_distance": -0.003935717511922121,
        "input_gradient_dot_product": -0.00137567357160151
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7168033816949608,
      "val_r": 0.6930603769397594,
      "n_iterations": 333,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01225774921476841,
        "right_subspace_overlap_bottom_k": -0.012547682039439678,
        "interaction_matrix_overlap_top_k": 0.0042548100464046,
        "interaction_matrix_overlap_bottom_k": 0.002134614158421755,
        "effective_rank": 0.0012747423024848104,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0026131796184927225,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0019970284774899483,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.002069841604679823,
        "subspace_overlap": 0.001700859284028411,
        "right_subspace_overlap": 0.007802381180226803,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.009170527569949627,
        "activation_magnitude_ratio": -0.00438362080603838,
        "activation_dot_product": 0.007712895516306162,
        "encoder_gradient_cosine_similarity": 0.005881779827177525,
        "encoder_gradient_l2_distance": -0.013905304484069347,
        "encoder_gradient_dot_product": 0.0023539543617516756,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.015743862837553024,
        "input_gradient_dot_product": -0.006872732192277908
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7326766814063249,
      "val_r": 0.695811275478976,
      "n_iterations": 217,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006555825471878052,
        "right_subspace_overlap_bottom_k": -0.010426826775074005,
        "interaction_matrix_overlap_top_k": 0.0015369139146059752,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.001312200678512454,
        "task_vector_cosine_similarity": 0.003462825436145067,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0013697840040549636,
        "weight_space_angle": -0.001260238466784358,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0016850084066390991,
        "subspace_overlap": -0.0022498781327158213,
        "right_subspace_overlap": 0.003917216788977385,
        "activation_l2_distance": 0.008134807460010052,
        "activation_cosine_similarity": 0.01725567877292633,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0014878124929964542,
        "encoder_gradient_l2_distance": -0.022267106920480728,
        "encoder_gradient_dot_product": -0.002462238073348999,
        "input_gradient_cosine_similarity": 0.003981403075158596,
        "input_gradient_l2_distance": -0.005934727378189564,
        "input_gradient_dot_product": -0.004073622170835733
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7269878984825061,
      "val_r": 0.7804595183633558,
      "n_iterations": 294,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0025570495054125786,
        "right_subspace_overlap_bottom_k": -0.008141877129673958,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0018539782613515854,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0012688423739746213,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0015616851160302758,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.001628296566195786,
        "right_subspace_overlap": 0.011655004695057869,
        "activation_l2_distance": 0.0025043587666004896,
        "activation_cosine_similarity": 0.012062359601259232,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0024401687551289797,
        "encoder_gradient_l2_distance": -0.021824296563863754,
        "encoder_gradient_dot_product": 0.0010606375290080905,
        "input_gradient_cosine_similarity": 0.0020030387677252293,
        "input_gradient_l2_distance": -0.007617623079568148,
        "input_gradient_dot_product": -0.004650663584470749
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6957431983146035,
      "val_r": 0.7475471629316266,
      "n_iterations": 318,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.013462860137224197,
        "right_subspace_overlap_bottom_k": -0.03036523424088955,
        "interaction_matrix_overlap_top_k": 0.006345122586935759,
        "interaction_matrix_overlap_bottom_k": -0.005273522809147835,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.002691581379622221,
        "singular_value_ratio": 0.0026430829893797636,
        "layerwise_effective_rank": -0.0012094550766050816,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0027385232970118523,
        "task_vector_l2_distance": -0.007613364141434431,
        "task_vector_dot_product": 0.0014295184519141912,
        "weight_space_angle": 0.004769246093928814,
        "task_vector_magnitude_ratio": 0.0017678363947197795,
        "singular_value_overlap": 0.0015592641429975629,
        "subspace_overlap": 0.0035946574062108994,
        "right_subspace_overlap": 0.019312230870127678,
        "activation_l2_distance": -0.014148593880236149,
        "activation_cosine_similarity": 0.01314075943082571,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.035316042602062225,
        "encoder_gradient_cosine_similarity": -0.0019185980781912804,
        "encoder_gradient_l2_distance": -0.05456953123211861,
        "encoder_gradient_dot_product": -0.0015927599743008614,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.07119573652744293,
        "input_gradient_dot_product": -0.008942823857069016
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6211470562802448,
      "val_r": 0.25403468478323876,
      "n_iterations": 279,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.011999636888504028,
        "right_subspace_overlap_bottom_k": -0.008115438744425774,
        "interaction_matrix_overlap_top_k": 0.0050923144444823265,
        "interaction_matrix_overlap_bottom_k": 0.0012615978484973311,
        "effective_rank": 0.0011093097273260355,
        "effective_rank_mergeability_score": -0.001242073718458414,
        "stable_rank": 0.0014087400631979108,
        "spectral_gap": -0.0017454616026952863,
        "singular_value_ratio": 0.001837287680245936,
        "layerwise_effective_rank": 0.0014286767691373825,
        "layerwise_effective_rank_mergeability_score": -0.0013371044769883156,
        "task_vector_cosine_similarity": 0.004301866516470909,
        "task_vector_l2_distance": -0.00397390965372324,
        "task_vector_dot_product": 0.0012523563345894217,
        "weight_space_angle": -0.005628383718430996,
        "task_vector_magnitude_ratio": 0.0017099407268688083,
        "singular_value_overlap": 0.0040045250207185745,
        "subspace_overlap": 0.001828220672905445,
        "right_subspace_overlap": 0.008515117689967155,
        "activation_l2_distance": 0.0034287748858332634,
        "activation_cosine_similarity": 0.011739924550056458,
        "activation_magnitude_ratio": -0.003763754153624177,
        "activation_dot_product": 0.0056189498864114285,
        "encoder_gradient_cosine_similarity": 0.0032728826627135277,
        "encoder_gradient_l2_distance": -0.018063845112919807,
        "encoder_gradient_dot_product": 0.003300704061985016,
        "input_gradient_cosine_similarity": 0.001770233502611518,
        "input_gradient_l2_distance": -0.017759479582309723,
        "input_gradient_dot_product": -0.006273755803704262
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7484884020070731,
      "val_r": 0.7040006710871135,
      "n_iterations": 181,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01340597216039896,
        "right_subspace_overlap_bottom_k": -0.01835760474205017,
        "interaction_matrix_overlap_top_k": 0.0030394583009183407,
        "interaction_matrix_overlap_bottom_k": -0.002720687072724104,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0010606369469314814,
        "stable_rank": -0.0017595515819266438,
        "spectral_gap": -0.0011681062169373035,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002069291193038225,
        "layerwise_effective_rank_mergeability_score": 0.0020596832036972046,
        "task_vector_cosine_similarity": -0.0015564365312457085,
        "task_vector_l2_distance": -0.005799052305519581,
        "task_vector_dot_product": -0.0012677133781835437,
        "weight_space_angle": 0.005540396552532911,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0025114708114415407,
        "subspace_overlap": 0.002166751539334655,
        "right_subspace_overlap": 0.012278051115572453,
        "activation_l2_distance": -0.0022801519371569157,
        "activation_cosine_similarity": 0.013690602965652943,
        "activation_magnitude_ratio": -0.003121388843283057,
        "activation_dot_product": 0.010933329351246357,
        "encoder_gradient_cosine_similarity": 0.004972036927938461,
        "encoder_gradient_l2_distance": -0.02829176001250744,
        "encoder_gradient_dot_product": 0.007362585049122572,
        "input_gradient_cosine_similarity": 0.004034403245896101,
        "input_gradient_l2_distance": -0.030692800879478455,
        "input_gradient_dot_product": -0.011496673338115215
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7069149664224414,
      "val_r": 0.5449229934709972,
      "n_iterations": 287,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.017454449087381363,
        "right_subspace_overlap_bottom_k": -0.024294862523674965,
        "interaction_matrix_overlap_top_k": 0.006096201948821545,
        "interaction_matrix_overlap_bottom_k": 0.0021350220777094364,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.00298998411744833,
        "singular_value_ratio": 0.0019682706333696842,
        "layerwise_effective_rank": -0.0011229870142415166,
        "layerwise_effective_rank_mergeability_score": 0.0013183706905692816,
        "task_vector_cosine_similarity": -0.0013405017089098692,
        "task_vector_l2_distance": -0.008773823268711567,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0023745340295135975,
        "task_vector_magnitude_ratio": 0.001498967525549233,
        "singular_value_overlap": 0.00556210707873106,
        "subspace_overlap": 0.0025456089060753584,
        "right_subspace_overlap": 0.017924387007951736,
        "activation_l2_distance": -0.004301498178392649,
        "activation_cosine_similarity": 0.01923150196671486,
        "activation_magnitude_ratio": 0.0026811007410287857,
        "activation_dot_product": 0.031051214784383774,
        "encoder_gradient_cosine_similarity": 0.0014487984590232372,
        "encoder_gradient_l2_distance": -0.07636620104312897,
        "encoder_gradient_dot_product": -0.0013418806483969092,
        "input_gradient_cosine_similarity": -0.0010749687207862735,
        "input_gradient_l2_distance": -0.07932557910680771,
        "input_gradient_dot_product": -0.009162185713648796
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7829939062413407,
      "val_r": 0.5257531783556362,
      "n_iterations": 303,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009371960535645485,
        "right_subspace_overlap_bottom_k": -0.01577179506421089,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002531979698687792,
        "layerwise_effective_rank_mergeability_score": 0.002525699557736516,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.002068891189992428,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0020169480703771114,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005218958482146263,
        "activation_l2_distance": 0.0015210899291560054,
        "activation_cosine_similarity": 0.020664745941758156,
        "activation_magnitude_ratio": -0.003270520828664303,
        "activation_dot_product": -0.001469096401706338,
        "encoder_gradient_cosine_similarity": 0.0028316951356828213,
        "encoder_gradient_l2_distance": -0.03262852132320404,
        "encoder_gradient_dot_product": 0.0014360386412590742,
        "input_gradient_cosine_similarity": 0.0012129920069128275,
        "input_gradient_l2_distance": -0.012178799137473106,
        "input_gradient_dot_product": -0.00818860437721014
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5498714874491438,
      "val_r": 0.5764097399145472,
      "n_iterations": 366,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.013657225295901299,
        "right_subspace_overlap_bottom_k": -0.004104543477296829,
        "interaction_matrix_overlap_top_k": 0.015821482986211777,
        "interaction_matrix_overlap_bottom_k": -0.0020689077209681273,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0013372583780437708,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.001387808471918106,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.014351706951856613,
        "task_vector_l2_distance": -0.015473637729883194,
        "task_vector_dot_product": 0.010879112407565117,
        "weight_space_angle": -0.016267728060483932,
        "task_vector_magnitude_ratio": 0.00126942980568856,
        "singular_value_overlap": 0.008711554110050201,
        "subspace_overlap": 0.013155014254152775,
        "right_subspace_overlap": 0.01227435003966093,
        "activation_l2_distance": -0.016103729605674744,
        "activation_cosine_similarity": 0.01737302541732788,
        "activation_magnitude_ratio": 0.002151991706341505,
        "activation_dot_product": 0.03394694626331329,
        "encoder_gradient_cosine_similarity": 0.009948899038136005,
        "encoder_gradient_l2_distance": -0.025946343317627907,
        "encoder_gradient_dot_product": -0.001575423520989716,
        "input_gradient_cosine_similarity": -0.0014096822123974562,
        "input_gradient_l2_distance": -0.027722543105483055,
        "input_gradient_dot_product": -0.009877907112240791
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}