{
  "weight_avg": {
    "aggregate_metrics": {
      "train_r": 0.4139693561553167,
      "train_p": 1.2316343061628566e-133,
      "val_r": 0.4144841581795257,
      "val_p": 2.698218315867555e-16
    },
    "per_fold_stats": {
      "train_r_mean": 0.71262920818384,
      "train_r_std": 0.051609657958610715,
      "val_r_mean": 0.595483812621085,
      "val_r_std": 0.18542750329522736,
      "n_nonzero_mean": 19.35,
      "n_nonzero_std": 4.162631379308045
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.00858012679964304,
      "right_subspace_overlap_bottom_k": -0.012563901953399181,
      "interaction_matrix_overlap_top_k": 0.002696602139621973,
      "interaction_matrix_overlap_bottom_k": 0.00020185155153740197,
      "effective_rank": 3.664487667265348e-05,
      "effective_rank_mergeability_score": 1.478957710787654e-05,
      "stable_rank": -0.00018095248378813267,
      "spectral_gap": -0.000471137638669461,
      "singular_value_ratio": 0.00027577500441111624,
      "layerwise_effective_rank": -0.0005265657091513276,
      "layerwise_effective_rank_mergeability_score": 0.0007482047658413649,
      "task_vector_cosine_similarity": 0.0004935021861456335,
      "task_vector_l2_distance": -0.00489855045452714,
      "task_vector_dot_product": 0.00019358753343112767,
      "weight_space_angle": -0.00048789745778776705,
      "task_vector_magnitude_ratio": 0.0003288144653197378,
      "singular_value_overlap": 0.0010773919057101011,
      "subspace_overlap": 0.0009013173985294998,
      "right_subspace_overlap": 0.009669145569205284,
      "activation_l2_distance": -0.0023624952882528305,
      "activation_cosine_similarity": 0.015026758424937725,
      "activation_magnitude_ratio": -0.0024465317837893963,
      "activation_dot_product": 0.005946378223598003,
      "encoder_gradient_cosine_similarity": 0.0031095880549401045,
      "encoder_gradient_l2_distance": -0.033981747925281525,
      "encoder_gradient_dot_product": 0.0008441272075287998,
      "input_gradient_cosine_similarity": 0.0011626684572547674,
      "input_gradient_l2_distance": -0.02484271302819252,
      "input_gradient_dot_product": -0.0052782222628593445
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.004710078705102205,
      "right_subspace_overlap_bottom_k": 0.006615567021071911,
      "interaction_matrix_overlap_top_k": 0.003841655794531107,
      "interaction_matrix_overlap_bottom_k": 0.001885278383269906,
      "effective_rank": 0.0005270194378681481,
      "effective_rank_mergeability_score": 0.0007184629794210196,
      "stable_rank": 0.0008367974078282714,
      "spectral_gap": 0.001043274300172925,
      "singular_value_ratio": 0.0010521847289055586,
      "layerwise_effective_rank": 0.0010860032634809613,
      "layerwise_effective_rank_mergeability_score": 0.0012306462740525603,
      "task_vector_cosine_similarity": 0.0036292385775595903,
      "task_vector_l2_distance": 0.005006685387343168,
      "task_vector_dot_product": 0.0028741878923028708,
      "weight_space_angle": 0.004280199762433767,
      "task_vector_magnitude_ratio": 0.0007648772443644702,
      "singular_value_overlap": 0.0025878509040921926,
      "subspace_overlap": 0.0032235325779765844,
      "right_subspace_overlap": 0.00465243449434638,
      "activation_l2_distance": 0.006227007135748863,
      "activation_cosine_similarity": 0.004757098853588104,
      "activation_magnitude_ratio": 0.002545519033446908,
      "activation_dot_product": 0.012129505164921284,
      "encoder_gradient_cosine_similarity": 0.002321737352758646,
      "encoder_gradient_l2_distance": 0.01684023253619671,
      "encoder_gradient_dot_product": 0.0025946851819753647,
      "input_gradient_cosine_similarity": 0.0015118563314899802,
      "input_gradient_l2_distance": 0.022423435002565384,
      "input_gradient_dot_product": 0.003320841584354639
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 1.0,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.7,
      "interaction_matrix_overlap_bottom_k": 0.6,
      "effective_rank": 0.15,
      "effective_rank_mergeability_score": 0.3,
      "stable_rank": 0.3,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.25,
      "layerwise_effective_rank": 0.5,
      "layerwise_effective_rank_mergeability_score": 0.45,
      "task_vector_cosine_similarity": 0.55,
      "task_vector_l2_distance": 0.75,
      "task_vector_dot_product": 0.65,
      "weight_space_angle": 0.5,
      "task_vector_magnitude_ratio": 0.3,
      "singular_value_overlap": 0.7,
      "subspace_overlap": 0.55,
      "right_subspace_overlap": 1.0,
      "activation_l2_distance": 0.85,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.8,
      "activation_dot_product": 0.65,
      "encoder_gradient_cosine_similarity": 1.0,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.8,
      "input_gradient_cosine_similarity": 0.75,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.9
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7465736634947071,
        "val_r": 0.6141580660679975,
        "n_iterations": 259,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004757261835038662,
          "right_subspace_overlap_bottom_k": -0.004554815124720335,
          "interaction_matrix_overlap_top_k": 0.002013747813180089,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.005029598716646433,
          "task_vector_dot_product": -0.0021364183630794287,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0012315702624619007,
          "singular_value_overlap": -0.001471254974603653,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0052145496010780334,
          "activation_l2_distance": 0.0018119974993169308,
          "activation_cosine_similarity": 0.017490744590759277,
          "activation_magnitude_ratio": -0.0031180281657725573,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.002332049421966076,
          "encoder_gradient_l2_distance": -0.03265007585287094,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.00237054331228137,
          "input_gradient_l2_distance": -0.008360089734196663,
          "input_gradient_dot_product": -0.008117591962218285
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.721693121202641,
        "val_r": 0.7971717822663296,
        "n_iterations": 279,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01254858635365963,
          "right_subspace_overlap_bottom_k": -0.016628947108983994,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0019401079043745995,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0017243518959730864,
          "spectral_gap": 0.0016037551686167717,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.001737657468765974,
          "task_vector_cosine_similarity": 0.0014840804506093264,
          "task_vector_l2_distance": -0.011820260435342789,
          "task_vector_dot_product": -0.0026118895038962364,
          "weight_space_angle": -0.0013674618676304817,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0012007259065285325,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.017603930085897446,
          "activation_l2_distance": -0.00937139242887497,
          "activation_cosine_similarity": 0.02025172859430313,
          "activation_magnitude_ratio": -0.002689594868570566,
          "activation_dot_product": 0.0012287237914279103,
          "encoder_gradient_cosine_similarity": 0.002711603883653879,
          "encoder_gradient_l2_distance": -0.051120657473802567,
          "encoder_gradient_dot_product": 0.0011759751942008734,
          "input_gradient_cosine_similarity": 0.001682164380326867,
          "input_gradient_l2_distance": -0.051050350069999695,
          "input_gradient_dot_product": -0.0029302197508513927
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.649006961343899,
        "val_r": 0.6114716677237888,
        "n_iterations": 305,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005502097774296999,
          "right_subspace_overlap_bottom_k": -0.00810432992875576,
          "interaction_matrix_overlap_top_k": 0.0011835845652967691,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.001171924639493227,
          "stable_rank": 0.0014155787648633122,
          "spectral_gap": -0.0014209793880581856,
          "singular_value_ratio": 0.0016537961782887578,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0019385823979973793,
          "subspace_overlap": -0.003010181710124016,
          "right_subspace_overlap": 0.009785669855773449,
          "activation_l2_distance": 0.005364277400076389,
          "activation_cosine_similarity": 0.01197126042097807,
          "activation_magnitude_ratio": -0.0026862905360758305,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0016738760750740767,
          "encoder_gradient_l2_distance": -0.01732007972896099,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0020953055936843157,
          "input_gradient_l2_distance": -0.006811793893575668,
          "input_gradient_dot_product": -0.0024355859495699406
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7399976509252302,
        "val_r": 0.6711635739586465,
        "n_iterations": 191,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0016396398423239589,
          "right_subspace_overlap_bottom_k": -0.010377462022006512,
          "interaction_matrix_overlap_top_k": 0.0019974419847130775,
          "interaction_matrix_overlap_bottom_k": 0.002164271892979741,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.002555245067924261,
          "task_vector_l2_distance": -0.0024325656704604626,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.012010814622044563,
          "activation_l2_distance": 0.0019184676930308342,
          "activation_cosine_similarity": 0.011676578782498837,
          "activation_magnitude_ratio": -0.002954744966700673,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.00347074493765831,
          "encoder_gradient_l2_distance": -0.01645175740122795,
          "encoder_gradient_dot_product": 0.0012794072972610593,
          "input_gradient_cosine_similarity": 0.0015253486344590783,
          "input_gradient_l2_distance": -0.012195615097880363,
          "input_gradient_dot_product": -0.004201535601168871
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7297176848576753,
        "val_r": 0.8053170210104545,
        "n_iterations": 244,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006371607072651386,
          "right_subspace_overlap_bottom_k": -0.009151935577392578,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.007907296530902386,
          "task_vector_dot_product": -0.0016062816139310598,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.007512927986681461,
          "activation_l2_distance": -0.0045299953781068325,
          "activation_cosine_similarity": 0.019635336473584175,
          "activation_magnitude_ratio": -0.007288071326911449,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.002771900501102209,
          "encoder_gradient_l2_distance": -0.045006535947322845,
          "encoder_gradient_dot_product": 0.0013511438155546784,
          "input_gradient_cosine_similarity": 0.0023659535218030214,
          "input_gradient_l2_distance": -0.028143260627985,
          "input_gradient_dot_product": -0.003174177836626768
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7403690112239814,
        "val_r": 0.6835814544565345,
        "n_iterations": 246,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0033870916813611984,
          "right_subspace_overlap_bottom_k": -0.004395840689539909,
          "interaction_matrix_overlap_top_k": 0.004238399676978588,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": -0.001651154481805861,
          "effective_rank_mergeability_score": 0.0016336794942617416,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.002586937742307782,
          "layerwise_effective_rank": -0.0012308716541156173,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0010972920572385192,
          "task_vector_l2_distance": -0.010436475276947021,
          "task_vector_dot_product": 0.001261943019926548,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.001252556685358286,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0033173987176269293,
          "activation_l2_distance": -0.00625475961714983,
          "activation_cosine_similarity": 0.023190177977085114,
          "activation_magnitude_ratio": -0.005916287191212177,
          "activation_dot_product": 0.0020409298595041037,
          "encoder_gradient_cosine_similarity": 0.00479262787848711,
          "encoder_gradient_l2_distance": -0.056392744183540344,
          "encoder_gradient_dot_product": -0.00127077242359519,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0012757759541273117,
          "input_gradient_dot_product": -0.0025742454454302788
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7334035710734469,
        "val_r": 0.43174553106619584,
        "n_iterations": 189,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00519327400252223,
          "right_subspace_overlap_bottom_k": -0.01230807788670063,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0011137435212731361,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.001010395586490631,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0032243956811726093,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0013594881165772676,
          "right_subspace_overlap": 0.008992563001811504,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.014719528146088123,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0054337927140295506,
          "encoder_gradient_l2_distance": -0.024616746231913567,
          "encoder_gradient_dot_product": 0.006936129182577133,
          "input_gradient_cosine_similarity": -0.0010443413630127907,
          "input_gradient_l2_distance": -0.021321211010217667,
          "input_gradient_dot_product": -0.0030932780355215073
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6886325362281189,
        "val_r": 0.3614958986914594,
        "n_iterations": 435,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005700204521417618,
          "right_subspace_overlap_bottom_k": -0.011198272928595543,
          "interaction_matrix_overlap_top_k": -0.001613835571333766,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0011156853288412094,
          "layerwise_effective_rank_mergeability_score": 0.0012379125691950321,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.004158291034400463,
          "weight_space_angle": 0.002061766805127263,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0010123095707967877,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006263066083192825,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.00948380958288908,
          "activation_magnitude_ratio": -0.002739682560786605,
          "activation_dot_product": -0.001038963906466961,
          "encoder_gradient_cosine_similarity": 0.00378204882144928,
          "encoder_gradient_l2_distance": -0.016869351267814636,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0019418663578107953,
          "input_gradient_l2_distance": -0.004722507204860449,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7558277662790652,
        "val_r": 0.5221119528714532,
        "n_iterations": 301,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010770456865429878,
          "right_subspace_overlap_bottom_k": -0.019477369263768196,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0013527318369597197,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002632678486406803,
          "layerwise_effective_rank_mergeability_score": 0.004150463733822107,
          "task_vector_cosine_similarity": -0.001829257933422923,
          "task_vector_l2_distance": -0.0022958810441195965,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0014358953339979053,
          "right_subspace_overlap": 0.009320396929979324,
          "activation_l2_distance": -0.01129004918038845,
          "activation_cosine_similarity": 0.01754843257367611,
          "activation_magnitude_ratio": -0.005655823275446892,
          "activation_dot_product": -0.0024859260302037,
          "encoder_gradient_cosine_similarity": 0.0014960987027734518,
          "encoder_gradient_l2_distance": -0.0384446419775486,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03454756364226341,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7179296377948734,
        "val_r": 0.7935827155691875,
        "n_iterations": 270,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.013793205842375755,
          "right_subspace_overlap_bottom_k": -0.01506218034774065,
          "interaction_matrix_overlap_top_k": 0.005085535813122988,
          "interaction_matrix_overlap_bottom_k": 0.002679120283573866,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.001813225564546883,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0014348509721457958,
          "layerwise_effective_rank_mergeability_score": 0.001959211193025112,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.013902842067182064,
          "task_vector_dot_product": 0.0015851211501285434,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0014057322405278683,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01165725663304329,
          "activation_l2_distance": -0.0016483785584568977,
          "activation_cosine_similarity": 0.0028296986129134893,
          "activation_magnitude_ratio": -0.004515659064054489,
          "activation_dot_product": -0.007086532656103373,
          "encoder_gradient_cosine_similarity": 0.0020082546398043633,
          "encoder_gradient_l2_distance": -0.05624326318502426,
          "encoder_gradient_dot_product": -0.002433165442198515,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0563192181289196,
          "input_gradient_dot_product": -0.008123164065182209
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7478055809545225,
        "val_r": 0.09587698741440052,
        "n_iterations": 332,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012163660721853375,
          "right_subspace_overlap_bottom_k": -0.007892929017543793,
          "interaction_matrix_overlap_top_k": -0.001159133855253458,
          "interaction_matrix_overlap_bottom_k": -0.0011823063250631094,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.001146239461377263,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0013567920541390777,
          "task_vector_dot_product": 0.0018829198088496923,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0025483337230980396,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.002806657925248146,
          "activation_l2_distance": -0.0020051333121955395,
          "activation_cosine_similarity": 0.017408723011612892,
          "activation_magnitude_ratio": -0.0016602614196017385,
          "activation_dot_product": 0.0031590473372489214,
          "encoder_gradient_cosine_similarity": 0.0013532901648432016,
          "encoder_gradient_l2_distance": -0.030656132847070694,
          "encoder_gradient_dot_product": 0.0013022113125771284,
          "input_gradient_cosine_similarity": 0.0017991071799769998,
          "input_gradient_l2_distance": -0.003935717511922121,
          "input_gradient_dot_product": -0.00137567357160151
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7168033816949608,
        "val_r": 0.6930603769397594,
        "n_iterations": 333,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01225774921476841,
          "right_subspace_overlap_bottom_k": -0.012547682039439678,
          "interaction_matrix_overlap_top_k": 0.0042548100464046,
          "interaction_matrix_overlap_bottom_k": 0.002134614158421755,
          "effective_rank": 0.0012747423024848104,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0026131796184927225,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0019970284774899483,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.002069841604679823,
          "subspace_overlap": 0.001700859284028411,
          "right_subspace_overlap": 0.007802381180226803,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.009170527569949627,
          "activation_magnitude_ratio": -0.00438362080603838,
          "activation_dot_product": 0.007712895516306162,
          "encoder_gradient_cosine_similarity": 0.005881779827177525,
          "encoder_gradient_l2_distance": -0.013905304484069347,
          "encoder_gradient_dot_product": 0.0023539543617516756,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015743862837553024,
          "input_gradient_dot_product": -0.006872732192277908
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7326766814063249,
        "val_r": 0.695811275478976,
        "n_iterations": 217,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006555825471878052,
          "right_subspace_overlap_bottom_k": -0.010426826775074005,
          "interaction_matrix_overlap_top_k": 0.0015369139146059752,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.001312200678512454,
          "task_vector_cosine_similarity": 0.003462825436145067,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0013697840040549636,
          "weight_space_angle": -0.001260238466784358,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0016850084066390991,
          "subspace_overlap": -0.0022498781327158213,
          "right_subspace_overlap": 0.003917216788977385,
          "activation_l2_distance": 0.008134807460010052,
          "activation_cosine_similarity": 0.01725567877292633,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0014878124929964542,
          "encoder_gradient_l2_distance": -0.022267106920480728,
          "encoder_gradient_dot_product": -0.002462238073348999,
          "input_gradient_cosine_similarity": 0.003981403075158596,
          "input_gradient_l2_distance": -0.005934727378189564,
          "input_gradient_dot_product": -0.004073622170835733
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7269878984825061,
        "val_r": 0.7804595183633558,
        "n_iterations": 294,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025570495054125786,
          "right_subspace_overlap_bottom_k": -0.008141877129673958,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0018539782613515854,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0012688423739746213,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0015616851160302758,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.001628296566195786,
          "right_subspace_overlap": 0.011655004695057869,
          "activation_l2_distance": 0.0025043587666004896,
          "activation_cosine_similarity": 0.012062359601259232,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0024401687551289797,
          "encoder_gradient_l2_distance": -0.021824296563863754,
          "encoder_gradient_dot_product": 0.0010606375290080905,
          "input_gradient_cosine_similarity": 0.0020030387677252293,
          "input_gradient_l2_distance": -0.007617623079568148,
          "input_gradient_dot_product": -0.004650663584470749
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6957431983146035,
        "val_r": 0.7475471629316266,
        "n_iterations": 318,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.013462860137224197,
          "right_subspace_overlap_bottom_k": -0.03036523424088955,
          "interaction_matrix_overlap_top_k": 0.006345122586935759,
          "interaction_matrix_overlap_bottom_k": -0.005273522809147835,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.002691581379622221,
          "singular_value_ratio": 0.0026430829893797636,
          "layerwise_effective_rank": -0.0012094550766050816,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0027385232970118523,
          "task_vector_l2_distance": -0.007613364141434431,
          "task_vector_dot_product": 0.0014295184519141912,
          "weight_space_angle": 0.004769246093928814,
          "task_vector_magnitude_ratio": 0.0017678363947197795,
          "singular_value_overlap": 0.0015592641429975629,
          "subspace_overlap": 0.0035946574062108994,
          "right_subspace_overlap": 0.019312230870127678,
          "activation_l2_distance": -0.014148593880236149,
          "activation_cosine_similarity": 0.01314075943082571,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.035316042602062225,
          "encoder_gradient_cosine_similarity": -0.0019185980781912804,
          "encoder_gradient_l2_distance": -0.05456953123211861,
          "encoder_gradient_dot_product": -0.0015927599743008614,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.07119573652744293,
          "input_gradient_dot_product": -0.008942823857069016
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.6211470562802448,
        "val_r": 0.25403468478323876,
        "n_iterations": 279,
        "n_nonzero_coefficients": 29,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011999636888504028,
          "right_subspace_overlap_bottom_k": -0.008115438744425774,
          "interaction_matrix_overlap_top_k": 0.0050923144444823265,
          "interaction_matrix_overlap_bottom_k": 0.0012615978484973311,
          "effective_rank": 0.0011093097273260355,
          "effective_rank_mergeability_score": -0.001242073718458414,
          "stable_rank": 0.0014087400631979108,
          "spectral_gap": -0.0017454616026952863,
          "singular_value_ratio": 0.001837287680245936,
          "layerwise_effective_rank": 0.0014286767691373825,
          "layerwise_effective_rank_mergeability_score": -0.0013371044769883156,
          "task_vector_cosine_similarity": 0.004301866516470909,
          "task_vector_l2_distance": -0.00397390965372324,
          "task_vector_dot_product": 0.0012523563345894217,
          "weight_space_angle": -0.005628383718430996,
          "task_vector_magnitude_ratio": 0.0017099407268688083,
          "singular_value_overlap": 0.0040045250207185745,
          "subspace_overlap": 0.001828220672905445,
          "right_subspace_overlap": 0.008515117689967155,
          "activation_l2_distance": 0.0034287748858332634,
          "activation_cosine_similarity": 0.011739924550056458,
          "activation_magnitude_ratio": -0.003763754153624177,
          "activation_dot_product": 0.0056189498864114285,
          "encoder_gradient_cosine_similarity": 0.0032728826627135277,
          "encoder_gradient_l2_distance": -0.018063845112919807,
          "encoder_gradient_dot_product": 0.003300704061985016,
          "input_gradient_cosine_similarity": 0.001770233502611518,
          "input_gradient_l2_distance": -0.017759479582309723,
          "input_gradient_dot_product": -0.006273755803704262
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7484884020070731,
        "val_r": 0.7040006710871135,
        "n_iterations": 181,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01340597216039896,
          "right_subspace_overlap_bottom_k": -0.01835760474205017,
          "interaction_matrix_overlap_top_k": 0.0030394583009183407,
          "interaction_matrix_overlap_bottom_k": -0.002720687072724104,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0010606369469314814,
          "stable_rank": -0.0017595515819266438,
          "spectral_gap": -0.0011681062169373035,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002069291193038225,
          "layerwise_effective_rank_mergeability_score": 0.0020596832036972046,
          "task_vector_cosine_similarity": -0.0015564365312457085,
          "task_vector_l2_distance": -0.005799052305519581,
          "task_vector_dot_product": -0.0012677133781835437,
          "weight_space_angle": 0.005540396552532911,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0025114708114415407,
          "subspace_overlap": 0.002166751539334655,
          "right_subspace_overlap": 0.012278051115572453,
          "activation_l2_distance": -0.0022801519371569157,
          "activation_cosine_similarity": 0.013690602965652943,
          "activation_magnitude_ratio": -0.003121388843283057,
          "activation_dot_product": 0.010933329351246357,
          "encoder_gradient_cosine_similarity": 0.004972036927938461,
          "encoder_gradient_l2_distance": -0.02829176001250744,
          "encoder_gradient_dot_product": 0.007362585049122572,
          "input_gradient_cosine_similarity": 0.004034403245896101,
          "input_gradient_l2_distance": -0.030692800879478455,
          "input_gradient_dot_product": -0.011496673338115215
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7069149664224414,
        "val_r": 0.5449229934709972,
        "n_iterations": 287,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.017454449087381363,
          "right_subspace_overlap_bottom_k": -0.024294862523674965,
          "interaction_matrix_overlap_top_k": 0.006096201948821545,
          "interaction_matrix_overlap_bottom_k": 0.0021350220777094364,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.00298998411744833,
          "singular_value_ratio": 0.0019682706333696842,
          "layerwise_effective_rank": -0.0011229870142415166,
          "layerwise_effective_rank_mergeability_score": 0.0013183706905692816,
          "task_vector_cosine_similarity": -0.0013405017089098692,
          "task_vector_l2_distance": -0.008773823268711567,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0023745340295135975,
          "task_vector_magnitude_ratio": 0.001498967525549233,
          "singular_value_overlap": 0.00556210707873106,
          "subspace_overlap": 0.0025456089060753584,
          "right_subspace_overlap": 0.017924387007951736,
          "activation_l2_distance": -0.004301498178392649,
          "activation_cosine_similarity": 0.01923150196671486,
          "activation_magnitude_ratio": 0.0026811007410287857,
          "activation_dot_product": 0.031051214784383774,
          "encoder_gradient_cosine_similarity": 0.0014487984590232372,
          "encoder_gradient_l2_distance": -0.07636620104312897,
          "encoder_gradient_dot_product": -0.0013418806483969092,
          "input_gradient_cosine_similarity": -0.0010749687207862735,
          "input_gradient_l2_distance": -0.07932557910680771,
          "input_gradient_dot_product": -0.009162185713648796
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7829939062413407,
        "val_r": 0.5257531783556362,
        "n_iterations": 303,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009371960535645485,
          "right_subspace_overlap_bottom_k": -0.01577179506421089,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002531979698687792,
          "layerwise_effective_rank_mergeability_score": 0.002525699557736516,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.002068891189992428,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0020169480703771114,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005218958482146263,
          "activation_l2_distance": 0.0015210899291560054,
          "activation_cosine_similarity": 0.020664745941758156,
          "activation_magnitude_ratio": -0.003270520828664303,
          "activation_dot_product": -0.001469096401706338,
          "encoder_gradient_cosine_similarity": 0.0028316951356828213,
          "encoder_gradient_l2_distance": -0.03262852132320404,
          "encoder_gradient_dot_product": 0.0014360386412590742,
          "input_gradient_cosine_similarity": 0.0012129920069128275,
          "input_gradient_l2_distance": -0.012178799137473106,
          "input_gradient_dot_product": -0.00818860437721014
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5498714874491438,
        "val_r": 0.5764097399145472,
        "n_iterations": 366,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.013657225295901299,
          "right_subspace_overlap_bottom_k": -0.004104543477296829,
          "interaction_matrix_overlap_top_k": 0.015821482986211777,
          "interaction_matrix_overlap_bottom_k": -0.0020689077209681273,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0013372583780437708,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.001387808471918106,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.014351706951856613,
          "task_vector_l2_distance": -0.015473637729883194,
          "task_vector_dot_product": 0.010879112407565117,
          "weight_space_angle": -0.016267728060483932,
          "task_vector_magnitude_ratio": 0.00126942980568856,
          "singular_value_overlap": 0.008711554110050201,
          "subspace_overlap": 0.013155014254152775,
          "right_subspace_overlap": 0.01227435003966093,
          "activation_l2_distance": -0.016103729605674744,
          "activation_cosine_similarity": 0.01737302541732788,
          "activation_magnitude_ratio": 0.002151991706341505,
          "activation_dot_product": 0.03394694626331329,
          "encoder_gradient_cosine_similarity": 0.009948899038136005,
          "encoder_gradient_l2_distance": -0.025946343317627907,
          "encoder_gradient_dot_product": -0.001575423520989716,
          "input_gradient_cosine_similarity": -0.0014096822123974562,
          "input_gradient_l2_distance": -0.027722543105483055,
          "input_gradient_dot_product": -0.009877907112240791
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_r": 0.3917477808627931,
      "train_p": 1.1520125729793059e-118,
      "val_r": 0.23694319788887497,
      "val_p": 5.837310361483599e-06
    },
    "per_fold_stats": {
      "train_r_mean": 0.5854898891771219,
      "train_r_std": 0.05817213595727462,
      "val_r_mean": 0.43707050094559075,
      "val_r_std": 0.1592711518811142,
      "n_nonzero_mean": 19.95,
      "n_nonzero_std": 2.71062723368596
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0037477246951311827,
      "right_subspace_overlap_bottom_k": 0.00231947167776525,
      "interaction_matrix_overlap_top_k": 0.00042551400838419795,
      "interaction_matrix_overlap_bottom_k": 0.015809424221515656,
      "effective_rank": -0.00041394858271814883,
      "effective_rank_mergeability_score": 0.0006149112014099956,
      "stable_rank": -0.0005335566820576787,
      "spectral_gap": 0.00036549632204696536,
      "singular_value_ratio": -0.0007274487870745361,
      "layerwise_effective_rank": 9.0822133643087e-05,
      "layerwise_effective_rank_mergeability_score": -4.189403171039885e-06,
      "task_vector_cosine_similarity": -7.505530811613426e-05,
      "task_vector_l2_distance": -0.01891893334686756,
      "task_vector_dot_product": -0.0022625583223998547,
      "weight_space_angle": 4.8540277930442244e-05,
      "task_vector_magnitude_ratio": -0.0030212069395929575,
      "singular_value_overlap": -0.012787980027496815,
      "subspace_overlap": 0.0018025061581283808,
      "right_subspace_overlap": 0.003992151003330946,
      "activation_l2_distance": -0.0013381324242800474,
      "activation_cosine_similarity": 0.0043684314005076885,
      "activation_magnitude_ratio": -0.002516301814466715,
      "activation_dot_product": 0.002063130959868431,
      "encoder_gradient_cosine_similarity": 0.0012900183210149407,
      "encoder_gradient_l2_distance": -0.02510172687470913,
      "encoder_gradient_dot_product": 0.002183905802667141,
      "input_gradient_cosine_similarity": 0.0009999233298003674,
      "input_gradient_l2_distance": -0.02733195386826992,
      "input_gradient_dot_product": -0.006324085406959057
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.0034218684304505587,
      "right_subspace_overlap_bottom_k": 0.006579133681952953,
      "interaction_matrix_overlap_top_k": 0.0021946250926703215,
      "interaction_matrix_overlap_bottom_k": 0.004869608208537102,
      "effective_rank": 0.0010929524432867765,
      "effective_rank_mergeability_score": 0.001044475706294179,
      "stable_rank": 0.0008320359629578888,
      "spectral_gap": 0.0007504062377847731,
      "singular_value_ratio": 0.0011729621328413486,
      "layerwise_effective_rank": 0.0011065690778195858,
      "layerwise_effective_rank_mergeability_score": 0.0010391226969659328,
      "task_vector_cosine_similarity": 0.0014355223393067718,
      "task_vector_l2_distance": 0.00920858234167099,
      "task_vector_dot_product": 0.0045274836011230946,
      "weight_space_angle": 0.0020014930050820112,
      "task_vector_magnitude_ratio": 0.0015213115839287639,
      "singular_value_overlap": 0.0055632456205785275,
      "subspace_overlap": 0.002767970087006688,
      "right_subspace_overlap": 0.004232888109982014,
      "activation_l2_distance": 0.0027159377932548523,
      "activation_cosine_similarity": 0.004904825706034899,
      "activation_magnitude_ratio": 0.0025467723608016968,
      "activation_dot_product": 0.0031967752147465944,
      "encoder_gradient_cosine_similarity": 0.0012969902018085122,
      "encoder_gradient_l2_distance": 0.01214951928704977,
      "encoder_gradient_dot_product": 0.002279068110510707,
      "input_gradient_cosine_similarity": 0.0017718096496537328,
      "input_gradient_l2_distance": 0.014155802316963673,
      "input_gradient_dot_product": 0.00524390721693635
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.85,
      "right_subspace_overlap_bottom_k": 0.8,
      "interaction_matrix_overlap_top_k": 0.5,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.4,
      "effective_rank_mergeability_score": 0.3,
      "stable_rank": 0.3,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.45,
      "layerwise_effective_rank": 0.35,
      "layerwise_effective_rank_mergeability_score": 0.35,
      "task_vector_cosine_similarity": 0.5,
      "task_vector_l2_distance": 1.0,
      "task_vector_dot_product": 0.7,
      "weight_space_angle": 0.6,
      "task_vector_magnitude_ratio": 0.9,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.65,
      "right_subspace_overlap": 0.85,
      "activation_l2_distance": 0.6,
      "activation_cosine_similarity": 0.85,
      "activation_magnitude_ratio": 0.8,
      "activation_dot_product": 0.85,
      "encoder_gradient_cosine_similarity": 0.6,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.75,
      "input_gradient_cosine_similarity": 0.7,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.95
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6143479166889876,
        "val_r": 0.5609875755689814,
        "n_iterations": 336,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006001337431371212,
          "right_subspace_overlap_bottom_k": 0.0072823623195290565,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.022553149610757828,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0023202747106552124,
          "layerwise_effective_rank_mergeability_score": -0.0020837695337831974,
          "task_vector_cosine_similarity": 0.001982383895665407,
          "task_vector_l2_distance": -0.023881344124674797,
          "task_vector_dot_product": -0.012634214013814926,
          "weight_space_angle": 0.003819542471319437,
          "task_vector_magnitude_ratio": -0.00440277298912406,
          "singular_value_overlap": -0.021546699106693268,
          "subspace_overlap": 0.01163461059331894,
          "right_subspace_overlap": 0.004143170081079006,
          "activation_l2_distance": -0.006451122462749481,
          "activation_cosine_similarity": 0.00997223425656557,
          "activation_magnitude_ratio": -0.005476315971463919,
          "activation_dot_product": -0.004295612685382366,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03037828765809536,
          "encoder_gradient_dot_product": 0.0011567807523533702,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.033497363328933716,
          "input_gradient_dot_product": -0.0050719729624688625
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5955083594996604,
        "val_r": 0.565573173963452,
        "n_iterations": 270,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0014050654135644436,
          "right_subspace_overlap_bottom_k": -0.004320988897234201,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.014441588893532753,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.010848102159798145,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004135867115110159,
          "singular_value_overlap": -0.00669501069933176,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0012636409373953938,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0022548383567482233,
          "activation_dot_product": 0.0015863118460401893,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013368752785027027,
          "encoder_gradient_dot_product": 0.002134204376488924,
          "input_gradient_cosine_similarity": 0.002462063916027546,
          "input_gradient_l2_distance": -0.012623089365661144,
          "input_gradient_dot_product": -0.0032611945644021034
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.600046781731082,
        "val_r": 0.5381598358829975,
        "n_iterations": 202,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005286942236125469,
          "right_subspace_overlap_bottom_k": 0.003271027933806181,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.017260633409023285,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.00160709407646209,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0017604754539206624,
          "task_vector_l2_distance": -0.02065267786383629,
          "task_vector_dot_product": 0.0023478176444768906,
          "weight_space_angle": 0.001553368871100247,
          "task_vector_magnitude_ratio": -0.0033980871085077524,
          "singular_value_overlap": -0.01295840460807085,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0015739991795271635,
          "activation_cosine_similarity": 0.00249261362478137,
          "activation_magnitude_ratio": -0.0031469373498111963,
          "activation_dot_product": 0.0031513208523392677,
          "encoder_gradient_cosine_similarity": 0.002762575400993228,
          "encoder_gradient_l2_distance": -0.02005116268992424,
          "encoder_gradient_dot_product": 0.0021761844400316477,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.019813772290945053,
          "input_gradient_dot_product": -0.0032289838418364525
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5643528886412661,
        "val_r": 0.43299689538171304,
        "n_iterations": 224,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006751570850610733,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.004994284361600876,
          "interaction_matrix_overlap_bottom_k": 0.01674238033592701,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0018838879186660051,
          "spectral_gap": 0.001684723305515945,
          "singular_value_ratio": -0.0010123836109414697,
          "layerwise_effective_rank": -0.0019786532502621412,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0013127194251865149,
          "task_vector_l2_distance": -0.013158908113837242,
          "task_vector_dot_product": -0.005201490595936775,
          "weight_space_angle": -0.0010413186391815543,
          "task_vector_magnitude_ratio": -0.003590442705899477,
          "singular_value_overlap": -0.019456403329968452,
          "subspace_overlap": 0.004292978905141354,
          "right_subspace_overlap": 0.011696082539856434,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.008719360455870628,
          "activation_magnitude_ratio": -0.009087461046874523,
          "activation_dot_product": 0.005087993107736111,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.029946917667984962,
          "encoder_gradient_dot_product": 0.004221505485475063,
          "input_gradient_cosine_similarity": 0.004258722998201847,
          "input_gradient_l2_distance": -0.0376499742269516,
          "input_gradient_dot_product": -0.020137852057814598
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5255219130626367,
        "val_r": 0.4688773700385776,
        "n_iterations": 341,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002079365309327841,
          "right_subspace_overlap_bottom_k": -0.005364381242543459,
          "interaction_matrix_overlap_top_k": -0.0012517963768914342,
          "interaction_matrix_overlap_bottom_k": 0.017321588471531868,
          "effective_rank": -0.0013437094166874886,
          "effective_rank_mergeability_score": 0.0010686407331377268,
          "stable_rank": 0.0,
          "spectral_gap": 0.0012119067832827568,
          "singular_value_ratio": -0.0014838362112641335,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0013215196086093783,
          "task_vector_cosine_similarity": 0.0010243345750495791,
          "task_vector_l2_distance": -0.012014921754598618,
          "task_vector_dot_product": -0.0028301835991442204,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0033566360361874104,
          "singular_value_overlap": -0.007190175354480743,
          "subspace_overlap": -0.0017294615972787142,
          "right_subspace_overlap": 0.0015610397094860673,
          "activation_l2_distance": -0.0015982537297531962,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0010917941108345985,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0012938189320266247,
          "encoder_gradient_l2_distance": -0.008681881241500378,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.001255725510418415,
          "input_gradient_l2_distance": -0.010952974669635296,
          "input_gradient_dot_product": -0.002619992708787322
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.6080196256463744,
        "val_r": 0.6696168792433892,
        "n_iterations": 451,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.002646534238010645,
          "interaction_matrix_overlap_top_k": -0.0012061818270012736,
          "interaction_matrix_overlap_bottom_k": 0.018814561888575554,
          "effective_rank": -0.0017118076793849468,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.014849032275378704,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.005085091572254896,
          "singular_value_overlap": -0.010280579328536987,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0011512292549014091,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.002457163529470563,
          "activation_dot_product": 0.0030722194351255894,
          "encoder_gradient_cosine_similarity": 0.0011984339216724038,
          "encoder_gradient_l2_distance": -0.016294613480567932,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.001088212593458593,
          "input_gradient_l2_distance": -0.00872272253036499,
          "input_gradient_dot_product": -0.0026217729318886995
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5872450340183619,
        "val_r": 0.03113228533760047,
        "n_iterations": 238,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0027311667799949646,
          "right_subspace_overlap_bottom_k": 0.014757857657968998,
          "interaction_matrix_overlap_top_k": -0.0020412292797118425,
          "interaction_matrix_overlap_bottom_k": 0.01672905869781971,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.002718151779845357,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.002061616163700819,
          "task_vector_l2_distance": -0.028109848499298096,
          "task_vector_dot_product": -0.00859706848859787,
          "weight_space_angle": 0.002298615174368024,
          "task_vector_magnitude_ratio": -0.004029236733913422,
          "singular_value_overlap": -0.020579423755407333,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.004239249974489212,
          "activation_l2_distance": -0.00880699884146452,
          "activation_cosine_similarity": 0.00520547479391098,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0011602581944316626,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.048338718712329865,
          "encoder_gradient_dot_product": 0.00797776784747839,
          "input_gradient_cosine_similarity": -0.003305700607597828,
          "input_gradient_l2_distance": -0.04828806594014168,
          "input_gradient_dot_product": -0.00886137131601572
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5297283543925406,
        "val_r": 0.17191839112426313,
        "n_iterations": 285,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00391112407669425,
          "right_subspace_overlap_bottom_k": -0.001082785427570343,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.019858554005622864,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0016380607848986983,
          "spectral_gap": 0.001387589843943715,
          "singular_value_ratio": -0.0015183226205408573,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0011900601675733924,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.021600717678666115,
          "task_vector_dot_product": -0.0066514769569039345,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.005012219306081533,
          "singular_value_overlap": -0.01680549420416355,
          "subspace_overlap": 0.0012697562342509627,
          "right_subspace_overlap": 0.0066964938305318356,
          "activation_l2_distance": 0.0015065206680446863,
          "activation_cosine_similarity": 0.006225673481822014,
          "activation_magnitude_ratio": -0.005812576971948147,
          "activation_dot_product": -0.0019264915026724339,
          "encoder_gradient_cosine_similarity": 0.003800485050305724,
          "encoder_gradient_l2_distance": -0.02047933079302311,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0012178975157439709,
          "input_gradient_l2_distance": -0.01667434349656105,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.6040893379232214,
        "val_r": 0.32960758693120196,
        "n_iterations": 335,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002040610183030367,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.016801344230771065,
          "effective_rank": -0.0033226462546736,
          "effective_rank_mergeability_score": 0.002692684531211853,
          "stable_rank": -0.002117505995556712,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01609487272799015,
          "task_vector_dot_product": 0.0010292488150298595,
          "weight_space_angle": 0.0013337660348042846,
          "task_vector_magnitude_ratio": -0.001242933445610106,
          "singular_value_overlap": -0.011750640347599983,
          "subspace_overlap": 0.0011252242838963866,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0032730726525187492,
          "activation_magnitude_ratio": -0.0035790614783763885,
          "activation_dot_product": 0.0017591926734894514,
          "encoder_gradient_cosine_similarity": 0.0017365238163620234,
          "encoder_gradient_l2_distance": -0.014900073409080505,
          "encoder_gradient_dot_product": 0.0017573091899976134,
          "input_gradient_cosine_similarity": 0.0012329955352470279,
          "input_gradient_l2_distance": -0.024914072826504707,
          "input_gradient_dot_product": -0.006694899871945381
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5961953881601751,
        "val_r": 0.31480248275270645,
        "n_iterations": 254,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004702517297118902,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.017940649762749672,
          "effective_rank": -0.001282256911508739,
          "effective_rank_mergeability_score": 0.0012809657491743565,
          "stable_rank": -0.0016262829303741455,
          "spectral_gap": 0.0010434488067403436,
          "singular_value_ratio": -0.001195718883536756,
          "layerwise_effective_rank": -0.0015139831230044365,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.001354625215753913,
          "task_vector_l2_distance": -0.024351587519049644,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0022061909548938274,
          "task_vector_magnitude_ratio": -0.001734578050673008,
          "singular_value_overlap": -0.015863962471485138,
          "subspace_overlap": 0.002135483082383871,
          "right_subspace_overlap": 0.0018465875182300806,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.004040937405079603,
          "activation_magnitude_ratio": -0.0033056950196623802,
          "activation_dot_product": 0.0010666290763765574,
          "encoder_gradient_cosine_similarity": 0.001432984136044979,
          "encoder_gradient_l2_distance": -0.02136397361755371,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.026178620755672455,
          "input_gradient_dot_product": -0.004274875856935978
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5461344038035788,
        "val_r": 0.2709568529107788,
        "n_iterations": 377,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0037055877037346363,
          "right_subspace_overlap_bottom_k": 0.0035785783547908068,
          "interaction_matrix_overlap_top_k": 0.002625243505463004,
          "interaction_matrix_overlap_bottom_k": 0.013638935983181,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012667701812461019,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0017742516938596964,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0021819504909217358,
          "task_vector_l2_distance": -0.014322448521852493,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.001265105907805264,
          "singular_value_overlap": -0.009690160863101482,
          "subspace_overlap": 0.001956482417881489,
          "right_subspace_overlap": 0.003698175773024559,
          "activation_l2_distance": -0.004040465224534273,
          "activation_cosine_similarity": 0.004556019324809313,
          "activation_magnitude_ratio": -0.0028170605655759573,
          "activation_dot_product": 0.002691203262656927,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.01794685795903206,
          "encoder_gradient_dot_product": 0.004246450029313564,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01706293225288391,
          "input_gradient_dot_product": -0.001773824100382626
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5795264454152953,
        "val_r": 0.4680056188894389,
        "n_iterations": 178,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0035965186543762684,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.016495058313012123,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.002055831253528595,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.001112542231567204,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.022003673017024994,
          "task_vector_dot_product": 0.002876266371458769,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0034896060824394226,
          "singular_value_overlap": -0.014306040480732918,
          "subspace_overlap": 0.0028346404433250427,
          "right_subspace_overlap": 0.0017673526890575886,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0019129316788166761,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0036291200667619705,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.02361343242228031,
          "encoder_gradient_dot_product": 0.0010216457303613424,
          "input_gradient_cosine_similarity": 0.0015405694721266627,
          "input_gradient_l2_distance": -0.023950790986418724,
          "input_gradient_dot_product": -0.009077141992747784
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5418108524642083,
        "val_r": 0.5238460829200023,
        "n_iterations": 237,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0036026393063366413,
          "right_subspace_overlap_bottom_k": -0.0019635299686342478,
          "interaction_matrix_overlap_top_k": 0.002461619907990098,
          "interaction_matrix_overlap_bottom_k": 0.01766391657292843,
          "effective_rank": 0.0016480219783261418,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.003206238616257906,
          "task_vector_l2_distance": -0.01020384393632412,
          "task_vector_dot_product": 0.0011630418011918664,
          "weight_space_angle": -0.005498719867318869,
          "task_vector_magnitude_ratio": -0.0025332451332360506,
          "singular_value_overlap": -0.011788487434387207,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.003939618356525898,
          "activation_l2_distance": -0.0011079998221248388,
          "activation_cosine_similarity": 0.003757753875106573,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0016844046767801046,
          "encoder_gradient_cosine_similarity": 0.003600247437134385,
          "encoder_gradient_l2_distance": -0.017178140580654144,
          "encoder_gradient_dot_product": 0.0046065328642725945,
          "input_gradient_cosine_similarity": 0.0025211432948708534,
          "input_gradient_l2_distance": -0.02259150519967079,
          "input_gradient_dot_product": -0.011916015297174454
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5566578066090138,
        "val_r": 0.653765625492652,
        "n_iterations": 409,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010913925245404243,
          "right_subspace_overlap_bottom_k": -0.0010923980735242367,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.013522780500352383,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01428250502794981,
          "task_vector_dot_product": -0.0026794308796525,
          "weight_space_angle": 0.0010903485817834735,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.013837171718478203,
          "subspace_overlap": 0.004963553510606289,
          "right_subspace_overlap": 0.004799004644155502,
          "activation_l2_distance": -0.0028786342591047287,
          "activation_cosine_similarity": 0.004038674291223288,
          "activation_magnitude_ratio": -0.001328629208728671,
          "activation_dot_product": 0.004570980556309223,
          "encoder_gradient_cosine_similarity": 0.0016839106101542711,
          "encoder_gradient_l2_distance": -0.027324683964252472,
          "encoder_gradient_dot_product": 0.0019627725705504417,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0300824586302042,
          "input_gradient_dot_product": -0.013487393036484718
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4737746351840928,
        "val_r": 0.5346348592393161,
        "n_iterations": 258,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0029197006952017546,
          "right_subspace_overlap_bottom_k": -0.008092103525996208,
          "interaction_matrix_overlap_top_k": 0.0033009222242981195,
          "interaction_matrix_overlap_bottom_k": 0.013408706523478031,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0012190408306196332,
          "singular_value_ratio": 0.00131707894615829,
          "layerwise_effective_rank": 0.0018680939683690667,
          "layerwise_effective_rank_mergeability_score": -0.002280952874571085,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.008452759124338627,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0014849158469587564,
          "task_vector_magnitude_ratio": -0.0020250107627362013,
          "singular_value_overlap": -0.0095598129555583,
          "subspace_overlap": 0.0033988915383815765,
          "right_subspace_overlap": 0.004029364325106144,
          "activation_l2_distance": -0.0015763535629957914,
          "activation_cosine_similarity": 0.0018949196673929691,
          "activation_magnitude_ratio": -0.003388145938515663,
          "activation_dot_product": 0.003330143168568611,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.016652334481477737,
          "encoder_gradient_dot_product": 0.0021369201131165028,
          "input_gradient_cosine_similarity": 0.002102028112858534,
          "input_gradient_l2_distance": -0.018322225660085678,
          "input_gradient_dot_product": -0.006516754627227783
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.6053682792641365,
        "val_r": 0.29852158361405345,
        "n_iterations": 228,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00563546409830451,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.011568245477974415,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0014357115142047405,
          "layerwise_effective_rank_mergeability_score": -0.001599665149115026,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.016251124441623688,
          "task_vector_dot_product": -0.0015062256716191769,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0030970843508839607,
          "singular_value_overlap": -0.003944288939237595,
          "subspace_overlap": 0.001127411494962871,
          "right_subspace_overlap": 0.006276421248912811,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.003395003965124488,
          "activation_magnitude_ratio": -0.0050366525538265705,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.00132596748881042,
          "encoder_gradient_l2_distance": -0.01752462610602379,
          "encoder_gradient_dot_product": 0.003833622904494405,
          "input_gradient_cosine_similarity": 0.001754753990098834,
          "input_gradient_l2_distance": -0.020063651725649834,
          "input_gradient_dot_product": -0.009425045922398567
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5690671195780511,
        "val_r": 0.4553732691093383,
        "n_iterations": 271,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011003748513758183,
          "right_subspace_overlap_bottom_k": 0.020254001021385193,
          "interaction_matrix_overlap_top_k": 0.0012292080791667104,
          "interaction_matrix_overlap_bottom_k": 0.01591314747929573,
          "effective_rank": 0.0010483741061761975,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0027081426233053207,
          "task_vector_l2_distance": -0.04501861333847046,
          "task_vector_dot_product": -0.0047156186774373055,
          "weight_space_angle": -0.0018827146850526333,
          "task_vector_magnitude_ratio": -0.0026847815606743097,
          "singular_value_overlap": -0.02383860945701599,
          "subspace_overlap": 0.0016690564807504416,
          "right_subspace_overlap": 0.01656733639538288,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.011573988012969494,
          "activation_magnitude_ratio": -0.002446881029754877,
          "activation_dot_product": 0.0015184355434030294,
          "encoder_gradient_cosine_similarity": 0.0036794834304600954,
          "encoder_gradient_l2_distance": -0.05178828537464142,
          "encoder_gradient_dot_product": 0.005936973262578249,
          "input_gradient_cosine_similarity": 0.004086918197572231,
          "input_gradient_l2_distance": -0.059805143624544144,
          "input_gradient_dot_product": 0.002756645670160651
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.581440839400873,
        "val_r": 0.39568610550459604,
        "n_iterations": 224,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007480908185243607,
          "right_subspace_overlap_bottom_k": 0.009608354419469833,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.021779458969831467,
          "effective_rank": -0.0021999054588377476,
          "effective_rank_mergeability_score": 0.0021880045533180237,
          "stable_rank": -0.002138625830411911,
          "spectral_gap": 0.0016361776506528258,
          "singular_value_ratio": -0.003436567261815071,
          "layerwise_effective_rank": -0.002089252695441246,
          "layerwise_effective_rank_mergeability_score": 0.0022564774844795465,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.03326628729701042,
          "task_vector_dot_product": -0.011697567999362946,
          "weight_space_angle": 0.0017340548802167177,
          "task_vector_magnitude_ratio": -0.004396360367536545,
          "singular_value_overlap": -0.009520945139229298,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.00475994311273098,
          "activation_l2_distance": -0.00463142991065979,
          "activation_cosine_similarity": 0.007860549725592136,
          "activation_magnitude_ratio": 0.002807473298162222,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0013437001034617424,
          "encoder_gradient_l2_distance": -0.045131929218769073,
          "encoder_gradient_dot_product": -0.0013731473591178656,
          "input_gradient_cosine_similarity": -0.0022225226275622845,
          "input_gradient_l2_distance": -0.06016825884580612,
          "input_gradient_dot_product": -0.012743180617690086
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7751925077810964,
        "val_r": 0.6234852625164171,
        "n_iterations": 252,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0018683098023757339,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0037365099415183067,
          "interaction_matrix_overlap_bottom_k": -0.001983589492738247,
          "effective_rank": -0.0011150416685268283,
          "effective_rank_mergeability_score": 0.0034608340356498957,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0017508193850517273,
          "task_vector_l2_distance": -0.004360782448202372,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0031574112363159657,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0027926466427743435,
          "subspace_overlap": 0.0013714900705963373,
          "right_subspace_overlap": 0.005833922419697046,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.017906030640006065,
          "activation_magnitude_ratio": -0.0019042917992919683,
          "activation_dot_product": 0.0034833436366170645,
          "encoder_gradient_cosine_similarity": 0.0019422362092882395,
          "encoder_gradient_l2_distance": -0.04255228489637375,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.02865055575966835,
          "input_gradient_dot_product": -0.005012887064367533
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6557692942777847,
        "val_r": 0.4334622824903392,
        "n_iterations": 277,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.002382962964475155,
          "right_subspace_overlap_bottom_k": 0.003900937968865037,
          "interaction_matrix_overlap_top_k": -0.00533830001950264,
          "interaction_matrix_overlap_bottom_k": 0.015718279406428337,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0015651208814233541,
          "singular_value_ratio": -0.002445243764668703,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02465463988482952,
          "task_vector_dot_product": 0.003845734754577279,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004945079330354929,
          "singular_value_overlap": -0.013354637660086155,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": -0.003274380462244153,
          "activation_l2_distance": 0.0023993155919015408,
          "activation_cosine_similarity": -0.0013747317716479301,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.01201368123292923,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.018518254160881042,
          "encoder_gradient_dot_product": 0.001882591051980853,
          "input_gradient_cosine_similarity": 0.002005660906434059,
          "input_gradient_l2_distance": -0.026626506820321083,
          "input_gradient_dot_product": -0.0025132112205028534
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_r": 0.47193871532745885,
      "train_p": 1.9854288769797865e-178,
      "val_r": 0.4105078773143099,
      "val_p": 5.504553976319951e-16
    },
    "per_fold_stats": {
      "train_r_mean": 0.76364070611366,
      "train_r_std": 0.026339148561237972,
      "val_r_mean": 0.6524865616112956,
      "val_r_std": 0.15920835421146798,
      "n_nonzero_mean": 19.5,
      "n_nonzero_std": 2.692582403567252
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.01039185468107462,
      "right_subspace_overlap_bottom_k": -0.023234279826283455,
      "interaction_matrix_overlap_top_k": 0.0010229663457721472,
      "interaction_matrix_overlap_bottom_k": 0.0005268526147119701,
      "effective_rank": -6.643246888415888e-05,
      "effective_rank_mergeability_score": -9.291296009905636e-05,
      "stable_rank": -0.0003020542790181935,
      "spectral_gap": -0.00019181423704139888,
      "singular_value_ratio": 0.00019192098989151418,
      "layerwise_effective_rank": -0.0009774146601557732,
      "layerwise_effective_rank_mergeability_score": 0.000781026144977659,
      "task_vector_cosine_similarity": -0.0008694689022377133,
      "task_vector_l2_distance": -0.002294618869200349,
      "task_vector_dot_product": -0.0009608825785107911,
      "weight_space_angle": 0.001601977040991187,
      "task_vector_magnitude_ratio": -4.4909487769473344e-05,
      "singular_value_overlap": 0.008445673622190952,
      "subspace_overlap": -0.0014024314004927874,
      "right_subspace_overlap": 0.011210983619093895,
      "activation_l2_distance": -0.0016580860828980803,
      "activation_cosine_similarity": 0.015191597864031792,
      "activation_magnitude_ratio": -0.0020339174661785364,
      "activation_dot_product": 0.007064687553793192,
      "encoder_gradient_cosine_similarity": 0.002147587016224861,
      "encoder_gradient_l2_distance": -0.03285149484872818,
      "encoder_gradient_dot_product": 0.0003085916396230459,
      "input_gradient_cosine_similarity": 0.0014924760907888412,
      "input_gradient_l2_distance": -0.020349230617284775,
      "input_gradient_dot_product": -0.0030782923568040133
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.00525326281785965,
      "right_subspace_overlap_bottom_k": 0.006289131008088589,
      "interaction_matrix_overlap_top_k": 0.0028389038052409887,
      "interaction_matrix_overlap_bottom_k": 0.0034924007486552,
      "effective_rank": 0.0008330994169227779,
      "effective_rank_mergeability_score": 0.0007454389124177396,
      "stable_rank": 0.00087262800661847,
      "spectral_gap": 0.0007419059984385967,
      "singular_value_ratio": 0.000810161407571286,
      "layerwise_effective_rank": 0.0014038217486813664,
      "layerwise_effective_rank_mergeability_score": 0.0012354424688965082,
      "task_vector_cosine_similarity": 0.003715971251949668,
      "task_vector_l2_distance": 0.004872738383710384,
      "task_vector_dot_product": 0.0021193912252783775,
      "weight_space_angle": 0.0022354410029947758,
      "task_vector_magnitude_ratio": 0.0007130084559321404,
      "singular_value_overlap": 0.005613329820334911,
      "subspace_overlap": 0.001869942876510322,
      "right_subspace_overlap": 0.005387477111071348,
      "activation_l2_distance": 0.0039334590546786785,
      "activation_cosine_similarity": 0.005800665356218815,
      "activation_magnitude_ratio": 0.0018591417465358973,
      "activation_dot_product": 0.011777758598327637,
      "encoder_gradient_cosine_similarity": 0.0012069897493347526,
      "encoder_gradient_l2_distance": 0.017338348552584648,
      "encoder_gradient_dot_product": 0.001695265294983983,
      "input_gradient_cosine_similarity": 0.0019309911876916885,
      "input_gradient_l2_distance": 0.01589168980717659,
      "input_gradient_dot_product": 0.002548891818150878
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 1.0,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.55,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 0.25,
      "effective_rank_mergeability_score": 0.25,
      "stable_rank": 0.25,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.35,
      "layerwise_effective_rank": 0.5,
      "layerwise_effective_rank_mergeability_score": 0.35,
      "task_vector_cosine_similarity": 0.6,
      "task_vector_l2_distance": 0.65,
      "task_vector_dot_product": 0.5,
      "weight_space_angle": 0.7,
      "task_vector_magnitude_ratio": 0.25,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.7,
      "right_subspace_overlap": 1.0,
      "activation_l2_distance": 0.75,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.7,
      "activation_dot_product": 0.9,
      "encoder_gradient_cosine_similarity": 0.85,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.65,
      "input_gradient_cosine_similarity": 0.55,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.9
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7605072750323043,
        "val_r": 0.5505701537713538,
        "n_iterations": 360,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011279534548521042,
          "right_subspace_overlap_bottom_k": -0.016956757754087448,
          "interaction_matrix_overlap_top_k": 0.002775129396468401,
          "interaction_matrix_overlap_bottom_k": 0.003477186895906925,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0010068779811263084,
          "task_vector_dot_product": -0.001079390523955226,
          "weight_space_angle": 0.0010632809717208147,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.00430840440094471,
          "subspace_overlap": 0.0012780365068465471,
          "right_subspace_overlap": 0.008646040223538876,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01612822152674198,
          "activation_magnitude_ratio": -0.004243497271090746,
          "activation_dot_product": 0.0018759852973744273,
          "encoder_gradient_cosine_similarity": 0.0015677365008741617,
          "encoder_gradient_l2_distance": -0.025088081136345863,
          "encoder_gradient_dot_product": -0.0013096884358674288,
          "input_gradient_cosine_similarity": 0.0015351837500929832,
          "input_gradient_l2_distance": -0.016836825758218765,
          "input_gradient_dot_product": -0.005277296062558889
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7440066987745588,
        "val_r": 0.7746330397879727,
        "n_iterations": 394,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005723155569285154,
          "right_subspace_overlap_bottom_k": -0.019587988033890724,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.004545197822153568,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0012048811186105013,
          "singular_value_ratio": 0.0015569995157420635,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.00591505179181695,
          "subspace_overlap": -0.0017176385736092925,
          "right_subspace_overlap": 0.015010873787105083,
          "activation_l2_distance": 0.0013545204419642687,
          "activation_cosine_similarity": 0.012110763229429722,
          "activation_magnitude_ratio": -0.002098198514431715,
          "activation_dot_product": 0.0041094934567809105,
          "encoder_gradient_cosine_similarity": 0.0019204916898161173,
          "encoder_gradient_l2_distance": -0.018757550045847893,
          "encoder_gradient_dot_product": 0.001302910503000021,
          "input_gradient_cosine_similarity": 0.00106775329913944,
          "input_gradient_l2_distance": -0.01518365927040577,
          "input_gradient_dot_product": -0.002268670592457056
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7755225959542899,
        "val_r": 0.8392711213720558,
        "n_iterations": 391,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01290604006499052,
          "right_subspace_overlap_bottom_k": -0.01757785864174366,
          "interaction_matrix_overlap_top_k": -0.0022654018830507994,
          "interaction_matrix_overlap_bottom_k": 0.0015352494083344936,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003120811888948083,
          "layerwise_effective_rank_mergeability_score": 0.002063373802229762,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.001689832890406251,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.001809729845263064,
          "subspace_overlap": -0.0031204097904264927,
          "right_subspace_overlap": 0.007481016684323549,
          "activation_l2_distance": 0.0012074918486177921,
          "activation_cosine_similarity": 0.013488546945154667,
          "activation_magnitude_ratio": -0.0029473337344825268,
          "activation_dot_product": -0.0011872007744386792,
          "encoder_gradient_cosine_similarity": 0.001881023170426488,
          "encoder_gradient_l2_distance": -0.020930826663970947,
          "encoder_gradient_dot_product": -0.0019620435778051615,
          "input_gradient_cosine_similarity": 0.0034199801739305258,
          "input_gradient_l2_distance": -0.006312255747616291,
          "input_gradient_dot_product": -0.002530083991587162
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7647306673104068,
        "val_r": 0.7240061695166632,
        "n_iterations": 299,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004994068294763565,
          "right_subspace_overlap_bottom_k": -0.023908359929919243,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0011087254388257861,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0038672201335430145,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.003315966110676527,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.006081376690417528,
          "subspace_overlap": -0.0011889039305970073,
          "right_subspace_overlap": 0.017194343730807304,
          "activation_l2_distance": 0.003646780736744404,
          "activation_cosine_similarity": 0.020680950954556465,
          "activation_magnitude_ratio": -0.0015463994350284338,
          "activation_dot_product": -0.0039402786642313,
          "encoder_gradient_cosine_similarity": 0.0029657480772584677,
          "encoder_gradient_l2_distance": -0.025155767798423767,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.003544297767803073,
          "input_gradient_dot_product": -0.005507552530616522
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7656315364861824,
        "val_r": 0.7472895003256594,
        "n_iterations": 437,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014049637131392956,
          "right_subspace_overlap_bottom_k": -0.02564697153866291,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0027756551280617714,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.001435547135770321,
          "task_vector_magnitude_ratio": -0.0012113124830648303,
          "singular_value_overlap": 0.005397249944508076,
          "subspace_overlap": -0.0018222004873678088,
          "right_subspace_overlap": 0.009799395687878132,
          "activation_l2_distance": 0.0021184992510825396,
          "activation_cosine_similarity": 0.01923413760960102,
          "activation_magnitude_ratio": -0.0013707939069718122,
          "activation_dot_product": -0.0028390607330948114,
          "encoder_gradient_cosine_similarity": 0.0024015421513468027,
          "encoder_gradient_l2_distance": -0.027403265237808228,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0030479026027023792,
          "input_gradient_l2_distance": -0.004370464477688074,
          "input_gradient_dot_product": -0.0020416155457496643
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7299534724663884,
        "val_r": 0.7338795846776529,
        "n_iterations": 273,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014973548240959644,
          "right_subspace_overlap_bottom_k": -0.04074452444911003,
          "interaction_matrix_overlap_top_k": 0.005485143978148699,
          "interaction_matrix_overlap_bottom_k": -0.0014797199983149767,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0017497187945991755,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.010279703885316849,
          "task_vector_l2_distance": -0.007582205347716808,
          "task_vector_dot_product": -0.006276184692978859,
          "weight_space_angle": 0.00736887427046895,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.02170000784099102,
          "subspace_overlap": -0.0032580541446805,
          "right_subspace_overlap": 0.01202761847525835,
          "activation_l2_distance": -0.010857366025447845,
          "activation_cosine_similarity": 0.026225818321108818,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.04006562754511833,
          "encoder_gradient_cosine_similarity": 0.0033371662721037865,
          "encoder_gradient_l2_distance": -0.0872500091791153,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.05878182500600815,
          "input_gradient_dot_product": -0.0029991932678967714
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7486886849809424,
        "val_r": 0.6860847163556371,
        "n_iterations": 466,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.007677366025745869,
          "right_subspace_overlap_bottom_k": -0.02394814044237137,
          "interaction_matrix_overlap_top_k": 0.0030758632346987724,
          "interaction_matrix_overlap_bottom_k": 0.005710020661354065,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005900510586798191,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.00273787509649992,
          "activation_l2_distance": -0.0017843247624114156,
          "activation_cosine_similarity": 0.008397962898015976,
          "activation_magnitude_ratio": -0.0016290000639855862,
          "activation_dot_product": 0.006313705816864967,
          "encoder_gradient_cosine_similarity": 0.0011863907566294074,
          "encoder_gradient_l2_distance": -0.02025531977415085,
          "encoder_gradient_dot_product": 0.0019180051749572158,
          "input_gradient_cosine_similarity": 0.0039000262040644884,
          "input_gradient_l2_distance": -0.018874499946832657,
          "input_gradient_dot_product": -0.006004870869219303
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7683721621891719,
        "val_r": 0.3869198832301105,
        "n_iterations": 345,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.020918821915984154,
          "right_subspace_overlap_bottom_k": -0.02194349840283394,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0010184048442170024,
          "layerwise_effective_rank_mergeability_score": 0.0012724248226732016,
          "task_vector_cosine_similarity": -0.005791707895696163,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0045347390696406364,
          "weight_space_angle": 0.0027609155513346195,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0025309198535978794,
          "subspace_overlap": 0.0011412312742322683,
          "right_subspace_overlap": 0.008647488430142403,
          "activation_l2_distance": -0.006928625050932169,
          "activation_cosine_similarity": 0.01685091108083725,
          "activation_magnitude_ratio": -0.003886663820594549,
          "activation_dot_product": -0.0014185280306264758,
          "encoder_gradient_cosine_similarity": 0.004027705639600754,
          "encoder_gradient_l2_distance": -0.02669108472764492,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.011399266310036182,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7916270459486785,
        "val_r": 0.5606677271816939,
        "n_iterations": 286,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.008488948456943035,
          "right_subspace_overlap_bottom_k": -0.025246407836675644,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.002575280610471964,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.001120055909268558,
          "singular_value_ratio": 0.0010814610868692398,
          "layerwise_effective_rank": -0.002795466687530279,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0023053856566548347,
          "task_vector_l2_distance": 0.0015516034327447414,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.003200617851689458,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.006258614361286163,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.020490583032369614,
          "activation_l2_distance": 0.0029500515665858984,
          "activation_cosine_similarity": 0.01903063803911209,
          "activation_magnitude_ratio": -0.0019538269843906164,
          "activation_dot_product": -0.00407018419355154,
          "encoder_gradient_cosine_similarity": 0.0037245163694024086,
          "encoder_gradient_l2_distance": -0.024991579353809357,
          "encoder_gradient_dot_product": 0.004020919091999531,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.012454988434910774,
          "input_gradient_dot_product": -0.0016113759484142065
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7277840219375449,
        "val_r": 0.402159423879808,
        "n_iterations": 282,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010327713564038277,
          "right_subspace_overlap_bottom_k": -0.02147228829562664,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.004437221214175224,
          "effective_rank": -0.001165024470537901,
          "effective_rank_mergeability_score": 0.0010241720592603087,
          "stable_rank": -0.0018557531293481588,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0032533123157918453,
          "layerwise_effective_rank_mergeability_score": 0.0031466828659176826,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0031719491817057133,
          "task_vector_dot_product": -0.0017682032193988562,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005135305225849152,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.00977794174104929,
          "activation_l2_distance": -0.0012438071426004171,
          "activation_cosine_similarity": -0.0017164587043225765,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.0017593302763998508,
          "encoder_gradient_cosine_similarity": 0.003831550944596529,
          "encoder_gradient_l2_distance": -0.015016790479421616,
          "encoder_gradient_dot_product": -0.0015746428398415446,
          "input_gradient_cosine_similarity": 0.0036741946823894978,
          "input_gradient_l2_distance": -0.013926757499575615,
          "input_gradient_dot_product": -0.0017162543954327703
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7925714797826183,
        "val_r": 0.17632662333784133,
        "n_iterations": 198,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.016474906355142593,
          "right_subspace_overlap_bottom_k": -0.022344287484884262,
          "interaction_matrix_overlap_top_k": -0.00114294677041471,
          "interaction_matrix_overlap_bottom_k": -0.0016673888312652707,
          "effective_rank": -0.0019757940899580717,
          "effective_rank_mergeability_score": 0.0017073567723855376,
          "stable_rank": -0.0011342098005115986,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0013755521504208446,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.002504173666238785,
          "task_vector_l2_distance": -0.0024435720406472683,
          "task_vector_dot_product": -0.004616455174982548,
          "weight_space_angle": 0.00364964478649199,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.016335666179656982,
          "subspace_overlap": -0.004269873257726431,
          "right_subspace_overlap": 0.007169612683355808,
          "activation_l2_distance": -0.007307027466595173,
          "activation_cosine_similarity": 0.01952088624238968,
          "activation_magnitude_ratio": -0.003779035061597824,
          "activation_dot_product": 0.0117418197914958,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.04022065922617912,
          "encoder_gradient_dot_product": -0.0020927165169268847,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015976902097463608,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7651211540789623,
        "val_r": 0.7349544037647776,
        "n_iterations": 232,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009406491182744503,
          "right_subspace_overlap_bottom_k": -0.019022492691874504,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0016355746192857623,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0013455834705382586,
          "singular_value_ratio": -0.0013342146994546056,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.003125191433355212,
          "task_vector_l2_distance": 0.0018896044930443168,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0029780957847833633,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.002907977905124426,
          "subspace_overlap": -0.003228006884455681,
          "right_subspace_overlap": 0.011431070044636726,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.010472480207681656,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0028725024312734604,
          "encoder_gradient_cosine_similarity": 0.002216352615505457,
          "encoder_gradient_l2_distance": -0.020108316093683243,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": -0.0019841715693473816,
          "input_gradient_l2_distance": -0.0046949852257966995,
          "input_gradient_dot_product": -0.001459138235077262
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7359434448055462,
        "val_r": 0.7137428510828359,
        "n_iterations": 409,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.013682922348380089,
          "right_subspace_overlap_bottom_k": -0.03012780286371708,
          "interaction_matrix_overlap_top_k": 0.0018480441067367792,
          "interaction_matrix_overlap_bottom_k": -0.006973499432206154,
          "effective_rank": 0.0016161950770765543,
          "effective_rank_mergeability_score": -0.001972475554794073,
          "stable_rank": 0.001250073197297752,
          "spectral_gap": -0.0015385511796921492,
          "singular_value_ratio": 0.0019444352947175503,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.00871219765394926,
          "task_vector_l2_distance": -0.001186045934446156,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.016496190801262856,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.010623179376125336,
          "activation_l2_distance": -0.0027231902349740267,
          "activation_cosine_similarity": 0.016176259145140648,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.022464606910943985,
          "encoder_gradient_cosine_similarity": 0.0024915789254009724,
          "encoder_gradient_l2_distance": -0.04979262873530388,
          "encoder_gradient_dot_product": -0.0010443704668432474,
          "input_gradient_cosine_similarity": 0.004663615021854639,
          "input_gradient_l2_distance": -0.03470746427774429,
          "input_gradient_dot_product": -0.0032492876052856445
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7728701274275775,
        "val_r": 0.7454163692123964,
        "n_iterations": 259,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005594575311988592,
          "right_subspace_overlap_bottom_k": -0.01489097997546196,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.001642466988414526,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0013653134228661656,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0050249407067894936,
          "task_vector_l2_distance": 0.003217422403395176,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.004388502333313227,
          "subspace_overlap": -0.0017839110223576427,
          "right_subspace_overlap": 0.013215694576501846,
          "activation_l2_distance": 0.003046841360628605,
          "activation_cosine_similarity": 0.013804864138364792,
          "activation_magnitude_ratio": -0.0010642834240570664,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0015434627421200275,
          "encoder_gradient_l2_distance": -0.01740739867091179,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.006026380229741335,
          "input_gradient_dot_product": -0.003746457863599062
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7427707954175713,
        "val_r": 0.7519253866781546,
        "n_iterations": 241,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010393500328063965,
          "right_subspace_overlap_bottom_k": -0.02685997448861599,
          "interaction_matrix_overlap_top_k": 0.006351139862090349,
          "interaction_matrix_overlap_bottom_k": -0.002924423897638917,
          "effective_rank": 0.0018411200726404786,
          "effective_rank_mergeability_score": -0.0012519990559667349,
          "stable_rank": 0.0,
          "spectral_gap": -0.0013890379341319203,
          "singular_value_ratio": 0.0010564371477812529,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0022435064893215895,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010026635136455297,
          "task_vector_magnitude_ratio": 0.001395947067067027,
          "singular_value_overlap": 0.010595962405204773,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.018772851675748825,
          "activation_l2_distance": -0.0059678805992007256,
          "activation_cosine_similarity": 0.017151013016700745,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.005371175706386566,
          "encoder_gradient_cosine_similarity": 0.002383455168455839,
          "encoder_gradient_l2_distance": -0.03810879960656166,
          "encoder_gradient_dot_product": 0.001435756916180253,
          "input_gradient_cosine_similarity": 0.004854185972362757,
          "input_gradient_l2_distance": -0.026896633207798004,
          "input_gradient_dot_product": -0.003939148969948292
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7956247397726592,
        "val_r": 0.7446621147708151,
        "n_iterations": 227,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012487822212278843,
          "right_subspace_overlap_bottom_k": -0.027465885505080223,
          "interaction_matrix_overlap_top_k": 0.001480477163568139,
          "interaction_matrix_overlap_bottom_k": 0.001503401785157621,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0028159539215266705,
          "task_vector_l2_distance": -0.008648897521197796,
          "task_vector_dot_product": 0.0016758847050368786,
          "weight_space_angle": 0.0010538893984630704,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.012045689858496189,
          "subspace_overlap": -0.0048063769936561584,
          "right_subspace_overlap": 0.017619961872696877,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.02233990654349327,
          "activation_magnitude_ratio": -0.005951200611889362,
          "activation_dot_product": -0.001565081300213933,
          "encoder_gradient_cosine_similarity": 0.002529281424358487,
          "encoder_gradient_l2_distance": -0.05339976027607918,
          "encoder_gradient_dot_product": 0.0014937825035303831,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.016979947686195374,
          "input_gradient_dot_product": -0.009070808067917824
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7740638658055193,
        "val_r": 0.7857705247792569,
        "n_iterations": 316,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002798784291371703,
          "right_subspace_overlap_bottom_k": -0.01705768331885338,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.003015739843249321,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0013786975760012865,
          "layerwise_effective_rank_mergeability_score": 0.001139903673902154,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0018089249497279525,
          "weight_space_angle": 0.0016415781574323773,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.004015233367681503,
          "subspace_overlap": -0.0033668610267341137,
          "right_subspace_overlap": 0.014815614558756351,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.01149412989616394,
          "activation_magnitude_ratio": -0.0021870480850338936,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.003474715631455183,
          "encoder_gradient_l2_distance": -0.013635251671075821,
          "encoder_gradient_dot_product": -0.0017685218481346965,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.008968002162873745,
          "input_gradient_dot_product": -0.002765445038676262
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7457279379953815,
        "val_r": 0.6523384392021477,
        "n_iterations": 271,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.015205107629299164,
          "right_subspace_overlap_bottom_k": -0.02714559994637966,
          "interaction_matrix_overlap_top_k": 0.005057595204561949,
          "interaction_matrix_overlap_bottom_k": -0.001162748783826828,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012813315261155367,
          "spectral_gap": -0.0011747176758944988,
          "singular_value_ratio": 0.0010865326039493084,
          "layerwise_effective_rank": -0.0019385417690500617,
          "layerwise_effective_rank_mergeability_score": 0.0013222681591287255,
          "task_vector_cosine_similarity": 0.0026931308675557375,
          "task_vector_l2_distance": -0.006867572665214539,
          "task_vector_dot_product": 0.0030305555555969477,
          "weight_space_angle": -0.001204392989166081,
          "task_vector_magnitude_ratio": 0.0016970597207546234,
          "singular_value_overlap": 0.018111400306224823,
          "subspace_overlap": 0.0013067257823422551,
          "right_subspace_overlap": 0.009014850482344627,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0157439224421978,
          "activation_magnitude_ratio": -0.005899697542190552,
          "activation_dot_product": 0.02050957828760147,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.03963863477110863,
          "encoder_gradient_dot_product": 0.0024527637287974358,
          "input_gradient_cosine_similarity": 0.0022864225320518017,
          "input_gradient_l2_distance": -0.045430682599544525,
          "input_gradient_dot_product": -0.0041196937672793865
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7339981743717914,
        "val_r": 0.6518770823840464,
        "n_iterations": 343,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.013206004165112972,
          "right_subspace_overlap_bottom_k": -0.030229942873120308,
          "interaction_matrix_overlap_top_k": 0.004116016905754805,
          "interaction_matrix_overlap_bottom_k": -0.0011576219694688916,
          "effective_rank": -0.0016451459378004074,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.003019864670932293,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0015532312681898475,
          "layerwise_effective_rank": -0.003988835960626602,
          "layerwise_effective_rank_mergeability_score": 0.004237051587551832,
          "task_vector_cosine_similarity": -0.002323820721358061,
          "task_vector_l2_distance": -0.009179670363664627,
          "task_vector_dot_product": -0.0021503600291907787,
          "weight_space_angle": 0.00571716483682394,
          "task_vector_magnitude_ratio": -0.0015450587961822748,
          "singular_value_overlap": 0.011472200974822044,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.012726440094411373,
          "activation_l2_distance": -0.004513949155807495,
          "activation_cosine_similarity": 0.016688821837306023,
          "activation_magnitude_ratio": -0.0021213688887655735,
          "activation_dot_product": 0.01669168472290039,
          "encoder_gradient_cosine_similarity": 0.001469018287025392,
          "encoder_gradient_l2_distance": -0.045609042048454285,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003384430892765522,
          "input_gradient_l2_distance": -0.03516083583235741,
          "input_gradient_dot_product": -0.0061300466768443584
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.837298241735103,
        "val_r": 0.6872361169150321,
        "n_iterations": 235,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.002751868451014161,
          "right_subspace_overlap_bottom_k": -0.01250816322863102,
          "interaction_matrix_overlap_top_k": -0.0063217333517968655,
          "interaction_matrix_overlap_bottom_k": -0.008059263229370117,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.001245375256985426,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0016800565645098686,
          "layerwise_effective_rank_mergeability_score": 0.0024388178717345,
          "task_vector_cosine_similarity": 0.0019877683371305466,
          "task_vector_l2_distance": -0.01633143611252308,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0019443046767264605,
          "task_vector_magnitude_ratio": -0.0012348252348601818,
          "singular_value_overlap": 0.007507462054491043,
          "subspace_overlap": -0.0032123855780810118,
          "right_subspace_overlap": -0.002982762409374118,
          "activation_l2_distance": -0.006159732583910227,
          "activation_cosine_similarity": 0.010008213110268116,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.02605723962187767,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0475691594183445,
          "encoder_gradient_dot_product": 0.0032996786758303642,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0504579022526741,
          "input_gradient_dot_product": 0.0028710952028632164
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_r": 0.45407499129750556,
      "train_p": 1.0944677397522091e-163,
      "val_r": 0.044611329527150745,
      "val_p": 0.40003818347787967
    },
    "per_fold_stats": {
      "train_r_mean": 0.5545384121093118,
      "train_r_std": 0.04099603834025219,
      "val_r_mean": 0.4431387291223253,
      "val_r_std": 0.1459124731344027,
      "n_nonzero_mean": 18.7,
      "n_nonzero_std": 3.479942528261063
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.0009750762837938964,
      "right_subspace_overlap_bottom_k": 0.004742247052490711,
      "interaction_matrix_overlap_top_k": -0.000578699167817831,
      "interaction_matrix_overlap_bottom_k": 0.02730504237115383,
      "effective_rank": -0.0003203979867976159,
      "effective_rank_mergeability_score": 0.0003351555787958205,
      "stable_rank": -0.0005377558409236372,
      "spectral_gap": 0.0005061282427050173,
      "singular_value_ratio": -0.00046937866136431694,
      "layerwise_effective_rank": -0.0005517587414942682,
      "layerwise_effective_rank_mergeability_score": 0.00043108206591568887,
      "task_vector_cosine_similarity": -0.0002924669242929667,
      "task_vector_l2_distance": -0.01851021498441696,
      "task_vector_dot_product": -0.000510625948663801,
      "weight_space_angle": 0.0011753311846405268,
      "task_vector_magnitude_ratio": -0.004185675643384457,
      "singular_value_overlap": -0.018195267766714096,
      "subspace_overlap": 0.0027204789221286774,
      "right_subspace_overlap": 0.0009801069973036647,
      "activation_l2_distance": -0.00044936599442735314,
      "activation_cosine_similarity": 0.0001255279639735818,
      "activation_magnitude_ratio": -0.0049768188036978245,
      "activation_dot_product": -0.002195653971284628,
      "encoder_gradient_cosine_similarity": 0.00015232068835757673,
      "encoder_gradient_l2_distance": -0.011668307706713676,
      "encoder_gradient_dot_product": 0.0005043993587605655,
      "input_gradient_cosine_similarity": 0.0011440727394074202,
      "input_gradient_l2_distance": -0.02112356200814247,
      "input_gradient_dot_product": -0.004989933222532272
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.0026086147408932447,
      "right_subspace_overlap_bottom_k": 0.004568357020616531,
      "interaction_matrix_overlap_top_k": 0.001916107488796115,
      "interaction_matrix_overlap_bottom_k": 0.007318887393921614,
      "effective_rank": 0.0005613246466964483,
      "effective_rank_mergeability_score": 0.0006856020190753043,
      "stable_rank": 0.0006818942492827773,
      "spectral_gap": 0.0008963276050053537,
      "singular_value_ratio": 0.0009193715522997081,
      "layerwise_effective_rank": 0.0013081200886517763,
      "layerwise_effective_rank_mergeability_score": 0.0009728326695039868,
      "task_vector_cosine_similarity": 0.0011729317484423518,
      "task_vector_l2_distance": 0.007536298595368862,
      "task_vector_dot_product": 0.00265966122969985,
      "weight_space_angle": 0.0019250301411375403,
      "task_vector_magnitude_ratio": 0.001963724149391055,
      "singular_value_overlap": 0.006089130416512489,
      "subspace_overlap": 0.0026353122666478157,
      "right_subspace_overlap": 0.0030862672720104456,
      "activation_l2_distance": 0.0031041877809911966,
      "activation_cosine_similarity": 0.002082545543089509,
      "activation_magnitude_ratio": 0.0020626522600650787,
      "activation_dot_product": 0.004247982520610094,
      "encoder_gradient_cosine_similarity": 0.0017669587396085262,
      "encoder_gradient_l2_distance": 0.004704682622104883,
      "encoder_gradient_dot_product": 0.0014577734982594848,
      "input_gradient_cosine_similarity": 0.0012497496791183949,
      "input_gradient_l2_distance": 0.006714371498674154,
      "input_gradient_dot_product": 0.0032374041620641947
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.45,
      "right_subspace_overlap_bottom_k": 0.8,
      "interaction_matrix_overlap_top_k": 0.4,
      "interaction_matrix_overlap_bottom_k": 1.0,
      "effective_rank": 0.25,
      "effective_rank_mergeability_score": 0.35,
      "stable_rank": 0.4,
      "spectral_gap": 0.45,
      "singular_value_ratio": 0.4,
      "layerwise_effective_rank": 0.2,
      "layerwise_effective_rank_mergeability_score": 0.2,
      "task_vector_cosine_similarity": 0.3,
      "task_vector_l2_distance": 1.0,
      "task_vector_dot_product": 0.6,
      "weight_space_angle": 0.75,
      "task_vector_magnitude_ratio": 1.0,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.8,
      "right_subspace_overlap": 0.55,
      "activation_l2_distance": 0.9,
      "activation_cosine_similarity": 0.6,
      "activation_magnitude_ratio": 0.95,
      "activation_dot_product": 0.8,
      "encoder_gradient_cosine_similarity": 0.5,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.55,
      "input_gradient_cosine_similarity": 0.5,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 1.0
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6069669389747144,
        "val_r": 0.6216906850658248,
        "n_iterations": 209,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.001524151535704732,
          "right_subspace_overlap_bottom_k": 0.005971998907625675,
          "interaction_matrix_overlap_top_k": -0.0024150696117430925,
          "interaction_matrix_overlap_bottom_k": 0.03424370288848877,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0014240657910704613,
          "task_vector_l2_distance": -0.024421220645308495,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.004702414385974407,
          "task_vector_magnitude_ratio": -0.005878467112779617,
          "singular_value_overlap": -0.025676751509308815,
          "subspace_overlap": 0.0069850729778409,
          "right_subspace_overlap": -0.0020423561800271273,
          "activation_l2_distance": 0.001793664414435625,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.007859897799789906,
          "activation_dot_product": -0.005102195776998997,
          "encoder_gradient_cosine_similarity": -0.0020026019774377346,
          "encoder_gradient_l2_distance": -0.012159079313278198,
          "encoder_gradient_dot_product": 0.0012017423287034035,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.019374113529920578,
          "input_gradient_dot_product": -0.005960147362202406
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5427429750133878,
        "val_r": 0.5722878283435049,
        "n_iterations": 285,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004076370969414711,
          "right_subspace_overlap_bottom_k": 0.009004411287605762,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0332949161529541,
          "effective_rank": -0.001061383867636323,
          "effective_rank_mergeability_score": 0.0011477397056296468,
          "stable_rank": 0.0,
          "spectral_gap": 0.0016484237276017666,
          "singular_value_ratio": -0.001763252541422844,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.003885365556925535,
          "task_vector_l2_distance": -0.019061792641878128,
          "task_vector_dot_product": -0.005565094295889139,
          "weight_space_angle": 0.004030839540064335,
          "task_vector_magnitude_ratio": -0.006631467957049608,
          "singular_value_overlap": -0.027768077328801155,
          "subspace_overlap": 0.002981973346322775,
          "right_subspace_overlap": 0.0042241839691996574,
          "activation_l2_distance": -0.003849123604595661,
          "activation_cosine_similarity": 0.004013813566416502,
          "activation_magnitude_ratio": -0.00516230333596468,
          "activation_dot_product": -0.006769961677491665,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.02189590036869049,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03315090760588646,
          "input_gradient_dot_product": -0.009675076231360435
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5436327474745457,
        "val_r": 0.4944656114086446,
        "n_iterations": 360,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.01131760235875845,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.03337346762418747,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0011112620122730732,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02523939125239849,
          "task_vector_dot_product": 0.0019361465238034725,
          "weight_space_angle": 0.0010576883796602488,
          "task_vector_magnitude_ratio": -0.004404345527291298,
          "singular_value_overlap": -0.023091088980436325,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.003449718002229929,
          "activation_cosine_similarity": -0.0011386937694624066,
          "activation_magnitude_ratio": -0.005633268505334854,
          "activation_dot_product": 0.0010728633496910334,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.010564908385276794,
          "encoder_gradient_dot_product": -0.0017121769487857819,
          "input_gradient_cosine_similarity": 0.0020911889150738716,
          "input_gradient_l2_distance": -0.025726240128278732,
          "input_gradient_dot_product": -0.0077710445038974285
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5523244641491509,
        "val_r": 0.4961566155415025,
        "n_iterations": 312,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.003222195664420724,
          "interaction_matrix_overlap_top_k": -0.0011159993009641767,
          "interaction_matrix_overlap_bottom_k": 0.026475343853235245,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0013092323206365108,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010392768308520317,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.017166607081890106,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004562309477478266,
          "singular_value_overlap": -0.018783332780003548,
          "subspace_overlap": 0.005598260089755058,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.0025193211622536182,
          "activation_magnitude_ratio": -0.007717553526163101,
          "activation_dot_product": -0.0029515058267861605,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008273190818727016,
          "encoder_gradient_dot_product": 0.0011292226845398545,
          "input_gradient_cosine_similarity": 0.0027370338793843985,
          "input_gradient_l2_distance": -0.018112044781446457,
          "input_gradient_dot_product": -0.004235783126205206
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5714641337863879,
        "val_r": 0.5433104574757851,
        "n_iterations": 285,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.027806423604488373,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01366439275443554,
          "task_vector_dot_product": -0.005453597754240036,
          "weight_space_angle": 0.0019243372371420264,
          "task_vector_magnitude_ratio": -0.0023501699324697256,
          "singular_value_overlap": -0.01663006842136383,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.003317030146718025,
          "activation_l2_distance": -0.0015805643051862717,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.003356881905347109,
          "activation_dot_product": -0.0034704525023698807,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008563730865716934,
          "encoder_gradient_dot_product": 0.0012573954882100224,
          "input_gradient_cosine_similarity": 0.002073411364108324,
          "input_gradient_l2_distance": -0.01798323169350624,
          "input_gradient_dot_product": -0.005510477814823389
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5564378383511293,
        "val_r": 0.6466885078100408,
        "n_iterations": 765,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0114522660151124,
          "interaction_matrix_overlap_top_k": -0.001710810698568821,
          "interaction_matrix_overlap_bottom_k": 0.033472802489995956,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0011312816059216857,
          "singular_value_ratio": -0.0018455003155395389,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.027337050065398216,
          "task_vector_dot_product": 0.004322591703385115,
          "weight_space_angle": 0.0038204360753297806,
          "task_vector_magnitude_ratio": -0.00638490729033947,
          "singular_value_overlap": -0.021145012229681015,
          "subspace_overlap": -0.0019058939069509506,
          "right_subspace_overlap": -0.003010713029652834,
          "activation_l2_distance": 0.004081739578396082,
          "activation_cosine_similarity": -0.001595612266100943,
          "activation_magnitude_ratio": -0.006089236121624708,
          "activation_dot_product": 0.0013372208923101425,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.012300750240683556,
          "encoder_gradient_dot_product": 0.0022348302882164717,
          "input_gradient_cosine_similarity": 0.0037616384215652943,
          "input_gradient_l2_distance": -0.017388854175806046,
          "input_gradient_dot_product": -0.005182607099413872
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5902396783824847,
        "val_r": 0.29220096697621006,
        "n_iterations": 395,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.00239451602101326,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.024971920996904373,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01178243663161993,
          "task_vector_dot_product": -0.003880639560520649,
          "weight_space_angle": 0.0011536937672644854,
          "task_vector_magnitude_ratio": -0.004681247286498547,
          "singular_value_overlap": -0.012164960615336895,
          "subspace_overlap": 0.0012366395676508546,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.007749900687485933,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.007878783158957958,
          "encoder_gradient_cosine_similarity": 0.0017331610433757305,
          "encoder_gradient_l2_distance": -0.013126324862241745,
          "encoder_gradient_dot_product": 0.0017383486265316606,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.014035208150744438,
          "input_gradient_dot_product": -0.004471853841096163
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5122449608095287,
        "val_r": 0.3374151268819038,
        "n_iterations": 243,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0021791732870042324,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.0011922621633857489,
          "interaction_matrix_overlap_bottom_k": 0.025361433625221252,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": -0.0010983586544170976,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.015579388476908207,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004077722318470478,
          "singular_value_overlap": -0.016301028430461884,
          "subspace_overlap": 0.004408565815538168,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0014040053356438875,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0050685470923781395,
          "activation_dot_product": -0.004974489565938711,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.009209288284182549,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.00830375961959362,
          "input_gradient_dot_product": -0.0015971586108207703
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5493423879828563,
        "val_r": 0.45109733930877816,
        "n_iterations": 232,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.011151542887091637,
          "interaction_matrix_overlap_top_k": -0.0026049152947962284,
          "interaction_matrix_overlap_bottom_k": 0.03412509337067604,
          "effective_rank": -0.001292076543904841,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0011578128905966878,
          "spectral_gap": 0.0013079139171168208,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0015961683820933104,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.028163794428110123,
          "task_vector_dot_product": 0.0010001088958233595,
          "weight_space_angle": 0.002746023004874587,
          "task_vector_magnitude_ratio": -0.003284938633441925,
          "singular_value_overlap": -0.02574317529797554,
          "subspace_overlap": 0.002121339552104473,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0011354736052453518,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.008996433578431606,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0017176879337057471,
          "encoder_gradient_l2_distance": -0.010216271504759789,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0325823538005352,
          "input_gradient_dot_product": -0.001331257983110845
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5508031848690376,
        "val_r": 0.06715384739538477,
        "n_iterations": 313,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0015862876316532493,
          "right_subspace_overlap_bottom_k": 0.0075697097927331924,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.031408343464136124,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.022758115082979202,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.002797291148453951,
          "singular_value_overlap": -0.024546215310692787,
          "subspace_overlap": 0.0039932141080498695,
          "right_subspace_overlap": -0.001178162288852036,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.0037631168961524963,
          "activation_magnitude_ratio": -0.00643800338730216,
          "activation_dot_product": -0.005684833973646164,
          "encoder_gradient_cosine_similarity": -0.0012444216990843415,
          "encoder_gradient_l2_distance": -0.011957656592130661,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.024428268894553185,
          "input_gradient_dot_product": -0.001133285346440971
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5207867116157635,
        "val_r": 0.38158294441729423,
        "n_iterations": 250,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004498228896409273,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.02378096804022789,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0011707751546055079,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.014857947826385498,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0013641791883856058,
          "task_vector_magnitude_ratio": -0.0030622310005128384,
          "singular_value_overlap": -0.014363059774041176,
          "subspace_overlap": 0.0013521979562938213,
          "right_subspace_overlap": 0.0016890456900000572,
          "activation_l2_distance": -0.0018602557247504592,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.005566183477640152,
          "activation_dot_product": -0.0033922994043678045,
          "encoder_gradient_cosine_similarity": -0.002531364792957902,
          "encoder_gradient_l2_distance": -0.00836719386279583,
          "encoder_gradient_dot_product": -0.002757422160357237,
          "input_gradient_cosine_similarity": 0.00286948517896235,
          "input_gradient_l2_distance": -0.014766799286007881,
          "input_gradient_dot_product": -0.0025439895689487457
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.4989191103229239,
        "val_r": 0.4109307517590827,
        "n_iterations": 434,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.002873252145946026,
          "right_subspace_overlap_bottom_k": 0.004442664794623852,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.025784851983189583,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0010592297185212374,
          "singular_value_ratio": -0.0010790824890136719,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.015519039705395699,
          "task_vector_dot_product": -0.0011730091646313667,
          "weight_space_angle": 0.001927834004163742,
          "task_vector_magnitude_ratio": -0.004846005234867334,
          "singular_value_overlap": -0.015634071081876755,
          "subspace_overlap": 0.006941605359315872,
          "right_subspace_overlap": 0.0020716465078294277,
          "activation_l2_distance": -0.004540099762380123,
          "activation_cosine_similarity": 0.004206611774861813,
          "activation_magnitude_ratio": -0.0023550947662442923,
          "activation_dot_product": -0.004065544810146093,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.01053873635828495,
          "encoder_gradient_dot_product": -0.0011821193620562553,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.017835164442658424,
          "input_gradient_dot_product": -0.0048109968192875385
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5233722699895743,
        "val_r": 0.5498429125769141,
        "n_iterations": 290,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0107567785307765,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.03383341059088707,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0012821524869650602,
          "stable_rank": -0.0011420247610658407,
          "spectral_gap": 0.001424700254574418,
          "singular_value_ratio": -0.0014580392744392157,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0017128832405433059,
          "task_vector_l2_distance": -0.028372550383210182,
          "task_vector_dot_product": 0.001766058849170804,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0059733763337135315,
          "singular_value_overlap": -0.024399764835834503,
          "subspace_overlap": 0.0013220380060374737,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0018565452191978693,
          "activation_cosine_similarity": -0.0012813906650990248,
          "activation_magnitude_ratio": -0.006371192168444395,
          "activation_dot_product": -0.0033955180551856756,
          "encoder_gradient_cosine_similarity": 0.0012701674131676555,
          "encoder_gradient_l2_distance": -0.012103792279958725,
          "encoder_gradient_dot_product": 0.0035612762439996004,
          "input_gradient_cosine_similarity": 0.0011294233845546842,
          "input_gradient_l2_distance": -0.027677413076162338,
          "input_gradient_dot_product": -0.005082476418465376
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5041144651738104,
        "val_r": 0.646321400391478,
        "n_iterations": 429,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003290496300905943,
          "right_subspace_overlap_bottom_k": -0.002646005479618907,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.027032697573304176,
          "effective_rank": -0.0011400794610381126,
          "effective_rank_mergeability_score": 0.0011529546463862062,
          "stable_rank": -0.0011741681955754757,
          "spectral_gap": 0.0017073079943656921,
          "singular_value_ratio": -0.0014137664111331105,
          "layerwise_effective_rank": -0.0011874032206833363,
          "layerwise_effective_rank_mergeability_score": 0.0013008976820856333,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.009128854610025883,
          "task_vector_dot_product": -0.0023865802213549614,
          "weight_space_angle": 0.0012414141092449427,
          "task_vector_magnitude_ratio": -0.00372564559802413,
          "singular_value_overlap": -0.01447802409529686,
          "subspace_overlap": 0.006005384027957916,
          "right_subspace_overlap": 0.0018590305699035525,
          "activation_l2_distance": -0.00407383730635047,
          "activation_cosine_similarity": 0.0017713172128424048,
          "activation_magnitude_ratio": -0.002142716431990266,
          "activation_dot_product": -0.0036503244191408157,
          "encoder_gradient_cosine_similarity": 0.002177273156121373,
          "encoder_gradient_l2_distance": -0.013312062248587608,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.019395483657717705,
          "input_gradient_dot_product": -0.010785548016428947
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5242619987231514,
        "val_r": 0.5649183417729386,
        "n_iterations": 225,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.02186451479792595,
          "effective_rank": -0.0015350099420174956,
          "effective_rank_mergeability_score": 0.0016513252630829811,
          "stable_rank": -0.0018564281053841114,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01716323010623455,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.002855539321899414,
          "task_vector_magnitude_ratio": -0.004322884138673544,
          "singular_value_overlap": -0.015294932760298252,
          "subspace_overlap": 0.0070470054633915424,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.002003840869292617,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.004908533301204443,
          "activation_dot_product": -0.004647768102586269,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008104262873530388,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01780577003955841,
          "input_gradient_dot_product": -0.0039016446098685265
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5667117284122014,
        "val_r": 0.35328108368180833,
        "n_iterations": 183,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004551155027002096,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.017724795266985893,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.001761134946718812,
          "task_vector_l2_distance": -0.015276627615094185,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0015753747429698706,
          "task_vector_magnitude_ratio": -0.0047744521871209145,
          "singular_value_overlap": -0.00700373575091362,
          "subspace_overlap": 0.0018156659789383411,
          "right_subspace_overlap": 0.002126511186361313,
          "activation_l2_distance": 0.004210122395306826,
          "activation_cosine_similarity": 0.002321334322914481,
          "activation_magnitude_ratio": -0.00409039156511426,
          "activation_dot_product": -0.0029630884528160095,
          "encoder_gradient_cosine_similarity": -0.0013543220702558756,
          "encoder_gradient_l2_distance": -0.009860232472419739,
          "encoder_gradient_dot_product": 0.0022873710840940475,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01297613326460123,
          "input_gradient_dot_product": -0.004677534569054842
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.537329918510123,
        "val_r": 0.351163707356006,
        "n_iterations": 269,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0021509374491870403,
          "right_subspace_overlap_bottom_k": 0.0018643452785909176,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.024103112518787384,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.017252828925848007,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.00219882489182055,
          "singular_value_overlap": -0.016546916216611862,
          "subspace_overlap": 0.00323116360232234,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0020421750377863646,
          "activation_cosine_similarity": -0.0010964109096676111,
          "activation_magnitude_ratio": -0.005013597197830677,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.008674830198287964,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0014979124534875154,
          "input_gradient_l2_distance": -0.01757928915321827,
          "input_gradient_dot_product": -0.005983153358101845
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5899216415369546,
        "val_r": 0.25577508889577494,
        "n_iterations": 279,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.005119509529322386,
          "interaction_matrix_overlap_top_k": -0.003921323921531439,
          "interaction_matrix_overlap_bottom_k": 0.033923979848623276,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.001030385261401534,
          "stable_rank": -0.0017580670537427068,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.001090093282982707,
          "layerwise_effective_rank": -0.003051054896786809,
          "layerwise_effective_rank_mergeability_score": 0.0034089256078004837,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02207309380173683,
          "task_vector_dot_product": 0.0015252488665282726,
          "weight_space_angle": -0.0010877965250983834,
          "task_vector_magnitude_ratio": -0.0025957778561860323,
          "singular_value_overlap": -0.012887339107692242,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0028888797387480736,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0032698067370802164,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0033198785968124866,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002239546738564968,
          "input_gradient_l2_distance": -0.025030171498656273,
          "input_gradient_dot_product": -0.0037472674157470465
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6838945455079937,
        "val_r": 0.5112175347497101,
        "n_iterations": 203,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010056748986244202,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.00546695152297616,
          "interaction_matrix_overlap_bottom_k": 0.00290966616012156,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0016769955400377512,
          "singular_value_ratio": 0.0016369145596399903,
          "layerwise_effective_rank": -0.005200548563152552,
          "layerwise_effective_rank_mergeability_score": 0.002872541779652238,
          "task_vector_cosine_similarity": -0.0019700180273503065,
          "task_vector_l2_distance": 0.0028844575863331556,
          "task_vector_dot_product": 0.002867761068046093,
          "weight_space_angle": 0.003683126997202635,
          "task_vector_magnitude_ratio": 0.0011206995695829391,
          "singular_value_overlap": -0.0064803361892700195,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01218353770673275,
          "activation_l2_distance": -0.001341237802989781,
          "activation_cosine_similarity": 0.003647384699434042,
          "activation_magnitude_ratio": -0.004091414622962475,
          "activation_dot_product": 0.01262359507381916,
          "encoder_gradient_cosine_similarity": 0.005603737663477659,
          "encoder_gradient_l2_distance": -0.02500222809612751,
          "encoder_gradient_dot_product": 0.002329519484192133,
          "input_gradient_cosine_similarity": 0.0018601412884891033,
          "input_gradient_l2_distance": -0.026760468259453773,
          "input_gradient_dot_product": -0.012541331350803375
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5652565426005156,
        "val_r": 0.31527383063792014,
        "n_iterations": 403,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0020150139462202787,
          "right_subspace_overlap_bottom_k": 0.008963054046034813,
          "interaction_matrix_overlap_top_k": -0.0040805526077747345,
          "interaction_matrix_overlap_bottom_k": 0.030609438195824623,
          "effective_rank": -0.0013794098049402237,
          "effective_rank_mergeability_score": 0.0015369127504527569,
          "stable_rank": -0.001384578994475305,
          "spectral_gap": 0.002211470389738679,
          "singular_value_ratio": -0.002374752424657345,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.001478362362831831,
          "task_vector_l2_distance": -0.02827039733529091,
          "task_vector_dot_product": -0.005171515047550201,
          "weight_space_angle": -0.0016093741869553924,
          "task_vector_magnitude_ratio": -0.00828215479850769,
          "singular_value_overlap": -0.024967461824417114,
          "subspace_overlap": 0.0012753440532833338,
          "right_subspace_overlap": -0.0016376128187403083,
          "activation_l2_distance": -0.0020427724812179804,
          "activation_cosine_similarity": -0.0020553567446768284,
          "activation_magnitude_ratio": -0.00540532311424613,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.0023229029029607773,
          "encoder_gradient_l2_distance": -0.015815820544958115,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0026216718833893538,
          "input_gradient_l2_distance": -0.031559545546770096,
          "input_gradient_dot_product": 0.001143971923738718
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.5,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  }
}