{
  "aggregate_metrics": {
    "train_r": 0.438980796821664,
    "train_p": 6.724466343789123e-152,
    "val_r": 0.4159104598373235,
    "val_p": 2.0844921215022924e-16
  },
  "per_fold_stats": {
    "train_r_mean": 0.7968741573787207,
    "train_r_std": 0.036367077032669594,
    "val_r_mean": 0.6629868873977324,
    "val_r_std": 0.16993783895203574,
    "n_nonzero_mean": 22.8,
    "n_nonzero_std": 3.2341923257592455
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.030056670308113098,
    "right_subspace_overlap_bottom_k": -0.1013614758849144,
    "interaction_matrix_overlap_top_k": -0.005001015029847622,
    "interaction_matrix_overlap_bottom_k": 0.050837256014347076,
    "effective_rank": 0.003884870558977127,
    "effective_rank_mergeability_score": -0.0034219257067888975,
    "stable_rank": -0.0016614932101219893,
    "spectral_gap": -0.0003077681176364422,
    "singular_value_ratio": 0.00042055780068039894,
    "layerwise_effective_rank": -0.006883519701659679,
    "layerwise_effective_rank_mergeability_score": 0.007575678173452616,
    "task_vector_cosine_similarity": -0.0015233650337904692,
    "task_vector_l2_distance": -0.0013908336404711008,
    "task_vector_dot_product": -0.0013836368452757597,
    "weight_space_angle": 0.0007174712372943759,
    "task_vector_magnitude_ratio": -9.522870823275298e-05,
    "singular_value_overlap": 0.014255454763770103,
    "subspace_overlap": -0.005170200485736132,
    "right_subspace_overlap": 0.028200801461935043,
    "activation_l2_distance": -0.003984223119914532,
    "activation_cosine_similarity": 0.036967821419239044,
    "activation_magnitude_ratio": -0.0069925785064697266,
    "activation_dot_product": 0.009557710029184818,
    "encoder_gradient_cosine_similarity": 0.008791299536824226,
    "encoder_gradient_l2_distance": -0.06361252814531326,
    "encoder_gradient_dot_product": 0.0014922574628144503,
    "input_gradient_cosine_similarity": 0.0027093091048300266,
    "input_gradient_l2_distance": -0.041553299874067307,
    "input_gradient_dot_product": -0.009057190269231796
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.01743181422352791,
    "right_subspace_overlap_bottom_k": 0.02706310711801052,
    "interaction_matrix_overlap_top_k": 0.01399348396807909,
    "interaction_matrix_overlap_bottom_k": 0.036805566400289536,
    "effective_rank": 0.004970437381416559,
    "effective_rank_mergeability_score": 0.0046432469971477985,
    "stable_rank": 0.0033464787993580103,
    "spectral_gap": 0.002550069708377123,
    "singular_value_ratio": 0.0025158466305583715,
    "layerwise_effective_rank": 0.005976445507258177,
    "layerwise_effective_rank_mergeability_score": 0.0059612467885017395,
    "task_vector_cosine_similarity": 0.011031746864318848,
    "task_vector_l2_distance": 0.01269769947975874,
    "task_vector_dot_product": 0.006659740582108498,
    "weight_space_angle": 0.011874698102474213,
    "task_vector_magnitude_ratio": 0.0024170682299882174,
    "singular_value_overlap": 0.01306287944316864,
    "subspace_overlap": 0.01193271391093731,
    "right_subspace_overlap": 0.01852329634130001,
    "activation_l2_distance": 0.011264074593782425,
    "activation_cosine_similarity": 0.020354721695184708,
    "activation_magnitude_ratio": 0.012040982022881508,
    "activation_dot_product": 0.03572951257228851,
    "encoder_gradient_cosine_similarity": 0.013342869468033314,
    "encoder_gradient_l2_distance": 0.0410960391163826,
    "encoder_gradient_dot_product": 0.0029736030846834183,
    "input_gradient_cosine_similarity": 0.002769788494333625,
    "input_gradient_l2_distance": 0.03963271155953407,
    "input_gradient_dot_product": 0.013722820207476616
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 1.0,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.8,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 0.7,
    "effective_rank_mergeability_score": 0.7,
    "stable_rank": 0.6,
    "spectral_gap": 0.35,
    "singular_value_ratio": 0.4,
    "layerwise_effective_rank": 0.8,
    "layerwise_effective_rank_mergeability_score": 0.75,
    "task_vector_cosine_similarity": 0.75,
    "task_vector_l2_distance": 0.95,
    "task_vector_dot_product": 0.7,
    "weight_space_angle": 0.8,
    "task_vector_magnitude_ratio": 0.55,
    "singular_value_overlap": 0.85,
    "subspace_overlap": 0.8,
    "right_subspace_overlap": 1.0,
    "activation_l2_distance": 0.75,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.65,
    "activation_dot_product": 0.95,
    "encoder_gradient_cosine_similarity": 0.85,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.55,
    "input_gradient_cosine_similarity": 0.7,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.9
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7674318569194027,
      "val_r": 0.4484381159593573,
      "n_iterations": 322,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01963035576045513,
        "right_subspace_overlap_bottom_k": -0.11471404880285263,
        "interaction_matrix_overlap_top_k": -0.031062589958310127,
        "interaction_matrix_overlap_bottom_k": 0.1044297143816948,
        "effective_rank": 0.0057217334397137165,
        "effective_rank_mergeability_score": -0.005751829594373703,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.00455058179795742,
        "task_vector_l2_distance": 0.003051408799365163,
        "task_vector_dot_product": -0.0014805591199547052,
        "weight_space_angle": -0.003721419954672456,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.005833246745169163,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.024433594197034836,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.02772456780076027,
        "activation_magnitude_ratio": -0.0027715791948139668,
        "activation_dot_product": -0.005095755215734243,
        "encoder_gradient_cosine_similarity": 0.003424876369535923,
        "encoder_gradient_l2_distance": -0.02468065731227398,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.006127507425844669,
        "input_gradient_l2_distance": -0.022938765585422516,
        "input_gradient_dot_product": -0.00618253368884325
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.771941273532615,
      "val_r": 0.8078412005939141,
      "n_iterations": 231,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009869561530649662,
        "right_subspace_overlap_bottom_k": -0.11643677204847336,
        "interaction_matrix_overlap_top_k": -0.01102204155176878,
        "interaction_matrix_overlap_bottom_k": 0.0793951228260994,
        "effective_rank": 0.006519319489598274,
        "effective_rank_mergeability_score": -0.001498304889537394,
        "stable_rank": -0.0029130750335752964,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.005274685565382242,
        "layerwise_effective_rank_mergeability_score": 0.0147336320951581,
        "task_vector_cosine_similarity": -0.01251072809100151,
        "task_vector_l2_distance": -0.005954214371740818,
        "task_vector_dot_product": -0.004023891407996416,
        "weight_space_angle": 0.010560942813754082,
        "task_vector_magnitude_ratio": -0.0011142862495034933,
        "singular_value_overlap": 0.01289702020585537,
        "subspace_overlap": 0.004557320848107338,
        "right_subspace_overlap": 0.03905551880598068,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.03533171862363815,
        "activation_magnitude_ratio": -0.0058800228871405125,
        "activation_dot_product": 0.006872063968330622,
        "encoder_gradient_cosine_similarity": 0.008403354324400425,
        "encoder_gradient_l2_distance": -0.06926456093788147,
        "encoder_gradient_dot_product": 0.007246136665344238,
        "input_gradient_cosine_similarity": 0.0016016119625419378,
        "input_gradient_l2_distance": -0.044693540781736374,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7713546895340353,
      "val_r": 0.781232332630473,
      "n_iterations": 298,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.03669136017560959,
        "right_subspace_overlap_bottom_k": -0.10945488512516022,
        "interaction_matrix_overlap_top_k": 0.018611561506986618,
        "interaction_matrix_overlap_bottom_k": 0.018971987068653107,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.004006428178399801,
        "spectral_gap": -0.0025916588492691517,
        "singular_value_ratio": 0.001997384475544095,
        "layerwise_effective_rank": -0.022436315193772316,
        "layerwise_effective_rank_mergeability_score": 0.011690162122249603,
        "task_vector_cosine_similarity": -0.013292193412780762,
        "task_vector_l2_distance": -0.021290719509124756,
        "task_vector_dot_product": -0.00883319042623043,
        "weight_space_angle": 0.012111136689782143,
        "task_vector_magnitude_ratio": 0.002418435411527753,
        "singular_value_overlap": 0.0340283066034317,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.06334427744150162,
        "activation_l2_distance": -0.015524733811616898,
        "activation_cosine_similarity": 0.05451330915093422,
        "activation_magnitude_ratio": -0.010952770709991455,
        "activation_dot_product": 0.0376710444688797,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.14645056426525116,
        "encoder_gradient_dot_product": 0.002583912806585431,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.11314693838357925,
        "input_gradient_dot_product": 0.0030524726025760174
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8197728350725311,
      "val_r": 0.8108741777717086,
      "n_iterations": 501,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005518726073205471,
        "right_subspace_overlap_bottom_k": -0.10027695447206497,
        "interaction_matrix_overlap_top_k": -0.016652105376124382,
        "interaction_matrix_overlap_bottom_k": 0.08631615340709686,
        "effective_rank": 0.010555700398981571,
        "effective_rank_mergeability_score": -0.011319081299006939,
        "stable_rank": -0.0014907543081790209,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.00817175954580307,
        "layerwise_effective_rank_mergeability_score": 0.013272492215037346,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.005722522735595703,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0019158257637172937,
        "subspace_overlap": -0.0011413625907152891,
        "right_subspace_overlap": 0.025112444534897804,
        "activation_l2_distance": 0.0014269538223743439,
        "activation_cosine_similarity": 0.01915149949491024,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.003730164375156164,
        "encoder_gradient_cosine_similarity": 0.0018215118907392025,
        "encoder_gradient_l2_distance": -0.017880184575915337,
        "encoder_gradient_dot_product": 0.002532169222831726,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.012151137925684452,
        "input_gradient_dot_product": -0.0023086632136255503
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7995133395557238,
      "val_r": 0.7650896527722779,
      "n_iterations": 308,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.03599615395069122,
        "right_subspace_overlap_bottom_k": -0.11231553554534912,
        "interaction_matrix_overlap_top_k": -0.015456902794539928,
        "interaction_matrix_overlap_bottom_k": 0.08413047343492508,
        "effective_rank": 0.01286693848669529,
        "effective_rank_mergeability_score": -0.010422374121844769,
        "stable_rank": -0.005663004238158464,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.001194292213767767,
        "layerwise_effective_rank": -0.010417742654681206,
        "layerwise_effective_rank_mergeability_score": 0.007032470311969519,
        "task_vector_cosine_similarity": -0.005699130240827799,
        "task_vector_l2_distance": 0.0018833719659596682,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.004686628933995962,
        "task_vector_magnitude_ratio": 0.0011619884753599763,
        "singular_value_overlap": 0.004894136916846037,
        "subspace_overlap": -0.0018163046333938837,
        "right_subspace_overlap": 0.018592096865177155,
        "activation_l2_distance": -0.0015923463506624103,
        "activation_cosine_similarity": 0.025467567145824432,
        "activation_magnitude_ratio": -0.003783827181905508,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0066008432768285275,
        "encoder_gradient_l2_distance": -0.04385312274098396,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0038647635374218225,
        "input_gradient_l2_distance": -0.023015355691313744,
        "input_gradient_dot_product": -0.004183616954833269
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7195312972699152,
      "val_r": 0.6892903517074052,
      "n_iterations": 375,
      "n_nonzero_coefficients": 28,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04730851948261261,
        "right_subspace_overlap_bottom_k": -0.15644074976444244,
        "interaction_matrix_overlap_top_k": 0.030360912904143333,
        "interaction_matrix_overlap_bottom_k": -0.010450848378241062,
        "effective_rank": -0.006759911775588989,
        "effective_rank_mergeability_score": 0.006713410839438438,
        "stable_rank": -0.01176681462675333,
        "spectral_gap": 0.009280247613787651,
        "singular_value_ratio": -0.008836875669658184,
        "layerwise_effective_rank": -0.019158905372023582,
        "layerwise_effective_rank_mergeability_score": 0.020002776756882668,
        "task_vector_cosine_similarity": 0.03577582910656929,
        "task_vector_l2_distance": -0.027345366775989532,
        "task_vector_dot_product": 0.021247517317533493,
        "weight_space_angle": -0.04185526818037033,
        "task_vector_magnitude_ratio": -0.008772184140980244,
        "singular_value_overlap": 0.0479060597717762,
        "subspace_overlap": 0.022295471280813217,
        "right_subspace_overlap": 0.04919459670782089,
        "activation_l2_distance": -0.03318082168698311,
        "activation_cosine_similarity": 0.07902733981609344,
        "activation_magnitude_ratio": -0.05613492429256439,
        "activation_dot_product": 0.13716913759708405,
        "encoder_gradient_cosine_similarity": 0.06283914297819138,
        "encoder_gradient_l2_distance": -0.12820081412792206,
        "encoder_gradient_dot_product": 0.0020087200682610273,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.15519022941589355,
        "input_gradient_dot_product": -0.059458229690790176
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7291207463546748,
      "val_r": 0.6171089820978894,
      "n_iterations": 291,
      "n_nonzero_coefficients": 29,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.032229792326688766,
        "right_subspace_overlap_bottom_k": -0.08984437584877014,
        "interaction_matrix_overlap_top_k": 0.004168340470641851,
        "interaction_matrix_overlap_bottom_k": 0.03143477439880371,
        "effective_rank": 0.004820946138352156,
        "effective_rank_mergeability_score": -0.0044808052480220795,
        "stable_rank": 0.0013353475369513035,
        "spectral_gap": -0.002590474672615528,
        "singular_value_ratio": 0.003441112581640482,
        "layerwise_effective_rank": -0.001685063005425036,
        "layerwise_effective_rank_mergeability_score": 0.0016441521001979709,
        "task_vector_cosine_similarity": 0.005538849160075188,
        "task_vector_l2_distance": -0.009463952854275703,
        "task_vector_dot_product": 0.0033239307813346386,
        "weight_space_angle": -0.006874145939946175,
        "task_vector_magnitude_ratio": 0.0025017333682626486,
        "singular_value_overlap": 0.01872309297323227,
        "subspace_overlap": 0.008907695300877094,
        "right_subspace_overlap": 0.012579855509102345,
        "activation_l2_distance": 0.008608666248619556,
        "activation_cosine_similarity": 0.04269815608859062,
        "activation_magnitude_ratio": -0.005912551656365395,
        "activation_dot_product": 0.03131917864084244,
        "encoder_gradient_cosine_similarity": 0.013735847547650337,
        "encoder_gradient_l2_distance": -0.0728398859500885,
        "encoder_gradient_dot_product": 0.011044754646718502,
        "input_gradient_cosine_similarity": 0.0075733899138867855,
        "input_gradient_l2_distance": -0.06928267329931259,
        "input_gradient_dot_product": -0.03125787153840065
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.780574654898055,
      "val_r": 0.37075940241764305,
      "n_iterations": 370,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.06272883713245392,
        "right_subspace_overlap_bottom_k": -0.12480125576257706,
        "interaction_matrix_overlap_top_k": 0.004737778566777706,
        "interaction_matrix_overlap_bottom_k": 0.04050017148256302,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.002074427902698517,
        "spectral_gap": -0.004173255525529385,
        "singular_value_ratio": 0.004181772004812956,
        "layerwise_effective_rank": -0.0073715029284358025,
        "layerwise_effective_rank_mergeability_score": 0.0060626547783613205,
        "task_vector_cosine_similarity": -0.019421666860580444,
        "task_vector_l2_distance": -0.001323436270467937,
        "task_vector_dot_product": -0.008421351201832294,
        "weight_space_angle": 0.0210723914206028,
        "task_vector_magnitude_ratio": 0.0020881269592791796,
        "singular_value_overlap": 0.011056353338062763,
        "subspace_overlap": -0.009664081037044525,
        "right_subspace_overlap": 0.05463835224509239,
        "activation_l2_distance": -0.028638124465942383,
        "activation_cosine_similarity": 0.06260645389556885,
        "activation_magnitude_ratio": -0.015163451433181763,
        "activation_dot_product": -0.012982867658138275,
        "encoder_gradient_cosine_similarity": 0.01679292879998684,
        "encoder_gradient_l2_distance": -0.11099714040756226,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.007534513249993324,
        "input_gradient_l2_distance": -0.04657342657446861,
        "input_gradient_dot_product": 0.0011879266239702702
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.8703726300704653,
      "val_r": 0.35261318811597475,
      "n_iterations": 826,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01377064548432827,
        "right_subspace_overlap_bottom_k": -0.10628422349691391,
        "interaction_matrix_overlap_top_k": -0.028126824647188187,
        "interaction_matrix_overlap_bottom_k": 0.09949558228254318,
        "effective_rank": 0.003782300977036357,
        "effective_rank_mergeability_score": -0.004409360699355602,
        "stable_rank": 0.0,
        "spectral_gap": -0.001052685547620058,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002173621905967593,
        "layerwise_effective_rank_mergeability_score": 0.014270767569541931,
        "task_vector_cosine_similarity": -0.0011207431089133024,
        "task_vector_l2_distance": 0.00528627447783947,
        "task_vector_dot_product": 0.004329116083681583,
        "weight_space_angle": -0.0027923118323087692,
        "task_vector_magnitude_ratio": 0.0022181274835020304,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.014022380113601685,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.019153928384184837,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.012499413453042507,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008760460652410984,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0017531519988551736,
        "input_gradient_l2_distance": -0.013094248250126839,
        "input_gradient_dot_product": -0.003561051795259118
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7990119390652979,
      "val_r": 0.5904187223872387,
      "n_iterations": 287,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.05268121138215065,
        "right_subspace_overlap_bottom_k": -0.1320262998342514,
        "interaction_matrix_overlap_top_k": -0.008647006936371326,
        "interaction_matrix_overlap_bottom_k": 0.07437389343976974,
        "effective_rank": 0.0030593411065638065,
        "effective_rank_mergeability_score": -0.0034882300533354282,
        "stable_rank": 0.002717456081882119,
        "spectral_gap": -0.0017266711220145226,
        "singular_value_ratio": 0.0018279465148225427,
        "layerwise_effective_rank": -0.006283259484916925,
        "layerwise_effective_rank_mergeability_score": 0.012388870120048523,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.008313314989209175,
        "task_vector_dot_product": -0.0043460107408463955,
        "weight_space_angle": 0.0017427755519747734,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.007463868707418442,
        "subspace_overlap": -0.007393007632344961,
        "right_subspace_overlap": 0.02328440733253956,
        "activation_l2_distance": -0.009903808124363422,
        "activation_cosine_similarity": -0.002378950361162424,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.019171910360455513,
        "encoder_gradient_cosine_similarity": 0.012958293780684471,
        "encoder_gradient_l2_distance": -0.04805904999375343,
        "encoder_gradient_dot_product": 0.0027804572600871325,
        "input_gradient_cosine_similarity": 0.005468939896672964,
        "input_gradient_l2_distance": -0.02858654595911503,
        "input_gradient_dot_product": -0.009589515626430511
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8104690424650616,
      "val_r": 0.2362852093473216,
      "n_iterations": 233,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.049209970980882645,
        "right_subspace_overlap_bottom_k": -0.06643228232860565,
        "interaction_matrix_overlap_top_k": 0.002340862527489662,
        "interaction_matrix_overlap_bottom_k": 0.008703320287168026,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0021660870406776667,
        "task_vector_l2_distance": 0.012770534493029118,
        "task_vector_dot_product": -0.0019515047315508127,
        "weight_space_angle": 0.0021229260601103306,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.025562254711985588,
        "subspace_overlap": -0.029598059132695198,
        "right_subspace_overlap": 0.015978429466485977,
        "activation_l2_distance": -0.00894690677523613,
        "activation_cosine_similarity": 0.05295422673225403,
        "activation_magnitude_ratio": -0.004973527044057846,
        "activation_dot_product": -0.00195766007527709,
        "encoder_gradient_cosine_similarity": 0.0015732678584754467,
        "encoder_gradient_l2_distance": -0.06257523596286774,
        "encoder_gradient_dot_product": 0.002060783328488469,
        "input_gradient_cosine_similarity": 0.0032012229785323143,
        "input_gradient_l2_distance": -0.008488493040204048,
        "input_gradient_dot_product": -0.0017669845838099718
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8032700045075876,
      "val_r": 0.7476920294000085,
      "n_iterations": 354,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01964999921619892,
        "right_subspace_overlap_bottom_k": -0.07547663152217865,
        "interaction_matrix_overlap_top_k": -0.0030373618938028812,
        "interaction_matrix_overlap_bottom_k": 0.029347887262701988,
        "effective_rank": 0.0012174341827630997,
        "effective_rank_mergeability_score": -0.00195487798191607,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.015559349209070206,
        "task_vector_l2_distance": 0.007511953357607126,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.012718630023300648,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.009271588176488876,
        "subspace_overlap": -0.0024871351197361946,
        "right_subspace_overlap": 0.04209384694695473,
        "activation_l2_distance": 0.015043631196022034,
        "activation_cosine_similarity": 0.05061688274145126,
        "activation_magnitude_ratio": -0.004303815774619579,
        "activation_dot_product": -0.011475986801087856,
        "encoder_gradient_cosine_similarity": 0.006162513047456741,
        "encoder_gradient_l2_distance": -0.043800558894872665,
        "encoder_gradient_dot_product": -0.0011187184136360884,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.022208206355571747,
        "input_gradient_dot_product": -0.004782133270055056
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7773810872640365,
      "val_r": 0.7818297702820192,
      "n_iterations": 389,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02882099710404873,
        "right_subspace_overlap_bottom_k": -0.08743973821401596,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.021245257928967476,
        "effective_rank": 0.0010515697067603469,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0015479987487196922,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.012487109750509262,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0025010660756379366,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.016053665429353714,
        "subspace_overlap": -0.015258722938597202,
        "right_subspace_overlap": 0.03884014114737511,
        "activation_l2_distance": 0.0026693129912018776,
        "activation_cosine_similarity": 0.060859255492687225,
        "activation_magnitude_ratio": -0.005834565497934818,
        "activation_dot_product": -0.015425305813550949,
        "encoder_gradient_cosine_similarity": 0.010096612386405468,
        "encoder_gradient_l2_distance": -0.0810745358467102,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.003306034253910184,
        "input_gradient_l2_distance": -0.025153907015919685,
        "input_gradient_dot_product": -0.014113114215433598
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8294592282881545,
      "val_r": 0.8358442794544827,
      "n_iterations": 300,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.03394048288464546,
        "right_subspace_overlap_bottom_k": -0.09644437581300735,
        "interaction_matrix_overlap_top_k": -0.017266426235437393,
        "interaction_matrix_overlap_bottom_k": 0.0809098482131958,
        "effective_rank": 0.004783712327480316,
        "effective_rank_mergeability_score": -0.00525104021653533,
        "stable_rank": 0.0028143206145614386,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.006398811936378479,
        "layerwise_effective_rank_mergeability_score": 0.005578687414526939,
        "task_vector_cosine_similarity": 0.0046905456110835075,
        "task_vector_l2_distance": 0.005637043155729771,
        "task_vector_dot_product": 0.0014058604137971997,
        "weight_space_angle": -0.0031706031877547503,
        "task_vector_magnitude_ratio": -0.0019431489054113626,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.02487192489206791,
        "right_subspace_overlap": 0.00584295392036438,
        "activation_l2_distance": 0.005453609861433506,
        "activation_cosine_similarity": 0.02147425338625908,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.005963167175650597,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.015826178714632988,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.004233780317008495,
        "input_gradient_l2_distance": -0.012209777720272541,
        "input_gradient_dot_product": -0.0048857699148356915
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8258821655521162,
      "val_r": 0.8009921059177965,
      "n_iterations": 592,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.008629260584712029,
        "right_subspace_overlap_bottom_k": -0.10558179020881653,
        "interaction_matrix_overlap_top_k": -0.014241974800825119,
        "interaction_matrix_overlap_bottom_k": 0.08683852106332779,
        "effective_rank": 0.010775544680655003,
        "effective_rank_mergeability_score": -0.013458224013447762,
        "stable_rank": -0.006484506651759148,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.009074307046830654,
        "layerwise_effective_rank_mergeability_score": 0.009211142547428608,
        "task_vector_cosine_similarity": 0.0016881102928891778,
        "task_vector_l2_distance": 0.008684411644935608,
        "task_vector_dot_product": -0.0026188238989561796,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0013570302398875356,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.014209505170583725,
        "activation_l2_distance": -0.0051995315589010715,
        "activation_cosine_similarity": 0.016419902443885803,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.010872146114706993,
        "encoder_gradient_cosine_similarity": 0.0016879482427611947,
        "encoder_gradient_l2_distance": -0.01208570972084999,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.011205845512449741,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.8196899248039113,
      "val_r": 0.7136440569306393,
      "n_iterations": 263,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04481792449951172,
        "right_subspace_overlap_bottom_k": -0.07275110483169556,
        "interaction_matrix_overlap_top_k": -0.004536018706858158,
        "interaction_matrix_overlap_bottom_k": 0.007823394611477852,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0011317281750962138,
        "task_vector_l2_distance": 0.0015360212419182062,
        "task_vector_dot_product": -0.011079948395490646,
        "weight_space_angle": -0.001775022828951478,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.026019684970378876,
        "subspace_overlap": -0.02797703444957733,
        "right_subspace_overlap": 0.047291118651628494,
        "activation_l2_distance": 0.0036026365123689175,
        "activation_cosine_similarity": 0.048700131475925446,
        "activation_magnitude_ratio": -0.009408175013959408,
        "activation_dot_product": -0.01718882843852043,
        "encoder_gradient_cosine_similarity": 0.004349647089838982,
        "encoder_gradient_l2_distance": -0.07581435143947601,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.019071808084845543,
        "input_gradient_dot_product": -0.011222224682569504
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8011389978021523,
      "val_r": 0.7734663939773697,
      "n_iterations": 217,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.04676549509167671,
        "right_subspace_overlap_bottom_k": -0.11911236494779587,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.07466328889131546,
        "effective_rank": 0.006242389790713787,
        "effective_rank_mergeability_score": -0.0033150098752230406,
        "stable_rank": -0.0017933847848325968,
        "spectral_gap": -0.0033008644822984934,
        "singular_value_ratio": 0.003596107941120863,
        "layerwise_effective_rank": -0.010181856341660023,
        "layerwise_effective_rank_mergeability_score": 0.012070016004145145,
        "task_vector_cosine_similarity": -0.011100090108811855,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0094254519790411,
        "weight_space_angle": 0.00950655061751604,
        "task_vector_magnitude_ratio": 0.002691621659323573,
        "singular_value_overlap": 0.009914559312164783,
        "subspace_overlap": -0.003977013286203146,
        "right_subspace_overlap": 0.019458139315247536,
        "activation_l2_distance": -0.002181436400860548,
        "activation_cosine_similarity": 0.02948758751153946,
        "activation_magnitude_ratio": -0.009683242999017239,
        "activation_dot_product": 0.008686789311468601,
        "encoder_gradient_cosine_similarity": 0.01012042723596096,
        "encoder_gradient_l2_distance": -0.0599873922765255,
        "encoder_gradient_dot_product": -0.0011609925422817469,
        "input_gradient_cosine_similarity": 0.0042988089844584465,
        "input_gradient_l2_distance": -0.02917511761188507,
        "input_gradient_dot_product": -0.009138106368482113
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.768797508020277,
      "val_r": 0.7009664642315763,
      "n_iterations": 444,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.03275538608431816,
        "right_subspace_overlap_bottom_k": -0.11306658387184143,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.01366149540990591,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0010094153694808483,
        "layerwise_effective_rank": -0.008724241517484188,
        "layerwise_effective_rank_mergeability_score": 0.008528485894203186,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.005761174019426107,
        "task_vector_dot_product": -0.005798427853733301,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.03565770760178566,
        "subspace_overlap": -0.005544393789023161,
        "right_subspace_overlap": 0.05365310609340668,
        "activation_l2_distance": -0.011321578174829483,
        "activation_cosine_similarity": 0.0597548671066761,
        "activation_magnitude_ratio": -0.005049116909503937,
        "activation_dot_product": 0.02747291699051857,
        "encoder_gradient_cosine_similarity": 0.010599849745631218,
        "encoder_gradient_l2_distance": -0.13135136663913727,
        "encoder_gradient_dot_product": 0.0035267015919089317,
        "input_gradient_cosine_similarity": -0.0024720404762774706,
        "input_gradient_l2_distance": -0.10901626944541931,
        "input_gradient_dot_product": -0.015084308572113514
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8193951842384096,
      "val_r": 0.7180083532085991,
      "n_iterations": 336,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02551516331732273,
        "right_subspace_overlap_bottom_k": -0.10423911362886429,
        "interaction_matrix_overlap_top_k": -0.010190502740442753,
        "interaction_matrix_overlap_bottom_k": 0.08495497703552246,
        "effective_rank": 0.013060382567346096,
        "effective_rank_mergeability_score": -0.00843674037605524,
        "stable_rank": -0.0039045941084623337,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.011031667701900005,
        "layerwise_effective_rank_mergeability_score": 0.011708109639585018,
        "task_vector_cosine_similarity": -0.002972960937768221,
        "task_vector_l2_distance": 0.005684764124453068,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.002517280401661992,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0033251584973186255,
        "subspace_overlap": -0.008260194212198257,
        "right_subspace_overlap": 0.007750269956886768,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.018525488674640656,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.002540506422519684,
        "encoder_gradient_cosine_similarity": 0.002358047291636467,
        "encoder_gradient_l2_distance": -0.022565932944417,
        "encoder_gradient_dot_product": -0.0016587763093411922,
        "input_gradient_cosine_similarity": 0.002299696207046509,
        "input_gradient_l2_distance": -0.008824353106319904,
        "input_gradient_dot_product": -0.0030956841073930264
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8533747423599914,
      "val_r": 0.717342958750952,
      "n_iterations": 236,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.00539645180106163,
        "right_subspace_overlap_bottom_k": -0.02409028261899948,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0013660467229783535,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.007738652639091015,
        "layerwise_effective_rank_mergeability_score": 0.003319147974252701,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.03524653613567352,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0017979579279199243,
        "singular_value_overlap": 0.014586539939045906,
        "subspace_overlap": -0.0011752640129998326,
        "right_subspace_overlap": -0.005359017290174961,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.017268221825361252,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": 0.060866761952638626,
        "encoder_gradient_cosine_similarity": 0.0023008910939097404,
        "encoder_gradient_l2_distance": -0.09618279337882996,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0053947982378304005,
        "input_gradient_l2_distance": -0.057039353996515274,
        "input_gradient_dot_product": -0.0047543905675411224
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.1,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}