{
  "weight_avg": {
    "aggregate_metrics": {
      "train_r": 0.5926168702577306,
      "train_p": 7.56942168062438e-305,
      "val_r": 0.4396257068269801,
      "val_p": 2.3738329626086106e-18
    },
    "per_fold_stats": {
      "train_r_mean": 0.7471577939569263,
      "train_r_std": 0.027050015865128108,
      "val_r_mean": 0.6253752447783778,
      "val_r_std": 0.16719451651075096,
      "n_nonzero_mean": 21.25,
      "n_nonzero_std": 3.207413287993925
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.013724428601562977,
      "right_subspace_overlap_bottom_k": -0.017672907561063766,
      "interaction_matrix_overlap_top_k": 0.0005202004685997963,
      "interaction_matrix_overlap_bottom_k": 0.0018436642130836844,
      "effective_rank": -0.0007864800281822681,
      "effective_rank_mergeability_score": 0.0009055379778146744,
      "stable_rank": -0.0012206590035930276,
      "spectral_gap": 4.150969471083954e-05,
      "singular_value_ratio": 4.0163868106901646e-06,
      "layerwise_effective_rank": -0.0017830576980486512,
      "layerwise_effective_rank_mergeability_score": 0.001600724644958973,
      "task_vector_cosine_similarity": -0.000994836213067174,
      "task_vector_l2_distance": -0.008177132345736027,
      "task_vector_dot_product": -0.0024344122502952814,
      "weight_space_angle": 0.0016768056666478515,
      "task_vector_magnitude_ratio": -0.0007848691311664879,
      "singular_value_overlap": 0.00024485308676958084,
      "subspace_overlap": -0.0008565217140130699,
      "right_subspace_overlap": 0.01227252185344696,
      "activation_l2_distance": -0.002632628194987774,
      "activation_cosine_similarity": 0.01959354244172573,
      "activation_magnitude_ratio": -0.004180660471320152,
      "activation_dot_product": 0.005457724444568157,
      "encoder_gradient_cosine_similarity": 0.004266757518053055,
      "encoder_gradient_l2_distance": -0.044720977544784546,
      "encoder_gradient_dot_product": 0.0013078686315566301,
      "input_gradient_cosine_similarity": 0.0021346337161958218,
      "input_gradient_l2_distance": -0.03384353220462799,
      "input_gradient_dot_product": -0.007391627877950668
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.007847652770578861,
      "right_subspace_overlap_bottom_k": 0.005689507350325584,
      "interaction_matrix_overlap_top_k": 0.0020071661565452814,
      "interaction_matrix_overlap_bottom_k": 0.0028948558028787374,
      "effective_rank": 0.0013003022177144885,
      "effective_rank_mergeability_score": 0.0013669293839484453,
      "stable_rank": 0.0015239563072100282,
      "spectral_gap": 0.0012949913507327437,
      "singular_value_ratio": 0.0013379754964262247,
      "layerwise_effective_rank": 0.0012649433920159936,
      "layerwise_effective_rank_mergeability_score": 0.0014054446946829557,
      "task_vector_cosine_similarity": 0.0044459449127316475,
      "task_vector_l2_distance": 0.007551178336143494,
      "task_vector_dot_product": 0.0018911801744252443,
      "weight_space_angle": 0.0033015210647135973,
      "task_vector_magnitude_ratio": 0.0012510051019489765,
      "singular_value_overlap": 0.0032466573175042868,
      "subspace_overlap": 0.0015549649251624942,
      "right_subspace_overlap": 0.006801805924624205,
      "activation_l2_distance": 0.004796684253960848,
      "activation_cosine_similarity": 0.007266839034855366,
      "activation_magnitude_ratio": 0.0023644070606678724,
      "activation_dot_product": 0.010821906849741936,
      "encoder_gradient_cosine_similarity": 0.002439163625240326,
      "encoder_gradient_l2_distance": 0.018027573823928833,
      "encoder_gradient_dot_product": 0.0019537152256816626,
      "input_gradient_cosine_similarity": 0.002079788828268647,
      "input_gradient_l2_distance": 0.015846868976950645,
      "input_gradient_dot_product": 0.0038701763842254877
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 1.0,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.55,
      "interaction_matrix_overlap_bottom_k": 0.65,
      "effective_rank": 0.35,
      "effective_rank_mergeability_score": 0.4,
      "stable_rank": 0.55,
      "spectral_gap": 0.45,
      "singular_value_ratio": 0.45,
      "layerwise_effective_rank": 0.8,
      "layerwise_effective_rank_mergeability_score": 0.75,
      "task_vector_cosine_similarity": 0.55,
      "task_vector_l2_distance": 0.85,
      "task_vector_dot_product": 0.75,
      "weight_space_angle": 0.8,
      "task_vector_magnitude_ratio": 0.6,
      "singular_value_overlap": 0.55,
      "subspace_overlap": 0.4,
      "right_subspace_overlap": 0.95,
      "activation_l2_distance": 0.85,
      "activation_cosine_similarity": 1.0,
      "activation_magnitude_ratio": 0.95,
      "activation_dot_product": 0.8,
      "encoder_gradient_cosine_similarity": 0.95,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.55,
      "input_gradient_cosine_similarity": 0.8,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.95
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7641664039687966,
        "val_r": 0.6153039611742014,
        "n_iterations": 268,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009024444036185741,
          "right_subspace_overlap_bottom_k": -0.008244887925684452,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0019921937491744757,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.003889478277415037,
          "task_vector_dot_product": -0.0032076286152005196,
          "weight_space_angle": 0.0021412780042737722,
          "task_vector_magnitude_ratio": -0.0025716102682054043,
          "singular_value_overlap": -0.003299061441794038,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.005398551467806101,
          "activation_l2_distance": 0.0030883632134646177,
          "activation_cosine_similarity": 0.0194547101855278,
          "activation_magnitude_ratio": -0.004809306003153324,
          "activation_dot_product": -0.003896509064361453,
          "encoder_gradient_cosine_similarity": 0.0013710171915590763,
          "encoder_gradient_l2_distance": -0.023211752995848656,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0019323891028761864,
          "input_gradient_l2_distance": -0.014405721798539162,
          "input_gradient_dot_product": -0.00660921772941947
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.730118415975912,
        "val_r": 0.8074247432351749,
        "n_iterations": 363,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01893748715519905,
          "right_subspace_overlap_bottom_k": -0.022701263427734375,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0012041323352605104,
          "stable_rank": -0.00200723041780293,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0019095820607617497,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0028800847940146923,
          "task_vector_l2_distance": -0.01565822958946228,
          "task_vector_dot_product": -0.0032834301237016916,
          "weight_space_angle": -0.0028945463709533215,
          "task_vector_magnitude_ratio": -0.001960551831871271,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.023850498721003532,
          "activation_l2_distance": -0.010261435061693192,
          "activation_cosine_similarity": 0.027808653190732002,
          "activation_magnitude_ratio": -0.009713947772979736,
          "activation_dot_product": 0.002853161422535777,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.0780031606554985,
          "encoder_gradient_dot_product": 0.0011548787588253617,
          "input_gradient_cosine_similarity": 0.003538701683282852,
          "input_gradient_l2_distance": -0.055419743061065674,
          "input_gradient_dot_product": -0.007235167548060417
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.754263263771205,
        "val_r": 0.7039496065953981,
        "n_iterations": 251,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.010079054161906242,
          "right_subspace_overlap_bottom_k": -0.01398113090544939,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.004095263779163361,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0014630267396569252,
          "singular_value_ratio": 0.0011625145561993122,
          "layerwise_effective_rank": -0.0014414484612643719,
          "layerwise_effective_rank_mergeability_score": 0.0023569809272885323,
          "task_vector_cosine_similarity": -0.002901046071201563,
          "task_vector_l2_distance": -0.003846214385703206,
          "task_vector_dot_product": -0.0013853444252163172,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0033738981001079082,
          "subspace_overlap": -0.0014376253820955753,
          "right_subspace_overlap": 0.013598824851214886,
          "activation_l2_distance": -0.0026845026295632124,
          "activation_cosine_similarity": 0.011262585408985615,
          "activation_magnitude_ratio": -0.004477307666093111,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0035502049140632153,
          "encoder_gradient_l2_distance": -0.027852047234773636,
          "encoder_gradient_dot_product": 0.0013247421011328697,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.021327678114175797,
          "input_gradient_dot_product": -0.004185395315289497
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7196474653919857,
        "val_r": 0.6810674152992265,
        "n_iterations": 352,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02211422473192215,
          "right_subspace_overlap_bottom_k": -0.019439078867435455,
          "interaction_matrix_overlap_top_k": 0.001992088044062257,
          "interaction_matrix_overlap_bottom_k": 0.0015709990402683616,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0016915041487663984,
          "singular_value_ratio": 0.001967239659279585,
          "layerwise_effective_rank": -0.0013050900306552649,
          "layerwise_effective_rank_mergeability_score": 0.0023458702489733696,
          "task_vector_cosine_similarity": -0.004860764369368553,
          "task_vector_l2_distance": -0.005447322968393564,
          "task_vector_dot_product": -0.003574846312403679,
          "weight_space_angle": 0.004859617445617914,
          "task_vector_magnitude_ratio": 0.0011478158412501216,
          "singular_value_overlap": 0.0010869349353015423,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.012776152230799198,
          "activation_l2_distance": -0.004869913682341576,
          "activation_cosine_similarity": 0.01670333370566368,
          "activation_magnitude_ratio": -0.0033908402547240257,
          "activation_dot_product": 0.010115502402186394,
          "encoder_gradient_cosine_similarity": 0.0034999498166143894,
          "encoder_gradient_l2_distance": -0.041647572070360184,
          "encoder_gradient_dot_product": 0.006208838429301977,
          "input_gradient_cosine_similarity": 0.0010595244821161032,
          "input_gradient_l2_distance": -0.046172238886356354,
          "input_gradient_dot_product": -0.01623384840786457
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7462125872818015,
        "val_r": 0.7514684124466295,
        "n_iterations": 440,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004185941070318222,
          "right_subspace_overlap_bottom_k": -0.013581870123744011,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0010601093526929617,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0038691931404173374,
          "task_vector_dot_product": -0.005899668671190739,
          "weight_space_angle": -0.001241954043507576,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.015142606571316719,
          "activation_l2_distance": 0.004897105973213911,
          "activation_cosine_similarity": 0.01942877098917961,
          "activation_magnitude_ratio": -0.001824579550884664,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0038254931569099426,
          "encoder_gradient_l2_distance": -0.03272353112697601,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0038864687085151672,
          "input_gradient_l2_distance": -0.014108595438301563,
          "input_gradient_dot_product": -0.004445265047252178
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7525996654142924,
        "val_r": 0.7391552716275007,
        "n_iterations": 478,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014290638267993927,
          "right_subspace_overlap_bottom_k": -0.017581820487976074,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.004876903723925352,
          "effective_rank": -0.0015727923018857837,
          "effective_rank_mergeability_score": 0.0023316596634685993,
          "stable_rank": -0.002273554913699627,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0014160670107230544,
          "layerwise_effective_rank": -0.004074912052601576,
          "layerwise_effective_rank_mergeability_score": 0.003375114407390356,
          "task_vector_cosine_similarity": -0.004311664029955864,
          "task_vector_l2_distance": -0.018005521968007088,
          "task_vector_dot_product": -0.002802510280162096,
          "weight_space_angle": 0.002506366465240717,
          "task_vector_magnitude_ratio": -0.0015196388121694326,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0018256640760228038,
          "right_subspace_overlap": 0.017304373905062675,
          "activation_l2_distance": -0.005916747730225325,
          "activation_cosine_similarity": 0.025627408176660538,
          "activation_magnitude_ratio": -0.0027990953531116247,
          "activation_dot_product": 0.01228634174913168,
          "encoder_gradient_cosine_similarity": 0.00622007017955184,
          "encoder_gradient_l2_distance": -0.0587986521422863,
          "encoder_gradient_dot_product": 0.0020890221931040287,
          "input_gradient_cosine_similarity": -0.00152248190715909,
          "input_gradient_l2_distance": -0.043945275247097015,
          "input_gradient_dot_product": -0.00805825088173151
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.7259063729155306,
        "val_r": 0.49780274754581244,
        "n_iterations": 304,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009785105474293232,
          "right_subspace_overlap_bottom_k": -0.0200701504945755,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.006183536723256111,
          "effective_rank": -0.0012233412126079202,
          "effective_rank_mergeability_score": 0.0012737842043861747,
          "stable_rank": -0.0013075992465019226,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0012396026868373156,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0015219768974930048,
          "task_vector_dot_product": -0.0026822444051504135,
          "weight_space_angle": -0.0012440318241715431,
          "task_vector_magnitude_ratio": -0.00120331603102386,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0034993065055459738,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.016480136662721634,
          "activation_magnitude_ratio": -0.0015140390023589134,
          "activation_dot_product": 0.003780159866437316,
          "encoder_gradient_cosine_similarity": 0.005221265833824873,
          "encoder_gradient_l2_distance": -0.01721865125000477,
          "encoder_gradient_dot_product": 0.0022854001726955175,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0179677065461874,
          "input_gradient_dot_product": -0.006860287860035896
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7060389098640025,
        "val_r": 0.2722380462033936,
        "n_iterations": 479,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.030054859817028046,
          "right_subspace_overlap_bottom_k": -0.02478799968957901,
          "interaction_matrix_overlap_top_k": -0.002422543242573738,
          "interaction_matrix_overlap_bottom_k": 0.004152490757405758,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0017252020770683885,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.001073662657290697,
          "layerwise_effective_rank_mergeability_score": 0.0021859491243958473,
          "task_vector_cosine_similarity": -0.010733035393059254,
          "task_vector_l2_distance": -0.014200001955032349,
          "task_vector_dot_product": -0.002910345559939742,
          "weight_space_angle": 0.010968262329697609,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0043721566908061504,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.024936897680163383,
          "activation_l2_distance": -0.011034197174012661,
          "activation_cosine_similarity": 0.029618892818689346,
          "activation_magnitude_ratio": -0.004215111956000328,
          "activation_dot_product": -0.0042027672752738,
          "encoder_gradient_cosine_similarity": 0.010568803176283836,
          "encoder_gradient_l2_distance": -0.06069960072636604,
          "encoder_gradient_dot_product": 0.0020332925487309694,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.038265760987997055,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7591427971681964,
        "val_r": 0.6189433560218425,
        "n_iterations": 187,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.017747929319739342,
          "right_subspace_overlap_bottom_k": -0.021278705447912216,
          "interaction_matrix_overlap_top_k": 0.0021786759607493877,
          "interaction_matrix_overlap_bottom_k": 0.0065699415281414986,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.001526752021163702,
          "spectral_gap": -0.0031862056348472834,
          "singular_value_ratio": 0.0027245250530540943,
          "layerwise_effective_rank": -0.004383462481200695,
          "layerwise_effective_rank_mergeability_score": 0.003994102589786053,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.004722667392343283,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0012491440866142511,
          "task_vector_magnitude_ratio": 0.0019025335786864161,
          "singular_value_overlap": -0.0019733207300305367,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.006208611186593771,
          "activation_l2_distance": -0.0044011203572154045,
          "activation_cosine_similarity": 0.017060110345482826,
          "activation_magnitude_ratio": -0.005756118334829807,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.004744283854961395,
          "encoder_gradient_l2_distance": -0.02991599589586258,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.004956371150910854,
          "input_gradient_l2_distance": -0.02839987352490425,
          "input_gradient_dot_product": -0.007848180830478668
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7349620442817367,
        "val_r": 0.6152144310905914,
        "n_iterations": 254,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014216461218893528,
          "right_subspace_overlap_bottom_k": -0.023823179304599762,
          "interaction_matrix_overlap_top_k": 0.003184329252690077,
          "interaction_matrix_overlap_bottom_k": 0.003712557489052415,
          "effective_rank": -0.0033978791907429695,
          "effective_rank_mergeability_score": 0.0024487380869686604,
          "stable_rank": -0.0020762972999364138,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.002724051009863615,
          "layerwise_effective_rank_mergeability_score": 0.0033531985245645046,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012868841178715229,
          "task_vector_dot_product": -0.006415230222046375,
          "weight_space_angle": -0.0022127665579319,
          "task_vector_magnitude_ratio": -0.0013413499109447002,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.022689227014780045,
          "activation_l2_distance": 0.00134569825604558,
          "activation_cosine_similarity": -0.0021292383316904306,
          "activation_magnitude_ratio": -0.005899706389755011,
          "activation_dot_product": -0.010568046011030674,
          "encoder_gradient_cosine_similarity": 0.008499148301780224,
          "encoder_gradient_l2_distance": -0.05076603963971138,
          "encoder_gradient_dot_product": 0.0010547306155785918,
          "input_gradient_cosine_similarity": 0.004541718401014805,
          "input_gradient_l2_distance": -0.053588271141052246,
          "input_gradient_dot_product": -0.002088692970573902
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7054484165480448,
        "val_r": 0.26136735414719764,
        "n_iterations": 310,
        "n_nonzero_coefficients": 27,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.012821526266634464,
          "right_subspace_overlap_bottom_k": -0.022019999101758003,
          "interaction_matrix_overlap_top_k": 0.005976258777081966,
          "interaction_matrix_overlap_bottom_k": -0.004340771585702896,
          "effective_rank": -0.004729022271931171,
          "effective_rank_mergeability_score": 0.005406461656093597,
          "stable_rank": -0.006539618596434593,
          "spectral_gap": 0.0023966648150235415,
          "singular_value_ratio": -0.003477207152172923,
          "layerwise_effective_rank": -0.0026298908051103354,
          "layerwise_effective_rank_mergeability_score": 0.002686650026589632,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.004734812304377556,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0020765839144587517,
          "task_vector_magnitude_ratio": -0.0030663474462926388,
          "singular_value_overlap": 0.0060920435935258865,
          "subspace_overlap": -0.002572115743532777,
          "right_subspace_overlap": 0.008638577535748482,
          "activation_l2_distance": -0.008787206374108791,
          "activation_cosine_similarity": 0.03005586937069893,
          "activation_magnitude_ratio": -0.005545899737626314,
          "activation_dot_product": 0.029498688876628876,
          "encoder_gradient_cosine_similarity": 0.00320868450216949,
          "encoder_gradient_l2_distance": -0.0375351645052433,
          "encoder_gradient_dot_product": 0.005873317830264568,
          "input_gradient_cosine_similarity": 0.0014119953848421574,
          "input_gradient_l2_distance": -0.041166406124830246,
          "input_gradient_dot_product": -0.009113937616348267
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.757778231678134,
        "val_r": 0.7140636247528799,
        "n_iterations": 209,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.016635656356811523,
          "right_subspace_overlap_bottom_k": -0.015986386686563492,
          "interaction_matrix_overlap_top_k": 0.00211039325222373,
          "interaction_matrix_overlap_bottom_k": 0.007080634590238333,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.001175688928924501,
          "task_vector_cosine_similarity": -0.008779001422226429,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.00446076737716794,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0011676839785650373,
          "right_subspace_overlap": 0.004299739375710487,
          "activation_l2_distance": 0.0038857818581163883,
          "activation_cosine_similarity": 0.016197286546230316,
          "activation_magnitude_ratio": -0.003487923415377736,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.002721168100833893,
          "encoder_gradient_l2_distance": -0.018344474956393242,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0018111434765160084,
          "input_gradient_l2_distance": -0.012977203354239464,
          "input_gradient_dot_product": -0.0054010022431612015
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7278187325872895,
        "val_r": 0.8183353100284848,
        "n_iterations": 362,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006364190950989723,
          "right_subspace_overlap_bottom_k": -0.019425740465521812,
          "interaction_matrix_overlap_top_k": 0.0018334193155169487,
          "interaction_matrix_overlap_bottom_k": 0.0016667958116158843,
          "effective_rank": -0.001490980852395296,
          "effective_rank_mergeability_score": 0.0015422215219587088,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003506589448079467,
          "layerwise_effective_rank_mergeability_score": 0.0010039167245849967,
          "task_vector_cosine_similarity": 0.012441861443221569,
          "task_vector_l2_distance": -0.004098247736692429,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.008566705510020256,
          "activation_l2_distance": -0.007735807914286852,
          "activation_cosine_similarity": 0.023099595680832863,
          "activation_magnitude_ratio": -0.0028621808160096407,
          "activation_dot_product": 0.008074057288467884,
          "encoder_gradient_cosine_similarity": 0.0051712230779230595,
          "encoder_gradient_l2_distance": -0.058995574712753296,
          "encoder_gradient_dot_product": -0.0010496970498934388,
          "input_gradient_cosine_similarity": 0.0033295771572738886,
          "input_gradient_l2_distance": -0.043086856603622437,
          "input_gradient_dot_product": -0.007075058296322823
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7492601739327347,
        "val_r": 0.7859336855668348,
        "n_iterations": 253,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.021160941570997238,
          "right_subspace_overlap_bottom_k": -0.015317363664507866,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.001307524275034666,
          "layerwise_effective_rank": -0.002226038370281458,
          "layerwise_effective_rank_mergeability_score": 0.0021475672256201506,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.005956275388598442,
          "task_vector_dot_product": -0.0013219465035945177,
          "weight_space_angle": 0.002626296365633607,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0014109014300629497,
          "subspace_overlap": -0.0035646886099129915,
          "right_subspace_overlap": 0.009010427631437778,
          "activation_l2_distance": -0.007929421029984951,
          "activation_cosine_similarity": 0.021180855110287666,
          "activation_magnitude_ratio": -0.007386836223304272,
          "activation_dot_product": 0.0031920447945594788,
          "encoder_gradient_cosine_similarity": 0.0028589414432644844,
          "encoder_gradient_l2_distance": -0.06026922166347504,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0022507542744278908,
          "input_gradient_l2_distance": -0.028379365801811218,
          "input_gradient_dot_product": -0.00940703321248293
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.746111195906735,
        "val_r": 0.7806589203106321,
        "n_iterations": 341,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.006757151335477829,
          "right_subspace_overlap_bottom_k": -0.019720816984772682,
          "interaction_matrix_overlap_top_k": -0.00109042227268219,
          "interaction_matrix_overlap_bottom_k": 0.0011011767201125622,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010852421401068568,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.003485080087557435,
          "weight_space_angle": 0.0017584264278411865,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0,
          "subspace_overlap": -0.0015870778588578105,
          "right_subspace_overlap": 0.018559304997324944,
          "activation_l2_distance": 0.0010629722382873297,
          "activation_cosine_similarity": 0.0188126303255558,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.002221245551481843,
          "encoder_gradient_cosine_similarity": 0.005323193501681089,
          "encoder_gradient_l2_distance": -0.03288792446255684,
          "encoder_gradient_dot_product": 0.0010024562943726778,
          "input_gradient_cosine_similarity": 0.0017165795434266329,
          "input_gradient_l2_distance": -0.01384043786674738,
          "input_gradient_dot_product": -0.008036444894969463
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.7525361574010614,
        "val_r": 0.42756164255633106,
        "n_iterations": 423,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.005229653790593147,
          "right_subspace_overlap_bottom_k": -0.01776239648461342,
          "interaction_matrix_overlap_top_k": 0.0016371412202715874,
          "interaction_matrix_overlap_bottom_k": -0.0017884373664855957,
          "effective_rank": -0.0021998626179993153,
          "effective_rank_mergeability_score": 0.0018167418893426657,
          "stable_rank": -0.0017287026857957244,
          "spectral_gap": 0.0017883226973935962,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.001267933053895831,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.008537495508790016,
          "task_vector_dot_product": -0.00513132568448782,
          "weight_space_angle": 0.005972873419523239,
          "task_vector_magnitude_ratio": -0.0016035446897149086,
          "singular_value_overlap": 0.009759016335010529,
          "subspace_overlap": -0.0016931984573602676,
          "right_subspace_overlap": 0.017752300947904587,
          "activation_l2_distance": 0.00311657995916903,
          "activation_cosine_similarity": 0.015923980623483658,
          "activation_magnitude_ratio": -0.005429686047136784,
          "activation_dot_product": 0.004836803302168846,
          "encoder_gradient_cosine_similarity": 0.0027307490818202496,
          "encoder_gradient_l2_distance": -0.02157631143927574,
          "encoder_gradient_dot_product": 0.004180391319096088,
          "input_gradient_cosine_similarity": 0.0022879166062921286,
          "input_gradient_l2_distance": -0.03157041594386101,
          "input_gradient_dot_product": -0.01736190728843212
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7518049289246553,
        "val_r": 0.7278667931551717,
        "n_iterations": 206,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.016549212858080864,
          "right_subspace_overlap_bottom_k": -0.013803927227854729,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0010129817528650165,
          "spectral_gap": 0.0012918879510834813,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0015972958644852042,
          "layerwise_effective_rank_mergeability_score": 0.0014201197773218155,
          "task_vector_cosine_similarity": -0.002141362288966775,
          "task_vector_l2_distance": -0.010634166188538074,
          "task_vector_dot_product": -0.001959742046892643,
          "weight_space_angle": 0.005505270790308714,
          "task_vector_magnitude_ratio": -0.001316078007221222,
          "singular_value_overlap": 0.0,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.01093937549740076,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.020296644419431686,
          "activation_magnitude_ratio": -0.007883104495704174,
          "activation_dot_product": 0.006282632239162922,
          "encoder_gradient_cosine_similarity": 0.006608420517295599,
          "encoder_gradient_l2_distance": -0.05440318211913109,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.027965735644102097,
          "input_gradient_dot_product": -0.007845163345336914
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7394327794364381,
        "val_r": 0.6074179170427889,
        "n_iterations": 196,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.015506061725318432,
          "right_subspace_overlap_bottom_k": -0.016460388898849487,
          "interaction_matrix_overlap_top_k": -0.0016651960322633386,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": -0.001115723280236125,
          "effective_rank_mergeability_score": 0.002087018918246031,
          "stable_rank": -0.0019379123114049435,
          "spectral_gap": 0.001872456632554531,
          "singular_value_ratio": -0.0013450533151626587,
          "layerwise_effective_rank": -0.002345075597986579,
          "layerwise_effective_rank_mergeability_score": 0.0033561561722308397,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.014298549853265285,
          "task_vector_dot_product": -0.002441608114168048,
          "weight_space_angle": 0.0011576928663998842,
          "task_vector_magnitude_ratio": -0.001702269073575735,
          "singular_value_overlap": 0.003908418584614992,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.010884804651141167,
          "activation_l2_distance": -0.004723794758319855,
          "activation_cosine_similarity": 0.02964034304022789,
          "activation_magnitude_ratio": -0.0020637144334614277,
          "activation_dot_product": 0.00542818196117878,
          "encoder_gradient_cosine_similarity": 0.00177172408439219,
          "encoder_gradient_l2_distance": -0.06673489511013031,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0018217565957456827,
          "input_gradient_l2_distance": -0.06397051364183426,
          "input_gradient_dot_product": -0.005294123664498329
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.793324840347617,
        "val_r": 0.3752508647756753,
        "n_iterations": 348,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02648795396089554,
          "right_subspace_overlap_bottom_k": -0.026196200400590897,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0015534237027168274,
          "singular_value_ratio": 0.0011891598114743829,
          "layerwise_effective_rank": -0.0025411027017980814,
          "layerwise_effective_rank_mergeability_score": 0.0017523241695016623,
          "task_vector_cosine_similarity": -0.0014325263909995556,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0021872972138226032,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.001958777429535985,
          "subspace_overlap": -0.0056177470833063126,
          "right_subspace_overlap": 0.011394129134714603,
          "activation_l2_distance": -0.0017049160087481141,
          "activation_cosine_similarity": 0.02136583812534809,
          "activation_magnitude_ratio": -0.0014903763076290488,
          "activation_dot_product": 0.005718467757105827,
          "encoder_gradient_cosine_similarity": 0.005513570737093687,
          "encoder_gradient_l2_distance": -0.05814121663570404,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0018379519460722804,
          "input_gradient_l2_distance": -0.022040730342268944,
          "input_gradient_dot_product": -0.008500522933900356
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.8265824963423563,
        "val_r": 0.7064807919917905,
        "n_iterations": 248,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.003459973493590951,
          "right_subspace_overlap_bottom_k": -0.0012748793233186007,
          "interaction_matrix_overlap_top_k": -0.003330135252326727,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.002277329796925187,
          "spectral_gap": 0.0013750221114605665,
          "singular_value_ratio": -0.002032308140769601,
          "layerwise_effective_rank": -0.001395418425090611,
          "layerwise_effective_rank_mergeability_score": 0.002152122324332595,
          "task_vector_cosine_similarity": -0.001144513487815857,
          "task_vector_l2_distance": -0.0312536396086216,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.002463025040924549,
          "singular_value_overlap": -0.0034787904005497694,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.013982431031763554,
          "activation_magnitude_ratio": -0.003063442185521126,
          "activation_dot_product": 0.037977010011672974,
          "encoder_gradient_cosine_similarity": 0.0019272355129942298,
          "encoder_gradient_l2_distance": -0.06469450145959854,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.007832312025129795,
          "input_gradient_l2_distance": -0.058272115886211395,
          "input_gradient_dot_product": -0.0062330723740160465
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.3,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train_r": 0.3969919351551527,
      "train_p": 4.2744540672952456e-122,
      "val_r": 0.06638532008320312,
      "val_p": 0.21018420497155335
    },
    "per_fold_stats": {
      "train_r_mean": 0.5886771611431418,
      "train_r_std": 0.06504344261757135,
      "val_r_mean": 0.45068477523106826,
      "val_r_std": 0.17596868409316313,
      "n_nonzero_mean": 19.85,
      "n_nonzero_std": 3.380458548777074
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.003782773856073618,
      "right_subspace_overlap_bottom_k": -0.0016126602422446012,
      "interaction_matrix_overlap_top_k": 3.919284790754318e-05,
      "interaction_matrix_overlap_bottom_k": 0.02263762429356575,
      "effective_rank": -0.0009269095025956631,
      "effective_rank_mergeability_score": 0.0011344959493726492,
      "stable_rank": -0.0008139209821820259,
      "spectral_gap": 0.0002752138243522495,
      "singular_value_ratio": -0.00040968164103105664,
      "layerwise_effective_rank": -7.422269118251279e-05,
      "layerwise_effective_rank_mergeability_score": 7.365470810327679e-05,
      "task_vector_cosine_similarity": -0.001376676606014371,
      "task_vector_l2_distance": -0.021419819444417953,
      "task_vector_dot_product": -0.0008720580372028053,
      "weight_space_angle": 0.0009181160712614655,
      "task_vector_magnitude_ratio": -0.004384725354611874,
      "singular_value_overlap": -0.015078742988407612,
      "subspace_overlap": 0.0030640901532024145,
      "right_subspace_overlap": 0.003953299019485712,
      "activation_l2_distance": -0.0007296672556549311,
      "activation_cosine_similarity": 0.004410469904541969,
      "activation_magnitude_ratio": -0.003674296196550131,
      "activation_dot_product": 0.0031240207608789206,
      "encoder_gradient_cosine_similarity": 0.0013526377733796835,
      "encoder_gradient_l2_distance": -0.026707783341407776,
      "encoder_gradient_dot_product": 0.0014674466801807284,
      "input_gradient_cosine_similarity": 0.0016204711282625794,
      "input_gradient_l2_distance": -0.026874344795942307,
      "input_gradient_dot_product": -0.00783727876842022
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.004989170003682375,
      "right_subspace_overlap_bottom_k": 0.008167548105120659,
      "interaction_matrix_overlap_top_k": 0.0024676055181771517,
      "interaction_matrix_overlap_bottom_k": 0.008478006348013878,
      "effective_rank": 0.0013631018809974194,
      "effective_rank_mergeability_score": 0.0015160468174144626,
      "stable_rank": 0.0012111476389691234,
      "spectral_gap": 0.00091951759532094,
      "singular_value_ratio": 0.0009574048453941941,
      "layerwise_effective_rank": 0.001077749882824719,
      "layerwise_effective_rank_mergeability_score": 0.0016378131695091724,
      "task_vector_cosine_similarity": 0.002594121266156435,
      "task_vector_l2_distance": 0.011569597758352757,
      "task_vector_dot_product": 0.003976170904934406,
      "weight_space_angle": 0.002751634456217289,
      "task_vector_magnitude_ratio": 0.0018921077717095613,
      "singular_value_overlap": 0.007941373623907566,
      "subspace_overlap": 0.004105299711227417,
      "right_subspace_overlap": 0.005735222715884447,
      "activation_l2_distance": 0.0030209971591830254,
      "activation_cosine_similarity": 0.0052911462262272835,
      "activation_magnitude_ratio": 0.0022261522244662046,
      "activation_dot_product": 0.004497924819588661,
      "encoder_gradient_cosine_similarity": 0.0013251072959974408,
      "encoder_gradient_l2_distance": 0.013947958126664162,
      "encoder_gradient_dot_product": 0.001985466806218028,
      "input_gradient_cosine_similarity": 0.0017180655850097537,
      "input_gradient_l2_distance": 0.01668107695877552,
      "input_gradient_dot_product": 0.005649831146001816
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.8,
      "right_subspace_overlap_bottom_k": 0.85,
      "interaction_matrix_overlap_top_k": 0.5,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 0.4,
      "effective_rank_mergeability_score": 0.55,
      "stable_rank": 0.5,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.35,
      "layerwise_effective_rank": 0.4,
      "layerwise_effective_rank_mergeability_score": 0.35,
      "task_vector_cosine_similarity": 0.6,
      "task_vector_l2_distance": 0.95,
      "task_vector_dot_product": 0.6,
      "weight_space_angle": 0.65,
      "task_vector_magnitude_ratio": 0.95,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.7,
      "right_subspace_overlap": 0.65,
      "activation_l2_distance": 0.75,
      "activation_cosine_similarity": 0.8,
      "activation_magnitude_ratio": 0.9,
      "activation_dot_product": 0.8,
      "encoder_gradient_cosine_similarity": 0.6,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.45,
      "input_gradient_cosine_similarity": 0.55,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 0.9
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.62598268311578,
        "val_r": 0.6069644376601067,
        "n_iterations": 482,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0027112921234220266,
          "right_subspace_overlap_bottom_k": 0.006611906923353672,
          "interaction_matrix_overlap_top_k": -0.0019699796102941036,
          "interaction_matrix_overlap_bottom_k": 0.032874200493097305,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0010580765083432198,
          "layerwise_effective_rank": 0.0028221013490110636,
          "layerwise_effective_rank_mergeability_score": -0.0039050057530403137,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0321345254778862,
          "task_vector_dot_product": -0.003933998756110668,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.00610487861558795,
          "singular_value_overlap": -0.029399026185274124,
          "subspace_overlap": 0.015052501112222672,
          "right_subspace_overlap": 0.0014592737425118685,
          "activation_l2_distance": -0.0012064268812537193,
          "activation_cosine_similarity": 0.010025318711996078,
          "activation_magnitude_ratio": -0.010392112657427788,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.034717585891485214,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.004944451153278351,
          "input_gradient_l2_distance": -0.03056325763463974,
          "input_gradient_dot_product": -0.007859572768211365
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.47742064573700466,
        "val_r": 0.4149946628671065,
        "n_iterations": 317,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00605149008333683,
          "right_subspace_overlap_bottom_k": -0.010352012701332569,
          "interaction_matrix_overlap_top_k": 0.0016768991481512785,
          "interaction_matrix_overlap_bottom_k": 0.024332385510206223,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0014189973007887602,
          "spectral_gap": -0.001624859170988202,
          "singular_value_ratio": 0.0017392014851793647,
          "layerwise_effective_rank": 0.0014829867286607623,
          "layerwise_effective_rank_mergeability_score": -0.001912758918479085,
          "task_vector_cosine_similarity": 0.0010974827455356717,
          "task_vector_l2_distance": -0.00920994020998478,
          "task_vector_dot_product": 0.0022897357121109962,
          "weight_space_angle": -0.0028311586938798428,
          "task_vector_magnitude_ratio": -0.004225633107125759,
          "singular_value_overlap": -0.00555286044254899,
          "subspace_overlap": 0.0026813976000994444,
          "right_subspace_overlap": 0.004424413666129112,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.003307162318378687,
          "activation_magnitude_ratio": -0.0015295286430045962,
          "activation_dot_product": 0.004668941721320152,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014745364896953106,
          "encoder_gradient_dot_product": 0.003107246942818165,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01559995487332344,
          "input_gradient_dot_product": -0.0049713049083948135
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.550082604806365,
        "val_r": 0.5444917628831509,
        "n_iterations": 215,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00864087138324976,
          "right_subspace_overlap_bottom_k": -0.008983196690678596,
          "interaction_matrix_overlap_top_k": 0.0025953773874789476,
          "interaction_matrix_overlap_bottom_k": 0.016862036660313606,
          "effective_rank": -0.002775118686258793,
          "effective_rank_mergeability_score": 0.002072329632937908,
          "stable_rank": -0.001963934162631631,
          "spectral_gap": 0.0015397162642329931,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0015531667741015553,
          "layerwise_effective_rank_mergeability_score": 0.0011188734788447618,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012248340994119644,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.002720718737691641,
          "task_vector_magnitude_ratio": -0.006185466889292002,
          "singular_value_overlap": -0.014468288980424404,
          "subspace_overlap": 0.002102792728692293,
          "right_subspace_overlap": 0.002890111645683646,
          "activation_l2_distance": -0.00113798794336617,
          "activation_cosine_similarity": 0.0050964439287781715,
          "activation_magnitude_ratio": -0.005145775619894266,
          "activation_dot_product": 0.0027657360769808292,
          "encoder_gradient_cosine_similarity": 0.0020676911808550358,
          "encoder_gradient_l2_distance": -0.01917426474392414,
          "encoder_gradient_dot_product": 0.003126688301563263,
          "input_gradient_cosine_similarity": 0.0014000269584357738,
          "input_gradient_l2_distance": -0.024122724309563637,
          "input_gradient_dot_product": -0.01518973521888256
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5654733255226047,
        "val_r": 0.41536706901372233,
        "n_iterations": 276,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004074949771165848,
          "right_subspace_overlap_bottom_k": -0.008789895102381706,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.02106073684990406,
          "effective_rank": -0.0014471448957920074,
          "effective_rank_mergeability_score": 0.0014554124791175127,
          "stable_rank": -0.001483917934820056,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0011165683390572667,
          "task_vector_l2_distance": -0.01214651484042406,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.006253329571336508,
          "singular_value_overlap": -0.010230659507215023,
          "subspace_overlap": 0.0023111216723918915,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0012222264194861054,
          "activation_cosine_similarity": 0.0022414447739720345,
          "activation_magnitude_ratio": -0.0024976427666842937,
          "activation_dot_product": 0.0032684565521776676,
          "encoder_gradient_cosine_similarity": 0.001224359730258584,
          "encoder_gradient_l2_distance": -0.011838630773127079,
          "encoder_gradient_dot_product": 0.003973703365772963,
          "input_gradient_cosine_similarity": 0.0017384011298418045,
          "input_gradient_l2_distance": -0.01396102923899889,
          "input_gradient_dot_product": -0.0072121829725801945
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6342907731030996,
        "val_r": 0.7332804981536657,
        "n_iterations": 405,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.00399859668686986,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.033627402037382126,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0014466664288192987,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0011358840856701136,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02765839174389839,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010326531482860446,
          "task_vector_magnitude_ratio": -0.003355965716764331,
          "singular_value_overlap": -0.018375828862190247,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0011152717052027583,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.004530394449830055,
          "activation_dot_product": 0.0022279543336480856,
          "encoder_gradient_cosine_similarity": 0.0013564021792262793,
          "encoder_gradient_l2_distance": -0.01761046051979065,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.002695862203836441,
          "input_gradient_l2_distance": -0.025880247354507446,
          "input_gradient_dot_product": -0.0023263334296643734
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.6109649631453478,
        "val_r": 0.6620668002364513,
        "n_iterations": 317,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0010259830160066485,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.02442559041082859,
          "effective_rank": -0.0015273533063009381,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0017164999153465033,
          "task_vector_l2_distance": -0.022187545895576477,
          "task_vector_dot_product": 0.0046730050817132,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0061234538443386555,
          "singular_value_overlap": -0.0149494968354702,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0013467057142406702,
          "activation_cosine_similarity": 0.0020077144727110863,
          "activation_magnitude_ratio": -0.0038837238680571318,
          "activation_dot_product": 0.002789819613099098,
          "encoder_gradient_cosine_similarity": 0.003128728596493602,
          "encoder_gradient_l2_distance": -0.022205332294106483,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.00277901953086257,
          "input_gradient_l2_distance": -0.01142074353992939,
          "input_gradient_dot_product": -0.006130892783403397
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5941591344957584,
        "val_r": 0.1420182043761619,
        "n_iterations": 271,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0018623759970068932,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.014939460903406143,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0010115024633705616,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0017795951571315527,
          "task_vector_l2_distance": -0.015300845727324486,
          "task_vector_dot_product": -0.0034842314198613167,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004405296873301268,
          "singular_value_overlap": -0.011105028912425041,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0012988531962037086,
          "activation_cosine_similarity": 0.0026525547727942467,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0020921325776726007,
          "encoder_gradient_l2_distance": -0.02470073103904724,
          "encoder_gradient_dot_product": 0.0031359673012048006,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0186931099742651,
          "input_gradient_dot_product": -0.0061933910474181175
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5456735748148034,
        "val_r": 0.218234676468107,
        "n_iterations": 296,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025540830101817846,
          "right_subspace_overlap_bottom_k": -0.006310112774372101,
          "interaction_matrix_overlap_top_k": -0.0020702520851045847,
          "interaction_matrix_overlap_bottom_k": 0.02584431879222393,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0010806478094309568,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.02205166406929493,
          "task_vector_dot_product": -0.0010230811312794685,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.005647765006870031,
          "singular_value_overlap": -0.016316015273332596,
          "subspace_overlap": 0.006132957059890032,
          "right_subspace_overlap": 0.004088551737368107,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.004580298438668251,
          "activation_magnitude_ratio": -0.005903948098421097,
          "activation_dot_product": 0.0010341686429455876,
          "encoder_gradient_cosine_similarity": 0.0020937081426382065,
          "encoder_gradient_l2_distance": -0.024023281410336494,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.013134424574673176,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5832961659278566,
        "val_r": 0.46817225310998656,
        "n_iterations": 367,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.017862267792224884,
          "right_subspace_overlap_bottom_k": 0.015222576446831226,
          "interaction_matrix_overlap_top_k": 0.0023496723733842373,
          "interaction_matrix_overlap_bottom_k": 0.025218866765499115,
          "effective_rank": -0.005202149040997028,
          "effective_rank_mergeability_score": 0.006594863720238209,
          "stable_rank": -0.0037083192728459835,
          "spectral_gap": 0.001671244390308857,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0011602991726249456,
          "layerwise_effective_rank_mergeability_score": 0.003534168004989624,
          "task_vector_cosine_similarity": -0.009298569522798061,
          "task_vector_l2_distance": -0.05171538516879082,
          "task_vector_dot_product": -0.013468698598444462,
          "weight_space_angle": 0.009384207427501678,
          "task_vector_magnitude_ratio": -0.003887744853273034,
          "singular_value_overlap": -0.036215849220752716,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.015501661226153374,
          "activation_l2_distance": -0.01001013908535242,
          "activation_cosine_similarity": 0.017028484493494034,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.009890276938676834,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.06874821335077286,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.07933884114027023,
          "input_gradient_dot_product": -0.019205957651138306
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5982035854472662,
        "val_r": 0.11118263810488499,
        "n_iterations": 216,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012849525082856417,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.02554757334291935,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0012429719790816307,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0017955484800040722,
          "task_vector_l2_distance": -0.02140290103852749,
          "task_vector_dot_product": 0.00208811042830348,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0028038639575242996,
          "singular_value_overlap": -0.014742684550583363,
          "subspace_overlap": 0.007869618944823742,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": -0.00716578122228384,
          "activation_magnitude_ratio": -0.002429869258776307,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0035320979077368975,
          "encoder_gradient_l2_distance": -0.017343884333968163,
          "encoder_gradient_dot_product": 0.0022991334553807974,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.024021346122026443,
          "input_gradient_dot_product": -0.005260368809103966
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5700026263246705,
        "val_r": 0.19174402064582424,
        "n_iterations": 285,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.008211788721382618,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.028891686350107193,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0015946872299537063,
          "stable_rank": -0.0015866563189774752,
          "spectral_gap": 0.0011684262426570058,
          "singular_value_ratio": -0.001028523431159556,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0344122014939785,
          "task_vector_dot_product": 0.0020368006080389023,
          "weight_space_angle": 0.0016669894102960825,
          "task_vector_magnitude_ratio": -0.003190940711647272,
          "singular_value_overlap": -0.01802612841129303,
          "subspace_overlap": 0.0023875765036791563,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0011961404234170914,
          "activation_cosine_similarity": 0.002780165756121278,
          "activation_magnitude_ratio": -0.004539423156529665,
          "activation_dot_product": 0.009351343847811222,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.038478750735521317,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.019502807408571243,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5396948308400396,
        "val_r": 0.4691565843375923,
        "n_iterations": 208,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0020308338571339846,
          "right_subspace_overlap_bottom_k": -0.008749177679419518,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.018698707222938538,
          "effective_rank": -0.0026335171423852444,
          "effective_rank_mergeability_score": 0.0027776637580245733,
          "stable_rank": -0.0027884971350431442,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.001917990273796022,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.004837851971387863,
          "task_vector_l2_distance": -0.012224910780787468,
          "task_vector_dot_product": -0.00366635131649673,
          "weight_space_angle": 0.0042332373559474945,
          "task_vector_magnitude_ratio": -0.0062951561994850636,
          "singular_value_overlap": -0.015345431864261627,
          "subspace_overlap": 0.007730948273092508,
          "right_subspace_overlap": 0.009389771148562431,
          "activation_l2_distance": -0.004846248310059309,
          "activation_cosine_similarity": 0.005613371264189482,
          "activation_magnitude_ratio": -0.004692621063441038,
          "activation_dot_product": 0.0019461135379970074,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.022736918181180954,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0030732606537640095,
          "input_gradient_l2_distance": -0.026746651157736778,
          "input_gradient_dot_product": -0.010087172500789165
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5672930912602308,
        "val_r": 0.4907708629962491,
        "n_iterations": 217,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0034816686529666185,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.027981339022517204,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.020368337631225586,
          "task_vector_dot_product": 0.005801868159323931,
          "weight_space_angle": -0.0021740305237472057,
          "task_vector_magnitude_ratio": -0.005218622274696827,
          "singular_value_overlap": -0.013299915008246899,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0022318821866065264,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0018159919418394566,
          "activation_dot_product": 0.006954758893698454,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.021638624370098114,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0028000171296298504,
          "input_gradient_l2_distance": -0.017894292250275612,
          "input_gradient_dot_product": -0.007077984511852264
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5510972676849942,
        "val_r": 0.6379396901828287,
        "n_iterations": 343,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01172013022005558,
          "right_subspace_overlap_bottom_k": -0.005743416491895914,
          "interaction_matrix_overlap_top_k": 0.0048704142682254314,
          "interaction_matrix_overlap_bottom_k": 0.022783061489462852,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.001069835969246924,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0014590146020054817,
          "layerwise_effective_rank_mergeability_score": -0.0023767086677253246,
          "task_vector_cosine_similarity": -0.0011444611009210348,
          "task_vector_l2_distance": -0.020671773701906204,
          "task_vector_dot_product": -0.004782233387231827,
          "weight_space_angle": 0.0012193178990855813,
          "task_vector_magnitude_ratio": -0.002111252164468169,
          "singular_value_overlap": -0.022601371631026268,
          "subspace_overlap": 0.008383545093238354,
          "right_subspace_overlap": 0.011000371538102627,
          "activation_l2_distance": -0.004465809091925621,
          "activation_cosine_similarity": 0.009507899172604084,
          "activation_magnitude_ratio": -0.002973764669150114,
          "activation_dot_product": 0.0012340706307440996,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.04150902107357979,
          "encoder_gradient_dot_product": 0.007696888875216246,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.04768839851021767,
          "input_gradient_dot_product": -0.023274550214409828
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.4866480605935888,
        "val_r": 0.6126121041482812,
        "n_iterations": 234,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.008123998530209064,
          "interaction_matrix_overlap_top_k": -0.0023063826374709606,
          "interaction_matrix_overlap_bottom_k": 0.011876455508172512,
          "effective_rank": -0.001768458285368979,
          "effective_rank_mergeability_score": 0.0018348186276853085,
          "stable_rank": -0.0023255026899278164,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.01133954431861639,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0031460258178412914,
          "task_vector_magnitude_ratio": -0.004816416185349226,
          "singular_value_overlap": -0.009605800732970238,
          "subspace_overlap": 0.0013536268379539251,
          "right_subspace_overlap": 0.0041817910969257355,
          "activation_l2_distance": -0.0010227428283542395,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.004670524969696999,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0011449818266555667,
          "encoder_gradient_l2_distance": -0.013578797690570354,
          "encoder_gradient_dot_product": 0.0021319000516086817,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015407631173729897,
          "input_gradient_dot_product": -0.004800369497388601
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.607790473972281,
        "val_r": 0.3177408248671441,
        "n_iterations": 255,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.004240983631461859,
          "right_subspace_overlap_bottom_k": -0.005693979095667601,
          "interaction_matrix_overlap_top_k": 0.0018480815924704075,
          "interaction_matrix_overlap_bottom_k": 0.014391524717211723,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0011983360163867474,
          "stable_rank": -0.0012794057838618755,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.013590481132268906,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0010090830037370324,
          "task_vector_magnitude_ratio": -0.006317033898085356,
          "singular_value_overlap": -0.0036585612688213587,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.00545478006824851,
          "activation_l2_distance": 0.0023327814415097237,
          "activation_cosine_similarity": 0.004443441983312368,
          "activation_magnitude_ratio": -0.0027804579585790634,
          "activation_dot_product": 0.0019350413931533694,
          "encoder_gradient_cosine_similarity": 0.0010693459771573544,
          "encoder_gradient_l2_distance": -0.015038993209600449,
          "encoder_gradient_dot_product": 0.0023017143830657005,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.0157734677195549,
          "input_gradient_dot_product": -0.0087199155241251
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.6142691436932504,
        "val_r": 0.5047744565517832,
        "n_iterations": 256,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0025929659605026245,
          "right_subspace_overlap_bottom_k": -0.0020835930481553078,
          "interaction_matrix_overlap_top_k": 0.0017343799117952585,
          "interaction_matrix_overlap_bottom_k": 0.020968738943338394,
          "effective_rank": -0.0014915346400812268,
          "effective_rank_mergeability_score": 0.001078072702512145,
          "stable_rank": -0.0015496821142733097,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0030157282017171383,
          "task_vector_l2_distance": -0.020308734849095345,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0037698366213589907,
          "task_vector_magnitude_ratio": -0.0023042752873152494,
          "singular_value_overlap": -0.011441349051892757,
          "subspace_overlap": 0.0028176300693303347,
          "right_subspace_overlap": 0.002299138344824314,
          "activation_l2_distance": 0.004637942183762789,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0035954974591732025,
          "activation_dot_product": 0.011127224192023277,
          "encoder_gradient_cosine_similarity": 0.0023109051398932934,
          "encoder_gradient_l2_distance": -0.015150452964007854,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.004774636588990688,
          "input_gradient_l2_distance": -0.01519726775586605,
          "input_gradient_dot_product": -0.0064687873236835
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6008037845467854,
        "val_r": 0.3883841107661064,
        "n_iterations": 226,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0018182151252403855,
          "right_subspace_overlap_bottom_k": 0.0169275663793087,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0400463230907917,
          "effective_rank": -0.0016929141711443663,
          "effective_rank_mergeability_score": 0.0013940958306193352,
          "stable_rank": 0.0,
          "spectral_gap": 0.001270742155611515,
          "singular_value_ratio": -0.0025280455593019724,
          "layerwise_effective_rank": -0.0014480819227173924,
          "layerwise_effective_rank_mergeability_score": 0.0013060690835118294,
          "task_vector_cosine_similarity": -0.0010366698261350393,
          "task_vector_l2_distance": -0.037593405693769455,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.0021712842863053083,
          "task_vector_magnitude_ratio": -0.0014855992048978806,
          "singular_value_overlap": -0.014400534331798553,
          "subspace_overlap": 0.0010845991782844067,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0014314244035631418,
          "activation_cosine_similarity": 0.006204295437783003,
          "activation_magnitude_ratio": -0.004362908191978931,
          "activation_dot_product": 0.006908752024173737,
          "encoder_gradient_cosine_similarity": 0.0029922088142484426,
          "encoder_gradient_l2_distance": -0.032044339925050735,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.001054086023941636,
          "input_gradient_l2_distance": -0.05690222233533859,
          "input_gradient_dot_product": -0.0035247216001152992
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7985743096227778,
        "val_r": 0.6485117998611863,
        "n_iterations": 211,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.011859321966767311,
          "right_subspace_overlap_bottom_k": -0.01314103975892067,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0020063607953488827,
          "layerwise_effective_rank_mergeability_score": 0.003708456875756383,
          "task_vector_cosine_similarity": -0.005639017093926668,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.003972087521106005,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.0011898300144821405,
          "subspace_overlap": -0.003443934489041567,
          "right_subspace_overlap": 0.02028021402657032,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.014819180592894554,
          "activation_magnitude_ratio": -0.002555566607043147,
          "activation_dot_product": 0.007341211196035147,
          "encoder_gradient_cosine_similarity": 0.004040193278342485,
          "encoder_gradient_l2_distance": -0.050453417003154755,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.00401134230196476,
          "input_gradient_l2_distance": -0.02723843976855278,
          "input_gradient_dot_product": -0.0104000149294734
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.6518221782083343,
        "val_r": 0.43528804739102533,
        "n_iterations": 295,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0026232823729515076,
          "right_subspace_overlap_bottom_k": 0.00622364180162549,
          "interaction_matrix_overlap_top_k": -0.007944352924823761,
          "interaction_matrix_overlap_bottom_k": 0.022382063791155815,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0025488429237157106,
          "singular_value_ratio": -0.0022643140982836485,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.002749495906755328,
          "task_vector_l2_distance": -0.03183097764849663,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": -0.00264327647164464,
          "task_vector_magnitude_ratio": -0.006961815524846315,
          "singular_value_overlap": -0.020650213584303856,
          "subspace_overlap": 0.004817422479391098,
          "right_subspace_overlap": -0.0030193733982741833,
          "activation_l2_distance": -0.0023108285386115313,
          "activation_cosine_similarity": 0.005067398771643639,
          "activation_magnitude_ratio": -0.005186174996197224,
          "activation_dot_product": 0.008817099034786224,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.02841861918568611,
          "encoder_gradient_dot_product": 0.0015756909269839525,
          "input_gradient_cosine_similarity": 0.0031383181922137737,
          "input_gradient_l2_distance": -0.038400039076805115,
          "input_gradient_dot_product": -0.00804232619702816
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.3,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train_r": 0.5010419584391026,
      "train_p": 2.1049678397900135e-204,
      "val_r": 0.41113439539811647,
      "val_p": 4.922731681055768e-16
    },
    "per_fold_stats": {
      "train_r_mean": 0.752321260744318,
      "train_r_std": 0.08611818002791922,
      "val_r_mean": 0.6339301494701856,
      "val_r_std": 0.15659200054753425,
      "n_nonzero_mean": 20.65,
      "n_nonzero_std": 3.539420856580918
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.016838764771819115,
      "right_subspace_overlap_bottom_k": -0.03344161808490753,
      "interaction_matrix_overlap_top_k": 0.0006631833384744823,
      "interaction_matrix_overlap_bottom_k": 0.0016059704357758164,
      "effective_rank": 0.00019854112179018557,
      "effective_rank_mergeability_score": -2.7453818347566994e-06,
      "stable_rank": -0.00030911111389286816,
      "spectral_gap": -0.0004718953277915716,
      "singular_value_ratio": 0.0001685471652308479,
      "layerwise_effective_rank": -0.0017879221122711897,
      "layerwise_effective_rank_mergeability_score": 0.0015745064010843635,
      "task_vector_cosine_similarity": -0.0009089120430871844,
      "task_vector_l2_distance": -0.0009186530369333923,
      "task_vector_dot_product": -0.0009273619507439435,
      "weight_space_angle": 0.0013329994399100542,
      "task_vector_magnitude_ratio": 5.407524440670386e-05,
      "singular_value_overlap": 0.011035998351871967,
      "subspace_overlap": -0.0033972300589084625,
      "right_subspace_overlap": 0.018766013905405998,
      "activation_l2_distance": -0.0019305748865008354,
      "activation_cosine_similarity": 0.025048842653632164,
      "activation_magnitude_ratio": -0.0037035257555544376,
      "activation_dot_product": 0.0052244109101593494,
      "encoder_gradient_cosine_similarity": 0.004467204678803682,
      "encoder_gradient_l2_distance": -0.045101098716259,
      "encoder_gradient_dot_product": 3.6587203794624656e-05,
      "input_gradient_cosine_similarity": 0.0019958908669650555,
      "input_gradient_l2_distance": -0.025163492187857628,
      "input_gradient_dot_product": -0.003373838495463133
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.007814173586666584,
      "right_subspace_overlap_bottom_k": 0.00837439950555563,
      "interaction_matrix_overlap_top_k": 0.0035862051881849766,
      "interaction_matrix_overlap_bottom_k": 0.005865986924618483,
      "effective_rank": 0.0010545362019911408,
      "effective_rank_mergeability_score": 0.0011886422289535403,
      "stable_rank": 0.0009012783411890268,
      "spectral_gap": 0.0013872174313291907,
      "singular_value_ratio": 0.0016944174421951175,
      "layerwise_effective_rank": 0.002283903071656823,
      "layerwise_effective_rank_mergeability_score": 0.0024355240166187286,
      "task_vector_cosine_similarity": 0.004853693302720785,
      "task_vector_l2_distance": 0.005135438870638609,
      "task_vector_dot_product": 0.0038649989292025566,
      "weight_space_angle": 0.004675930831581354,
      "task_vector_magnitude_ratio": 0.0014355108141899109,
      "singular_value_overlap": 0.008168491534888744,
      "subspace_overlap": 0.00390060106292367,
      "right_subspace_overlap": 0.008578899316489697,
      "activation_l2_distance": 0.005541592836380005,
      "activation_cosine_similarity": 0.010923724621534348,
      "activation_magnitude_ratio": 0.0036924208980053663,
      "activation_dot_product": 0.017628155648708344,
      "encoder_gradient_cosine_similarity": 0.002315024845302105,
      "encoder_gradient_l2_distance": 0.024775903671979904,
      "encoder_gradient_dot_product": 0.0013508412521332502,
      "input_gradient_cosine_similarity": 0.0034671705216169357,
      "input_gradient_l2_distance": 0.01853375881910324,
      "input_gradient_dot_product": 0.002965184859931469
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 1.0,
      "right_subspace_overlap_bottom_k": 1.0,
      "interaction_matrix_overlap_top_k": 0.6,
      "interaction_matrix_overlap_bottom_k": 0.7,
      "effective_rank": 0.4,
      "effective_rank_mergeability_score": 0.3,
      "stable_rank": 0.25,
      "spectral_gap": 0.35,
      "singular_value_ratio": 0.35,
      "layerwise_effective_rank": 0.7,
      "layerwise_effective_rank_mergeability_score": 0.6,
      "task_vector_cosine_similarity": 0.65,
      "task_vector_l2_distance": 0.85,
      "task_vector_dot_product": 0.7,
      "weight_space_angle": 0.7,
      "task_vector_magnitude_ratio": 0.3,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 0.7,
      "right_subspace_overlap": 0.95,
      "activation_l2_distance": 1.0,
      "activation_cosine_similarity": 0.95,
      "activation_magnitude_ratio": 0.9,
      "activation_dot_product": 0.9,
      "encoder_gradient_cosine_similarity": 0.95,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.4,
      "input_gradient_cosine_similarity": 0.6,
      "input_gradient_l2_distance": 0.95,
      "input_gradient_dot_product": 0.9
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7699896473857593,
        "val_r": 0.5799781924450426,
        "n_iterations": 265,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.009458289481699467,
          "right_subspace_overlap_bottom_k": -0.028161603957414627,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.008411013521254063,
          "effective_rank": 0.0010897618485614657,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.00110152130946517,
          "singular_value_ratio": 0.0013218398671597242,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.0036956341937184334,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.003327519865706563,
          "weight_space_angle": 0.002803863026201725,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005551824811846018,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.018300892785191536,
          "activation_l2_distance": -0.001755217439495027,
          "activation_cosine_similarity": 0.022714775055646896,
          "activation_magnitude_ratio": -0.006470154505223036,
          "activation_dot_product": -0.0013992944732308388,
          "encoder_gradient_cosine_similarity": 0.0023605653550475836,
          "encoder_gradient_l2_distance": -0.036477409303188324,
          "encoder_gradient_dot_product": -0.0013625819701701403,
          "input_gradient_cosine_similarity": 0.001425337279215455,
          "input_gradient_l2_distance": -0.01933632791042328,
          "input_gradient_dot_product": -0.005019378382712603
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7574870530118776,
        "val_r": 0.7987633220869355,
        "n_iterations": 238,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.018910448998212814,
          "right_subspace_overlap_bottom_k": -0.04376354068517685,
          "interaction_matrix_overlap_top_k": 0.0017886771820485592,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012975451536476612,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0010801150929182768,
          "layerwise_effective_rank_mergeability_score": 0.0014919156674295664,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.008682291023433208,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.012224880047142506,
          "subspace_overlap": 0.0017077355878427625,
          "right_subspace_overlap": 0.031250081956386566,
          "activation_l2_distance": -0.002373032970353961,
          "activation_cosine_similarity": 0.044331181794404984,
          "activation_magnitude_ratio": -0.0067260717041790485,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0016687549650669098,
          "encoder_gradient_l2_distance": -0.07878421992063522,
          "encoder_gradient_dot_product": 0.0017164071323350072,
          "input_gradient_cosine_similarity": 0.0011870920425280929,
          "input_gradient_l2_distance": -0.043496642261743546,
          "input_gradient_dot_product": -0.002694809576496482
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.3853961407627781,
        "val_r": 0.5187495553419181,
        "n_iterations": 334,
        "n_nonzero_coefficients": 26,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.003445527981966734,
          "right_subspace_overlap_bottom_k": -0.021755153313279152,
          "interaction_matrix_overlap_top_k": -0.002066396176815033,
          "interaction_matrix_overlap_bottom_k": 0.007947539910674095,
          "effective_rank": -0.0017405026592314243,
          "effective_rank_mergeability_score": 0.002821630798280239,
          "stable_rank": -0.0033020121045410633,
          "spectral_gap": 0.00323827238753438,
          "singular_value_ratio": -0.003761706408113241,
          "layerwise_effective_rank": -0.005884931422770023,
          "layerwise_effective_rank_mergeability_score": 0.007271526847034693,
          "task_vector_cosine_similarity": 0.001942767295986414,
          "task_vector_l2_distance": -0.0035582315176725388,
          "task_vector_dot_product": -0.0017129969783127308,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0033873848151415586,
          "singular_value_overlap": 0.0013192819897085428,
          "subspace_overlap": -0.010041161440312862,
          "right_subspace_overlap": 0.019280163571238518,
          "activation_l2_distance": 0.006053382530808449,
          "activation_cosine_similarity": 0.01895803213119507,
          "activation_magnitude_ratio": -0.0027459925040602684,
          "activation_dot_product": -0.003311010543256998,
          "encoder_gradient_cosine_similarity": 0.0012640038039535284,
          "encoder_gradient_l2_distance": -0.009722634218633175,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010558000765740871,
          "input_gradient_dot_product": -0.004233225714415312
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7481528857964836,
        "val_r": 0.7074417502887235,
        "n_iterations": 237,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01774042472243309,
          "right_subspace_overlap_bottom_k": -0.03539867699146271,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0013218207750469446,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.002483920892700553,
          "singular_value_ratio": 0.0022011350374668837,
          "layerwise_effective_rank": -0.003591397078707814,
          "layerwise_effective_rank_mergeability_score": 0.004399905446916819,
          "task_vector_cosine_similarity": -0.007364509627223015,
          "task_vector_l2_distance": -0.003194466233253479,
          "task_vector_dot_product": -0.002682430436834693,
          "weight_space_angle": 0.003110448829829693,
          "task_vector_magnitude_ratio": 0.0020502840634435415,
          "singular_value_overlap": 0.01635180599987507,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.03279640153050423,
          "activation_l2_distance": -0.0029436710756272078,
          "activation_cosine_similarity": 0.022302042692899704,
          "activation_magnitude_ratio": -0.005385689903050661,
          "activation_dot_product": 0.013732915744185448,
          "encoder_gradient_cosine_similarity": 0.00527321919798851,
          "encoder_gradient_l2_distance": -0.07222457975149155,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.035447895526885986,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7700296953466099,
        "val_r": 0.7702020608264998,
        "n_iterations": 301,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.025250134989619255,
          "right_subspace_overlap_bottom_k": -0.037915438413619995,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0016190198948606849,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.004528526682406664,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.007797308266162872,
          "subspace_overlap": -0.001056171371601522,
          "right_subspace_overlap": 0.01631624810397625,
          "activation_l2_distance": 0.0017123720608651638,
          "activation_cosine_similarity": 0.03802676126360893,
          "activation_magnitude_ratio": -0.0030600139871239662,
          "activation_dot_product": -0.004804419353604317,
          "encoder_gradient_cosine_similarity": 0.0059656379744410515,
          "encoder_gradient_l2_distance": -0.05292496457695961,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003832542337477207,
          "input_gradient_l2_distance": -0.01567360758781433,
          "input_gradient_dot_product": -0.00411309115588665
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7688812261420489,
        "val_r": 0.7127934638401079,
        "n_iterations": 230,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014735122211277485,
          "right_subspace_overlap_bottom_k": -0.03034292347729206,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0019040919141843915,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003665668424218893,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.009948953054845333,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.009709886275231838,
          "activation_l2_distance": 0.00170164555311203,
          "activation_cosine_similarity": 0.03893569856882095,
          "activation_magnitude_ratio": -0.0015289245638996363,
          "activation_dot_product": -0.0021684470120817423,
          "encoder_gradient_cosine_similarity": 0.0071237413212656975,
          "encoder_gradient_l2_distance": -0.04895995184779167,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0029169730842113495,
          "input_gradient_l2_distance": 0.0,
          "input_gradient_dot_product": -0.004003751557320356
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.777837874977334,
        "val_r": 0.6971400075830951,
        "n_iterations": 332,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01652803272008896,
          "right_subspace_overlap_bottom_k": -0.034826721996068954,
          "interaction_matrix_overlap_top_k": -0.0014636680716648698,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0013163771945983171,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0011134515516459942,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.00540512427687645,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.00922065693885088,
          "subspace_overlap": -0.0031616846099495888,
          "right_subspace_overlap": 0.010241164825856686,
          "activation_l2_distance": -0.004509790800511837,
          "activation_cosine_similarity": 0.023357780650258064,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.006740889977663755,
          "encoder_gradient_cosine_similarity": 0.007190857082605362,
          "encoder_gradient_l2_distance": -0.041836585849523544,
          "encoder_gradient_dot_product": 0.0016327484045177698,
          "input_gradient_cosine_similarity": -0.0012281432282179594,
          "input_gradient_l2_distance": -0.00986893568187952,
          "input_gradient_dot_product": -0.004431502427905798
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7521300998933087,
        "val_r": 0.30633858711265183,
        "n_iterations": 325,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.024706749245524406,
          "right_subspace_overlap_bottom_k": -0.04130015894770622,
          "interaction_matrix_overlap_top_k": 0.004378859885036945,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0016879650065675378,
          "spectral_gap": -0.002276569837704301,
          "singular_value_ratio": 0.0020978753454983234,
          "layerwise_effective_rank": -0.0012999260798096657,
          "layerwise_effective_rank_mergeability_score": 0.003095767227932811,
          "task_vector_cosine_similarity": -0.010330046527087688,
          "task_vector_l2_distance": -0.005766547285020351,
          "task_vector_dot_product": -0.0010093064047396183,
          "weight_space_angle": 0.013612581416964531,
          "task_vector_magnitude_ratio": 0.0016548134153708816,
          "singular_value_overlap": 0.015735667198896408,
          "subspace_overlap": -0.0036057245451956987,
          "right_subspace_overlap": 0.023340782150626183,
          "activation_l2_distance": -0.012665909714996815,
          "activation_cosine_similarity": 0.023121746256947517,
          "activation_magnitude_ratio": -0.004828827455639839,
          "activation_dot_product": 0.010300792753696442,
          "encoder_gradient_cosine_similarity": 0.008952133357524872,
          "encoder_gradient_l2_distance": -0.060683511197566986,
          "encoder_gradient_dot_product": -0.001314123161137104,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.035480331629514694,
          "input_gradient_dot_product": 0.0034090224653482437
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.7955667767898834,
        "val_r": 0.3923637846421173,
        "n_iterations": 206,
        "n_nonzero_coefficients": 21,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.016810249537229538,
          "right_subspace_overlap_bottom_k": -0.04246967285871506,
          "interaction_matrix_overlap_top_k": 0.0015013858210295439,
          "interaction_matrix_overlap_bottom_k": 0.002833412028849125,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0062496354803442955,
          "layerwise_effective_rank_mergeability_score": 0.004748047795146704,
          "task_vector_cosine_similarity": -0.004264909774065018,
          "task_vector_l2_distance": 0.00285366945900023,
          "task_vector_dot_product": -0.003675454296171665,
          "weight_space_angle": 0.005386087112128735,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.006119220517575741,
          "subspace_overlap": -0.003088128287345171,
          "right_subspace_overlap": 0.028825024142861366,
          "activation_l2_distance": 0.002221824135631323,
          "activation_cosine_similarity": 0.036967236548662186,
          "activation_magnitude_ratio": -0.0016112590674310923,
          "activation_dot_product": -0.011099272407591343,
          "encoder_gradient_cosine_similarity": 0.004312921315431595,
          "encoder_gradient_l2_distance": -0.04483401030302048,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0030746881384402514,
          "input_gradient_l2_distance": -0.02720894105732441,
          "input_gradient_dot_product": 0.0
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7727587499479239,
        "val_r": 0.487065514281008,
        "n_iterations": 272,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.019984371960163116,
          "right_subspace_overlap_bottom_k": -0.04011644050478935,
          "interaction_matrix_overlap_top_k": -0.0023367092944681644,
          "interaction_matrix_overlap_bottom_k": 0.0018517692806199193,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0024628823157399893,
          "layerwise_effective_rank_mergeability_score": 0.002025397727265954,
          "task_vector_cosine_similarity": -0.0012137687299400568,
          "task_vector_l2_distance": 0.0034156842157244682,
          "task_vector_dot_product": -0.002285826951265335,
          "weight_space_angle": 0.0018608069512993097,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.005782742984592915,
          "subspace_overlap": -0.003669386263936758,
          "right_subspace_overlap": 0.02758338861167431,
          "activation_l2_distance": -0.002256612293422222,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": 0.0023958240635693073,
          "activation_dot_product": -0.011141635477542877,
          "encoder_gradient_cosine_similarity": 0.008709906600415707,
          "encoder_gradient_l2_distance": -0.029338205233216286,
          "encoder_gradient_dot_product": 0.0020928680896759033,
          "input_gradient_cosine_similarity": 0.0028339792042970657,
          "input_gradient_l2_distance": -0.012166459113359451,
          "input_gradient_dot_product": -0.005157559644430876
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7301184331546079,
        "val_r": 0.25862772222240205,
        "n_iterations": 299,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01715259626507759,
          "right_subspace_overlap_bottom_k": -0.039290912449359894,
          "interaction_matrix_overlap_top_k": 0.013889574445784092,
          "interaction_matrix_overlap_bottom_k": -0.015916956588625908,
          "effective_rank": 0.00251792068593204,
          "effective_rank_mergeability_score": -0.0024565281346440315,
          "stable_rank": 0.0012178472243249416,
          "spectral_gap": -0.003962845541536808,
          "singular_value_ratio": 0.005096020642668009,
          "layerwise_effective_rank": 0.0038171173073351383,
          "layerwise_effective_rank_mergeability_score": -0.004018776118755341,
          "task_vector_cosine_similarity": 0.010956551879644394,
          "task_vector_l2_distance": 0.0017388213891535997,
          "task_vector_dot_product": 0.01108989492058754,
          "weight_space_angle": -0.007483424618840218,
          "task_vector_magnitude_ratio": 0.004093156661838293,
          "singular_value_overlap": 0.03578398376703262,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.029772071167826653,
          "activation_l2_distance": -0.013580786995589733,
          "activation_cosine_similarity": 0.03936244174838066,
          "activation_magnitude_ratio": -0.015746166929602623,
          "activation_dot_product": 0.06318000704050064,
          "encoder_gradient_cosine_similarity": 0.0037774285301566124,
          "encoder_gradient_l2_distance": -0.06372082233428955,
          "encoder_gradient_dot_product": -0.0018120144959539175,
          "input_gradient_cosine_similarity": 0.01575412228703499,
          "input_gradient_l2_distance": -0.06607828289270401,
          "input_gradient_dot_product": -0.0029854571912437677
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7902835126372765,
        "val_r": 0.777250283278053,
        "n_iterations": 313,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.01937883347272873,
          "right_subspace_overlap_bottom_k": -0.03175074979662895,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.005493140313774347,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": -0.005082754418253899,
          "task_vector_l2_distance": 0.0031673195771872997,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.005415224004536867,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0066698272712528706,
          "subspace_overlap": -0.004569229204207659,
          "right_subspace_overlap": 0.01145471353083849,
          "activation_l2_distance": 0.005708540789783001,
          "activation_cosine_similarity": 0.023651478812098503,
          "activation_magnitude_ratio": -0.0011451388709247112,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0031342064030468464,
          "encoder_gradient_l2_distance": -0.028747960925102234,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0027810262981802225,
          "input_gradient_l2_distance": -0.009198595769703388,
          "input_gradient_dot_product": -0.0031709184404462576
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7813442537646849,
        "val_r": 0.7924472706242145,
        "n_iterations": 256,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.00801519863307476,
          "right_subspace_overlap_bottom_k": -0.02952522225677967,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.008381418883800507,
          "effective_rank": 0.0016642697155475616,
          "effective_rank_mergeability_score": -0.0018833121284842491,
          "stable_rank": 0.0,
          "spectral_gap": -0.0011811184231191874,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0020822277292609215,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0052402438595891,
          "task_vector_l2_distance": 0.006571640260517597,
          "task_vector_dot_product": -0.0015809042379260063,
          "weight_space_angle": -0.0028230296447873116,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.006444264203310013,
          "subspace_overlap": -0.008459323085844517,
          "right_subspace_overlap": 0.01198591198772192,
          "activation_l2_distance": 0.005098126363009214,
          "activation_cosine_similarity": 0.02287730947136879,
          "activation_magnitude_ratio": 0.0,
          "activation_dot_product": -0.006165016908198595,
          "encoder_gradient_cosine_similarity": 0.003597631584852934,
          "encoder_gradient_l2_distance": -0.016167806461453438,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.003022926626726985,
          "input_gradient_l2_distance": -0.013594754971563816,
          "input_gradient_dot_product": -0.0031757564283907413
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7581641910110042,
        "val_r": 0.7471406549191938,
        "n_iterations": 331,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.032977424561977386,
          "right_subspace_overlap_bottom_k": -0.041553813964128494,
          "interaction_matrix_overlap_top_k": -0.004144025035202503,
          "interaction_matrix_overlap_bottom_k": 0.0010645636357367039,
          "effective_rank": -0.001415084581822157,
          "effective_rank_mergeability_score": 0.0019958443008363247,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.003334588138386607,
          "layerwise_effective_rank_mergeability_score": 0.003556896699592471,
          "task_vector_cosine_similarity": 0.001034163637086749,
          "task_vector_l2_distance": -0.004824329633265734,
          "task_vector_dot_product": -0.010473182424902916,
          "weight_space_angle": -0.0010060666827484965,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.028279505670070648,
          "subspace_overlap": -0.004485655575990677,
          "right_subspace_overlap": 0.02136920392513275,
          "activation_l2_distance": -0.009927925653755665,
          "activation_cosine_similarity": 0.029602648690342903,
          "activation_magnitude_ratio": -0.003732345998287201,
          "activation_dot_product": 0.03295544162392616,
          "encoder_gradient_cosine_similarity": 0.0036632211413234472,
          "encoder_gradient_l2_distance": -0.11015128344297409,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0023607423063367605,
          "input_gradient_l2_distance": -0.06227148696780205,
          "input_gradient_dot_product": -0.0017406935803592205
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7909086906614332,
        "val_r": 0.7663144715869367,
        "n_iterations": 331,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.014456156641244888,
          "right_subspace_overlap_bottom_k": -0.04071410745382309,
          "interaction_matrix_overlap_top_k": -0.001501791994087398,
          "interaction_matrix_overlap_bottom_k": 0.0066762324422597885,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": 0.007213900331407785,
          "task_vector_dot_product": -0.0044606951996684074,
          "weight_space_angle": 0.001412629964761436,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.007375389337539673,
          "subspace_overlap": -0.0038580521941184998,
          "right_subspace_overlap": 0.021209755912423134,
          "activation_l2_distance": -0.0024864748120307922,
          "activation_cosine_similarity": 0.026096312329173088,
          "activation_magnitude_ratio": -0.0024268818087875843,
          "activation_dot_product": -0.0071185571141541,
          "encoder_gradient_cosine_similarity": 0.0053602298721671104,
          "encoder_gradient_l2_distance": -0.03431965410709381,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.01037103682756424,
          "input_gradient_dot_product": -0.006339618936181068
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.8122893319572404,
        "val_r": 0.6453293748598998,
        "n_iterations": 415,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0067427316680550575,
          "right_subspace_overlap_bottom_k": -0.02111029252409935,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.0036922406870871782,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.00182614685036242,
          "task_vector_dot_product": -0.0014412426389753819,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0011357280891388655,
          "singular_value_overlap": 0.007783778011798859,
          "subspace_overlap": -0.012146273627877235,
          "right_subspace_overlap": 0.020579468458890915,
          "activation_l2_distance": 0.0014891638420522213,
          "activation_cosine_similarity": 0.014592590741813183,
          "activation_magnitude_ratio": -0.0024656709283590317,
          "activation_dot_product": -0.004043205175548792,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.015380941331386566,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.009007161483168602,
          "input_gradient_dot_product": -0.0034401905722916126
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.7706920495167346,
        "val_r": 0.6872071147393481,
        "n_iterations": 248,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.024107038974761963,
          "right_subspace_overlap_bottom_k": -0.023981530219316483,
          "interaction_matrix_overlap_top_k": -0.0019114884780719876,
          "interaction_matrix_overlap_bottom_k": 0.010237151756882668,
          "effective_rank": 0.0019708899781107903,
          "effective_rank_mergeability_score": -0.0020813981536775827,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0012688061688095331,
          "task_vector_l2_distance": 0.0014270446263253689,
          "task_vector_dot_product": -0.0019605965353548527,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.0030077723786234856,
          "subspace_overlap": -0.010394120588898659,
          "right_subspace_overlap": 0.005891080480068922,
          "activation_l2_distance": 0.003929058089852333,
          "activation_cosine_similarity": 0.01510532945394516,
          "activation_magnitude_ratio": -0.0033655755687505007,
          "activation_dot_product": -0.0013728669146075845,
          "encoder_gradient_cosine_similarity": 0.003101370297372341,
          "encoder_gradient_l2_distance": -0.012691045179963112,
          "encoder_gradient_dot_product": 0.003022804856300354,
          "input_gradient_cosine_similarity": 0.0019565292168408632,
          "input_gradient_l2_distance": -0.011797493323683739,
          "input_gradient_dot_product": -0.004037077073007822
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7626192729885066,
        "val_r": 0.6819787927745028,
        "n_iterations": 316,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.019609056413173676,
          "right_subspace_overlap_bottom_k": -0.0379418283700943,
          "interaction_matrix_overlap_top_k": 0.00298659922555089,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0013872624840587378,
          "layerwise_effective_rank_mergeability_score": 0.0014100667322054505,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.005598884541541338,
          "task_vector_dot_product": 0.0015775234205648303,
          "weight_space_angle": -0.0034674236085265875,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.014646326191723347,
          "subspace_overlap": -0.001117429113946855,
          "right_subspace_overlap": 0.016854288056492805,
          "activation_l2_distance": -0.0026464895345270634,
          "activation_cosine_similarity": 0.033790137618780136,
          "activation_magnitude_ratio": -0.0049504442140460014,
          "activation_dot_product": 0.0022860169410705566,
          "encoder_gradient_cosine_similarity": 0.004753071814775467,
          "encoder_gradient_l2_distance": -0.06017278879880905,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.05234226584434509,
          "input_gradient_dot_product": -0.009859222918748856
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7624767674650563,
        "val_r": 0.6734807086167082,
        "n_iterations": 240,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.025597117841243744,
          "right_subspace_overlap_bottom_k": -0.035206861793994904,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": -0.00221051974222064,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0011125473538413644,
          "spectral_gap": -0.0016702029388397932,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.004095255397260189,
          "layerwise_effective_rank_mergeability_score": 0.001610070699825883,
          "task_vector_cosine_similarity": -0.01009437721222639,
          "task_vector_l2_distance": -0.0030742392409592867,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.00883825495839119,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": 0.01476062461733818,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.018559826537966728,
          "activation_l2_distance": -0.005012974143028259,
          "activation_cosine_similarity": 0.01842840015888214,
          "activation_magnitude_ratio": -0.0022925150115042925,
          "activation_dot_product": 0.014143076725304127,
          "encoder_gradient_cosine_similarity": 0.003390370635315776,
          "encoder_gradient_l2_distance": -0.0586981326341629,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03544384986162186,
          "input_gradient_dot_product": 0.0014320391928777099
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7892985616758073,
        "val_r": 0.6779903573343538,
        "n_iterations": 288,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0011697730515152216,
          "right_subspace_overlap_bottom_k": -0.011706741526722908,
          "interaction_matrix_overlap_top_k": 0.0021426493767648935,
          "interaction_matrix_overlap_bottom_k": -0.008245693519711494,
          "effective_rank": -0.0014382535591721535,
          "effective_rank_mergeability_score": 0.0015488556819036603,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.0022678442765027285,
          "layerwise_effective_rank": -0.002822648733854294,
          "layerwise_effective_rank_mergeability_score": 0.004785857629030943,
          "task_vector_cosine_similarity": 0.0034252272453159094,
          "task_vector_l2_distance": -0.013641128316521645,
          "task_vector_dot_product": 0.003395499661564827,
          "weight_space_angle": -0.005528485402464867,
          "task_vector_magnitude_ratio": -0.002193636493757367,
          "singular_value_overlap": 0.005916162393987179,
          "subspace_overlap": 0.0,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.006366726942360401,
          "activation_cosine_similarity": 0.008754981681704521,
          "activation_magnitude_ratio": -0.007984671741724014,
          "activation_dot_product": 0.027254583314061165,
          "encoder_gradient_cosine_similarity": 0.005744819529354572,
          "encoder_gradient_l2_distance": -0.02618548832833767,
          "encoder_gradient_dot_product": -0.0032443644013255835,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.023927811533212662,
          "input_gradient_dot_product": -0.007915576919913292
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.3,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train_r": 0.41581203760359914,
      "train_p": 6.26827177401533e-135,
      "val_r": 0.04981601091731226,
      "val_p": 0.3472942834632255
    },
    "per_fold_stats": {
      "train_r_mean": 0.5590102767517646,
      "train_r_std": 0.049449218859214356,
      "val_r_mean": 0.4424779064804386,
      "val_r_std": 0.14324887784596263,
      "n_nonzero_mean": 19.95,
      "n_nonzero_std": 3.761316258971054
    },
    "average_coefficients": {
      "right_subspace_overlap_top_k": 0.000771186372730881,
      "right_subspace_overlap_bottom_k": 0.003557309042662382,
      "interaction_matrix_overlap_top_k": -0.0028331605717539787,
      "interaction_matrix_overlap_bottom_k": 0.03447685018181801,
      "effective_rank": -0.0006774563225917518,
      "effective_rank_mergeability_score": 0.0006938888691365719,
      "stable_rank": -0.0005642032483592629,
      "spectral_gap": 0.0002990943903569132,
      "singular_value_ratio": -0.0003529852838255465,
      "layerwise_effective_rank": -0.0008602337911725044,
      "layerwise_effective_rank_mergeability_score": 0.000725827063433826,
      "task_vector_cosine_similarity": -0.00022301636636257172,
      "task_vector_l2_distance": -0.022900372743606567,
      "task_vector_dot_product": -0.0005278041353449225,
      "weight_space_angle": 0.0008843258256092668,
      "task_vector_magnitude_ratio": -0.0058045280165970325,
      "singular_value_overlap": -0.021344900131225586,
      "subspace_overlap": 0.005373373627662659,
      "right_subspace_overlap": 0.00020797635079361498,
      "activation_l2_distance": -0.0001187356174341403,
      "activation_cosine_similarity": 0.0009398626280017197,
      "activation_magnitude_ratio": -0.005558758974075317,
      "activation_dot_product": -0.00347595801576972,
      "encoder_gradient_cosine_similarity": 0.0002979594864882529,
      "encoder_gradient_l2_distance": -0.013393186032772064,
      "encoder_gradient_dot_product": 0.00018637647735886276,
      "input_gradient_cosine_similarity": 0.0015135946450755,
      "input_gradient_l2_distance": -0.023171164095401764,
      "input_gradient_dot_product": -0.006487053819000721
    },
    "coefficient_std": {
      "right_subspace_overlap_top_k": 0.004998355638235807,
      "right_subspace_overlap_bottom_k": 0.0055370330810546875,
      "interaction_matrix_overlap_top_k": 0.0031822386663407087,
      "interaction_matrix_overlap_bottom_k": 0.010634368285536766,
      "effective_rank": 0.0008734894217923284,
      "effective_rank_mergeability_score": 0.0008940139086917043,
      "stable_rank": 0.0007777729770168662,
      "spectral_gap": 0.0011336508905515075,
      "singular_value_ratio": 0.0008909093448892236,
      "layerwise_effective_rank": 0.0024193539284169674,
      "layerwise_effective_rank_mergeability_score": 0.0019393087131902575,
      "task_vector_cosine_similarity": 0.0019462124910205603,
      "task_vector_l2_distance": 0.010333985090255737,
      "task_vector_dot_product": 0.00223797676153481,
      "weight_space_angle": 0.0016441672341898084,
      "task_vector_magnitude_ratio": 0.0020388911943882704,
      "singular_value_overlap": 0.007576433941721916,
      "subspace_overlap": 0.004089727532118559,
      "right_subspace_overlap": 0.0021585174836218357,
      "activation_l2_distance": 0.004841342102736235,
      "activation_cosine_similarity": 0.0040938896127045155,
      "activation_magnitude_ratio": 0.0029136950615793467,
      "activation_dot_product": 0.0046693370677530766,
      "encoder_gradient_cosine_similarity": 0.0018286538543179631,
      "encoder_gradient_l2_distance": 0.005508338566869497,
      "encoder_gradient_dot_product": 0.001587862498126924,
      "input_gradient_cosine_similarity": 0.0012973534176126122,
      "input_gradient_l2_distance": 0.008264075964689255,
      "input_gradient_dot_product": 0.003065883880481124
    },
    "nonzero_frequency": {
      "right_subspace_overlap_top_k": 0.45,
      "right_subspace_overlap_bottom_k": 0.9,
      "interaction_matrix_overlap_top_k": 0.7,
      "interaction_matrix_overlap_bottom_k": 0.95,
      "effective_rank": 0.4,
      "effective_rank_mergeability_score": 0.4,
      "stable_rank": 0.35,
      "spectral_gap": 0.5,
      "singular_value_ratio": 0.4,
      "layerwise_effective_rank": 0.55,
      "layerwise_effective_rank_mergeability_score": 0.55,
      "task_vector_cosine_similarity": 0.4,
      "task_vector_l2_distance": 0.95,
      "task_vector_dot_product": 0.65,
      "weight_space_angle": 0.5,
      "task_vector_magnitude_ratio": 0.95,
      "singular_value_overlap": 1.0,
      "subspace_overlap": 1.0,
      "right_subspace_overlap": 0.35,
      "activation_l2_distance": 0.75,
      "activation_cosine_similarity": 0.75,
      "activation_magnitude_ratio": 1.0,
      "activation_dot_product": 0.8,
      "encoder_gradient_cosine_similarity": 0.55,
      "encoder_gradient_l2_distance": 1.0,
      "encoder_gradient_dot_product": 0.5,
      "input_gradient_cosine_similarity": 0.65,
      "input_gradient_l2_distance": 1.0,
      "input_gradient_dot_product": 1.0
    },
    "fold_results": [
      {
        "fold": 0,
        "held_out_task": "SUN397",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5854617798954647,
        "val_r": 0.5964049741628756,
        "n_iterations": 336,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.0027587604708969593,
          "interaction_matrix_overlap_top_k": -0.010969525203108788,
          "interaction_matrix_overlap_bottom_k": 0.027749070897698402,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0010086281690746546,
          "stable_rank": 0.0,
          "spectral_gap": -0.0011178120039403439,
          "singular_value_ratio": 0.0012271103914827108,
          "layerwise_effective_rank": 0.002391842193901539,
          "layerwise_effective_rank_mergeability_score": -0.0028714342042803764,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.012460729107260704,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.005719712004065514,
          "singular_value_overlap": -0.012858293019235134,
          "subspace_overlap": 0.011259743943810463,
          "right_subspace_overlap": 0.0010688547044992447,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.003077899571508169,
          "activation_magnitude_ratio": -0.004687635228037834,
          "activation_dot_product": -0.003703347872942686,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.007720253895968199,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.010256273671984673,
          "input_gradient_dot_product": -0.0031393738463521004
        }
      },
      {
        "fold": 1,
        "held_out_task": "Cars",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5598343160521068,
        "val_r": 0.4802319593241553,
        "n_iterations": 279,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0029595668893307447,
          "interaction_matrix_overlap_top_k": -0.00288494979031384,
          "interaction_matrix_overlap_bottom_k": 0.03384906053543091,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.023483099415898323,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.006840126123279333,
          "singular_value_overlap": -0.018337465822696686,
          "subspace_overlap": 0.0018112375400960445,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0024381298571825027,
          "activation_cosine_similarity": 0.0017118381801992655,
          "activation_magnitude_ratio": -0.004561457317322493,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.0014926593285053968,
          "encoder_gradient_l2_distance": -0.016845522448420525,
          "encoder_gradient_dot_product": 0.001872923457995057,
          "input_gradient_cosine_similarity": 0.0017683302285149693,
          "input_gradient_l2_distance": -0.018842626363039017,
          "input_gradient_dot_product": -0.0027029349002987146
        }
      },
      {
        "fold": 2,
        "held_out_task": "RESISC45",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5509785595039542,
        "val_r": 0.4823206829271176,
        "n_iterations": 247,
        "n_nonzero_coefficients": 14,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.002037945669144392,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.025325004011392593,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.001185643021017313,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.015621689148247242,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.004695940297096968,
          "singular_value_overlap": -0.01590060070157051,
          "subspace_overlap": 0.003792770905420184,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.00423771096393466,
          "activation_dot_product": -0.0023560859262943268,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.009173925034701824,
          "encoder_gradient_dot_product": 0.0011871347669512033,
          "input_gradient_cosine_similarity": 0.001575128873810172,
          "input_gradient_l2_distance": -0.01621313765645027,
          "input_gradient_dot_product": -0.0069977943785488605
        }
      },
      {
        "fold": 3,
        "held_out_task": "EuroSAT",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5520038409731195,
        "val_r": 0.5049641080599196,
        "n_iterations": 378,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.011175630614161491,
          "interaction_matrix_overlap_top_k": -0.0037786581087857485,
          "interaction_matrix_overlap_bottom_k": 0.04352420195937157,
          "effective_rank": -0.0013932869769632816,
          "effective_rank_mergeability_score": 0.0019557003397494555,
          "stable_rank": -0.0014668668154627085,
          "spectral_gap": 0.0018305128905922174,
          "singular_value_ratio": -0.001493343384936452,
          "layerwise_effective_rank": -0.001542452024295926,
          "layerwise_effective_rank_mergeability_score": 0.0017373127629980445,
          "task_vector_cosine_similarity": -0.0015584758948534727,
          "task_vector_l2_distance": -0.03321041166782379,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.00815115962177515,
          "singular_value_overlap": -0.029935145750641823,
          "subspace_overlap": 0.005895503796637058,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0061234477907419205,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.00944657251238823,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.009805815294384956,
          "encoder_gradient_dot_product": -0.0012849490158259869,
          "input_gradient_cosine_similarity": 0.0037005236372351646,
          "input_gradient_l2_distance": -0.02814554050564766,
          "input_gradient_dot_product": -0.008749538101255894
        }
      },
      {
        "fold": 4,
        "held_out_task": "SVHN",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5939355863621305,
        "val_r": 0.5782080618901905,
        "n_iterations": 492,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0014651904348284006,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.031933967024087906,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.020801737904548645,
          "task_vector_dot_product": -0.003315472276881337,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.0045225354842841625,
          "singular_value_overlap": -0.018129179254174232,
          "subspace_overlap": -0.0012885385658591986,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.001202852581627667,
          "activation_cosine_similarity": -0.0018208229448646307,
          "activation_magnitude_ratio": -0.005765118636190891,
          "activation_dot_product": -0.0012034588726237416,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.007299884222447872,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0025344151072204113,
          "input_gradient_l2_distance": -0.018506305292248726,
          "input_gradient_dot_product": -0.002709774998947978
        }
      },
      {
        "fold": 5,
        "held_out_task": "GTSRB",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.5663035228595943,
        "val_r": 0.6179450677284435,
        "n_iterations": 295,
        "n_nonzero_coefficients": 15,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": -0.00376480957493186,
          "interaction_matrix_overlap_top_k": -0.005165766924619675,
          "interaction_matrix_overlap_bottom_k": 0.03284291923046112,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.017333179712295532,
          "task_vector_dot_product": 0.00436348607763648,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.006775065790861845,
          "singular_value_overlap": -0.015592200681567192,
          "subspace_overlap": 0.0016271410277113318,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.004894510842859745,
          "activation_dot_product": -0.0016683286521583796,
          "encoder_gradient_cosine_similarity": 0.001641861512325704,
          "encoder_gradient_l2_distance": -0.008354788646101952,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0011149403871968389,
          "input_gradient_l2_distance": -0.01126454770565033,
          "input_gradient_dot_product": -0.0034182490780949593
        }
      },
      {
        "fold": 6,
        "held_out_task": "MNIST",
        "n_train_pairs": 164,
        "n_val_pairs": 15,
        "train_r": 0.5794153858561251,
        "val_r": 0.2084254564080656,
        "n_iterations": 187,
        "n_nonzero_coefficients": 19,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0012568258680403233,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.001206244807690382,
          "interaction_matrix_overlap_bottom_k": 0.0367540642619133,
          "effective_rank": -0.00116757582873106,
          "effective_rank_mergeability_score": 0.0017708060331642628,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.018162347376346588,
          "task_vector_dot_product": -0.006130089983344078,
          "weight_space_angle": 0.002183478558436036,
          "task_vector_magnitude_ratio": -0.006573235150426626,
          "singular_value_overlap": -0.023492464795708656,
          "subspace_overlap": 0.005407592281699181,
          "right_subspace_overlap": 0.002677262993529439,
          "activation_l2_distance": -0.012351015582680702,
          "activation_cosine_similarity": 0.012339349836111069,
          "activation_magnitude_ratio": 0.0034306657034903765,
          "activation_dot_product": -0.020225465297698975,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.021291878074407578,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03108304925262928,
          "input_gradient_dot_product": -0.013210399076342583
        }
      },
      {
        "fold": 7,
        "held_out_task": "DTD",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5194443213562621,
        "val_r": 0.3506908512145717,
        "n_iterations": 292,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.009286959655582905,
          "interaction_matrix_overlap_top_k": -0.0024412618950009346,
          "interaction_matrix_overlap_bottom_k": 0.04807247593998909,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": -0.001273138914257288,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010430682450532913,
          "task_vector_l2_distance": -0.03535817563533783,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0018898660782724619,
          "task_vector_magnitude_ratio": -0.007832750678062439,
          "singular_value_overlap": -0.028828782960772514,
          "subspace_overlap": 0.010617786087095737,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0071038659662008286,
          "activation_dot_product": -0.0032159066759049892,
          "encoder_gradient_cosine_similarity": 0.0014660044107586145,
          "encoder_gradient_l2_distance": -0.01344169769436121,
          "encoder_gradient_dot_product": 0.0010356779675930738,
          "input_gradient_cosine_similarity": 0.0015826476737856865,
          "input_gradient_l2_distance": -0.01642231084406376,
          "input_gradient_dot_product": -0.001204141415655613
        }
      },
      {
        "fold": 8,
        "held_out_task": "Flowers102",
        "n_train_pairs": 163,
        "n_val_pairs": 16,
        "train_r": 0.47792095843498517,
        "val_r": 0.1806622521476343,
        "n_iterations": 232,
        "n_nonzero_coefficients": 25,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0016471596900373697,
          "right_subspace_overlap_bottom_k": -0.007955561392009258,
          "interaction_matrix_overlap_top_k": -0.0030426536686718464,
          "interaction_matrix_overlap_bottom_k": 0.034660037606954575,
          "effective_rank": -0.0021067573688924313,
          "effective_rank_mergeability_score": 0.002640481572598219,
          "stable_rank": -0.0017160429852083325,
          "spectral_gap": 0.0011007392313331366,
          "singular_value_ratio": -0.0019082824001088738,
          "layerwise_effective_rank": -0.002126976614817977,
          "layerwise_effective_rank_mergeability_score": 0.0019346732879057527,
          "task_vector_cosine_similarity": -0.0010352255776524544,
          "task_vector_l2_distance": -0.011725984513759613,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.005558381322771311,
          "singular_value_overlap": -0.014069187454879284,
          "subspace_overlap": 0.005278197582811117,
          "right_subspace_overlap": 0.001716629951260984,
          "activation_l2_distance": -0.0032885887194424868,
          "activation_cosine_similarity": 0.002993218833580613,
          "activation_magnitude_ratio": -0.0022105113603174686,
          "activation_dot_product": -0.0032860753126442432,
          "encoder_gradient_cosine_similarity": 0.0033969224896281958,
          "encoder_gradient_l2_distance": -0.008230943232774734,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.014593883417546749,
          "input_gradient_dot_product": -0.007520508952438831
        }
      },
      {
        "fold": 9,
        "held_out_task": "PCAM",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5630300177778378,
        "val_r": 0.18528250870671006,
        "n_iterations": 305,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0021007212344557047,
          "right_subspace_overlap_bottom_k": 0.011583030223846436,
          "interaction_matrix_overlap_top_k": -0.003537992015480995,
          "interaction_matrix_overlap_bottom_k": 0.04032205417752266,
          "effective_rank": -0.001509809517301619,
          "effective_rank_mergeability_score": 0.0014080627588555217,
          "stable_rank": -0.0017386488616466522,
          "spectral_gap": 0.0021088968496769667,
          "singular_value_ratio": -0.0018575451103970408,
          "layerwise_effective_rank": -0.001365026691928506,
          "layerwise_effective_rank_mergeability_score": 0.001328949467279017,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.0327385850250721,
          "task_vector_dot_product": -0.0022230995818972588,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.005216115154325962,
          "singular_value_overlap": -0.03061533533036709,
          "subspace_overlap": 0.010448677465319633,
          "right_subspace_overlap": -0.003004038706421852,
          "activation_l2_distance": -0.004046001471579075,
          "activation_cosine_similarity": -0.0071115377359092236,
          "activation_magnitude_ratio": -0.0062423706986010075,
          "activation_dot_product": -0.007633410859853029,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.013650866225361824,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.03135497123003006,
          "input_gradient_dot_product": -0.004746966529637575
        }
      },
      {
        "fold": 10,
        "held_out_task": "FER2013",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5209096407120051,
        "val_r": 0.39523215658126853,
        "n_iterations": 314,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0018224542727693915,
          "right_subspace_overlap_bottom_k": 0.004415964707732201,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.03271207958459854,
          "effective_rank": -0.00110371015034616,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": -0.0012737065553665161,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0013404299970716238,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.003745407797396183,
          "task_vector_l2_distance": -0.018728584051132202,
          "task_vector_dot_product": -0.0023633763194084167,
          "weight_space_angle": 0.0020382837392389774,
          "task_vector_magnitude_ratio": -0.004438401199877262,
          "singular_value_overlap": -0.019354522228240967,
          "subspace_overlap": 0.004902530927211046,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.007980434224009514,
          "activation_cosine_similarity": -0.0016278389375656843,
          "activation_magnitude_ratio": -0.00763744255527854,
          "activation_dot_product": -0.006729804445058107,
          "encoder_gradient_cosine_similarity": -0.0025677853263914585,
          "encoder_gradient_l2_distance": -0.012332107871770859,
          "encoder_gradient_dot_product": -0.004689664579927921,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.020993636921048164,
          "input_gradient_dot_product": -0.00419513788074255
        }
      },
      {
        "fold": 11,
        "held_out_task": "OxfordIIITPet",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5160949003075043,
        "val_r": 0.5273506802926412,
        "n_iterations": 399,
        "n_nonzero_coefficients": 17,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.0,
          "interaction_matrix_overlap_top_k": -0.004249352961778641,
          "interaction_matrix_overlap_bottom_k": 0.029796013608574867,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0010111491428688169,
          "task_vector_cosine_similarity": -0.0026182839646935463,
          "task_vector_l2_distance": -0.012520181015133858,
          "task_vector_dot_product": -0.0015849277842789888,
          "weight_space_angle": 0.0020940802060067654,
          "task_vector_magnitude_ratio": -0.005466807167977095,
          "singular_value_overlap": -0.021036451682448387,
          "subspace_overlap": 0.007442502770572901,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0,
          "activation_cosine_similarity": 0.001765526831150055,
          "activation_magnitude_ratio": -0.005946052260696888,
          "activation_dot_product": -0.006677696947008371,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.01266811415553093,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0023650103248655796,
          "input_gradient_l2_distance": -0.021279286593198776,
          "input_gradient_dot_product": -0.009634512476623058
        }
      },
      {
        "fold": 12,
        "held_out_task": "STL10",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5217935230689998,
        "val_r": 0.5170272405408263,
        "n_iterations": 300,
        "n_nonzero_coefficients": 16,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.004577931482344866,
          "interaction_matrix_overlap_top_k": -0.0026789435651153326,
          "interaction_matrix_overlap_bottom_k": 0.04542727768421173,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0010594443883746862,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.030055886134505272,
          "task_vector_dot_product": 0.0011247212532907724,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.007549887523055077,
          "singular_value_overlap": -0.025544337928295135,
          "subspace_overlap": 0.003289029933512211,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0087269963696599,
          "activation_cosine_similarity": 0.001342222560197115,
          "activation_magnitude_ratio": -0.005399439018219709,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.014062394388020039,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0018111735116690397,
          "input_gradient_l2_distance": -0.025571368634700775,
          "input_gradient_dot_product": -0.009286168962717056
        }
      },
      {
        "fold": 13,
        "held_out_task": "CIFAR100",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5332221363382699,
        "val_r": 0.6599632738980735,
        "n_iterations": 258,
        "n_nonzero_coefficients": 23,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0024103557225316763,
          "right_subspace_overlap_bottom_k": 0.001528751803562045,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.03517743572592735,
          "effective_rank": -0.002174559747800231,
          "effective_rank_mergeability_score": 0.0017752563580870628,
          "stable_rank": -0.0015517068095505238,
          "spectral_gap": 0.001639249618165195,
          "singular_value_ratio": -0.0018940182635560632,
          "layerwise_effective_rank": -0.0015607469249516726,
          "layerwise_effective_rank_mergeability_score": 0.0018041995353996754,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.026725424453616142,
          "task_vector_dot_product": 0.0,
          "weight_space_angle": 0.0013782830210402608,
          "task_vector_magnitude_ratio": -0.0054378751665353775,
          "singular_value_overlap": -0.02662530727684498,
          "subspace_overlap": 0.0017707271035760641,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": -0.0024774731136858463,
          "activation_cosine_similarity": 0.0,
          "activation_magnitude_ratio": -0.0072867851704359055,
          "activation_dot_product": -0.00521989818662405,
          "encoder_gradient_cosine_similarity": 0.0,
          "encoder_gradient_l2_distance": -0.015968579798936844,
          "encoder_gradient_dot_product": -0.0023279967717826366,
          "input_gradient_cosine_similarity": 0.0018183288630098104,
          "input_gradient_l2_distance": -0.026846542954444885,
          "input_gradient_dot_product": -0.008941066451370716
        }
      },
      {
        "fold": 14,
        "held_out_task": "CIFAR10",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5228571942107536,
        "val_r": 0.5773101313477232,
        "n_iterations": 255,
        "n_nonzero_coefficients": 28,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0023172739893198013,
          "right_subspace_overlap_bottom_k": 0.004072110168635845,
          "interaction_matrix_overlap_top_k": -0.00203699991106987,
          "interaction_matrix_overlap_bottom_k": 0.04563574492931366,
          "effective_rank": -0.0018331415485590696,
          "effective_rank_mergeability_score": 0.0015514213591814041,
          "stable_rank": -0.001941874623298645,
          "spectral_gap": 0.002033438766375184,
          "singular_value_ratio": -0.0010074053425341845,
          "layerwise_effective_rank": -0.0014756490709260106,
          "layerwise_effective_rank_mergeability_score": 0.0013806632487103343,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.03796462342143059,
          "task_vector_dot_product": 0.0012804262805730104,
          "weight_space_angle": 0.0029117476660758257,
          "task_vector_magnitude_ratio": -0.00954233855009079,
          "singular_value_overlap": -0.03390505164861679,
          "subspace_overlap": 0.009260897524654865,
          "right_subspace_overlap": -0.0013644634746015072,
          "activation_l2_distance": 0.0012803686549887061,
          "activation_cosine_similarity": -0.0024835695512592793,
          "activation_magnitude_ratio": -0.010037289001047611,
          "activation_dot_product": -0.0044958931393921375,
          "encoder_gradient_cosine_similarity": -0.0017973330104723573,
          "encoder_gradient_l2_distance": -0.015958959236741066,
          "encoder_gradient_dot_product": 0.001788097433745861,
          "input_gradient_cosine_similarity": 0.003128360491245985,
          "input_gradient_l2_distance": -0.037928733974695206,
          "input_gradient_dot_product": -0.007233182899653912
        }
      },
      {
        "fold": 15,
        "held_out_task": "Food101",
        "n_train_pairs": 162,
        "n_val_pairs": 17,
        "train_r": 0.5667041578943568,
        "val_r": 0.37760187492200314,
        "n_iterations": 323,
        "n_nonzero_coefficients": 20,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0019332119263708591,
          "right_subspace_overlap_bottom_k": 0.0021842382848262787,
          "interaction_matrix_overlap_top_k": -0.0011198152787983418,
          "interaction_matrix_overlap_bottom_k": 0.024706553667783737,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0011168336495757103,
          "layerwise_effective_rank_mergeability_score": 0.0,
          "task_vector_cosine_similarity": 0.0010831381659954786,
          "task_vector_l2_distance": -0.019113318994641304,
          "task_vector_dot_product": 0.0014080355176702142,
          "weight_space_angle": 0.001031993655487895,
          "task_vector_magnitude_ratio": -0.005882286000996828,
          "singular_value_overlap": -0.010165202431380749,
          "subspace_overlap": 0.0012828861363232136,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.0017603333108127117,
          "activation_cosine_similarity": 0.0015686014667153358,
          "activation_magnitude_ratio": -0.005540624260902405,
          "activation_dot_product": -0.0036963652819395065,
          "encoder_gradient_cosine_similarity": -0.0019522779621183872,
          "encoder_gradient_l2_distance": -0.010910853743553162,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.015020867809653282,
          "input_gradient_dot_product": -0.0054370141588151455
        }
      },
      {
        "fold": 16,
        "held_out_task": "FashionMNIST",
        "n_train_pairs": 160,
        "n_val_pairs": 19,
        "train_r": 0.5594115615431068,
        "val_r": 0.46562127442574086,
        "n_iterations": 353,
        "n_nonzero_coefficients": 24,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.013511640019714832,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.05064597725868225,
          "effective_rank": -0.0022602854296565056,
          "effective_rank_mergeability_score": 0.0017674207920208573,
          "stable_rank": -0.0015952188987284899,
          "spectral_gap": 0.0022759768180549145,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0012183748185634613,
          "layerwise_effective_rank_mergeability_score": 0.0011823336826637387,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.043577276170253754,
          "task_vector_dot_product": 0.001259493874385953,
          "weight_space_angle": 0.002927586203441024,
          "task_vector_magnitude_ratio": -0.005321447737514973,
          "singular_value_overlap": -0.032079536467790604,
          "subspace_overlap": 0.006219078786671162,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.008866984397172928,
          "activation_cosine_similarity": -0.0017944632563740015,
          "activation_magnitude_ratio": -0.010304315015673637,
          "activation_dot_product": 0.0023681458551436663,
          "encoder_gradient_cosine_similarity": 0.004503736272454262,
          "encoder_gradient_l2_distance": -0.012335010804235935,
          "encoder_gradient_dot_product": 0.0016812224639579654,
          "input_gradient_cosine_similarity": 0.001873350003734231,
          "input_gradient_l2_distance": -0.03787010908126831,
          "input_gradient_dot_product": -0.00998497474938631
        }
      },
      {
        "fold": 17,
        "held_out_task": "EMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5869140401741506,
        "val_r": 0.2790026856033174,
        "n_iterations": 199,
        "n_nonzero_coefficients": 18,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.0,
          "right_subspace_overlap_bottom_k": 0.007525056134909391,
          "interaction_matrix_overlap_top_k": -0.011347697116434574,
          "interaction_matrix_overlap_bottom_k": 0.03464752435684204,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": -0.0027237816248089075,
          "layerwise_effective_rank_mergeability_score": 0.002946848515421152,
          "task_vector_cosine_similarity": 0.0,
          "task_vector_l2_distance": -0.019477298483252525,
          "task_vector_dot_product": 0.0011870136950165033,
          "weight_space_angle": 0.0,
          "task_vector_magnitude_ratio": -0.002635451266542077,
          "singular_value_overlap": -0.013696659356355667,
          "subspace_overlap": 0.006757482886314392,
          "right_subspace_overlap": 0.0,
          "activation_l2_distance": 0.001933180377818644,
          "activation_cosine_similarity": -0.0031888321973383427,
          "activation_magnitude_ratio": -0.005540188401937485,
          "activation_dot_product": 0.0,
          "encoder_gradient_cosine_similarity": -0.001979042310267687,
          "encoder_gradient_l2_distance": -0.007543045561760664,
          "encoder_gradient_dot_product": 0.0,
          "input_gradient_cosine_similarity": 0.0036322367377579212,
          "input_gradient_l2_distance": -0.027478713542222977,
          "input_gradient_dot_product": -0.00415414571762085
        }
      },
      {
        "fold": 18,
        "held_out_task": "KMNIST",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.7340428511687523,
        "val_r": 0.5340119188901057,
        "n_iterations": 251,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": 0.02126951888203621,
          "right_subspace_overlap_bottom_k": -0.001441311789676547,
          "interaction_matrix_overlap_top_k": -0.002203352050855756,
          "interaction_matrix_overlap_bottom_k": 0.0,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": -0.0016440270701423287,
          "singular_value_ratio": 0.001146916882134974,
          "layerwise_effective_rank": -0.010040774941444397,
          "layerwise_effective_rank_mergeability_score": 0.007177793886512518,
          "task_vector_cosine_similarity": -0.006860989611595869,
          "task_vector_l2_distance": 0.0,
          "task_vector_dot_product": -0.0037139735650271177,
          "weight_space_angle": 0.004619083367288113,
          "task_vector_magnitude_ratio": 0.0,
          "singular_value_overlap": -0.00844587292522192,
          "subspace_overlap": -0.0017687028739601374,
          "right_subspace_overlap": 0.007329538464546204,
          "activation_l2_distance": -0.0015975640853866935,
          "activation_cosine_similarity": 0.009437683038413525,
          "activation_magnitude_ratio": -0.0036213649436831474,
          "activation_dot_product": 0.001053058309480548,
          "encoder_gradient_cosine_similarity": 0.0030680415220558643,
          "encoder_gradient_l2_distance": -0.030028576031327248,
          "encoder_gradient_dot_product": 0.0024264648091048002,
          "input_gradient_cosine_similarity": 0.0,
          "input_gradient_l2_distance": -0.019093384966254234,
          "input_gradient_dot_product": -0.00916232354938984
        }
      },
      {
        "fold": 19,
        "held_out_task": "RenderedSST2",
        "n_train_pairs": 161,
        "n_val_pairs": 18,
        "train_r": 0.5699272405458133,
        "val_r": 0.33130097053738866,
        "n_iterations": 241,
        "n_nonzero_coefficients": 22,
        "coefficients": {
          "right_subspace_overlap_top_k": -0.0056770918890833855,
          "right_subspace_overlap_bottom_k": 0.010742605663836002,
          "interaction_matrix_overlap_top_k": 0.0,
          "interaction_matrix_overlap_bottom_k": 0.035755522549152374,
          "effective_rank": 0.0,
          "effective_rank_mergeability_score": 0.0,
          "stable_rank": 0.0,
          "spectral_gap": 0.0,
          "singular_value_ratio": 0.0,
          "layerwise_effective_rank": 0.0,
          "layerwise_effective_rank_mergeability_score": -0.0010936502367258072,
          "task_vector_cosine_similarity": 0.001741033629514277,
          "task_vector_l2_distance": -0.028948934748768806,
          "task_vector_dot_product": -0.001848320011049509,
          "weight_space_angle": -0.0033878860995173454,
          "task_vector_magnitude_ratio": -0.00793104525655508,
          "singular_value_overlap": -0.028286410495638847,
          "subspace_overlap": 0.013460924848914146,
          "right_subspace_overlap": -0.004264256916940212,
          "activation_l2_distance": -0.002965926192700863,
          "activation_cosine_similarity": 0.0025879754684865475,
          "activation_magnitude_ratio": -0.004142588935792446,
          "activation_dot_product": -0.0028286210726946592,
          "encoder_gradient_cosine_similarity": 0.0016717216931283474,
          "encoder_gradient_l2_distance": -0.020240504294633865,
          "encoder_gradient_dot_product": 0.0020386194810271263,
          "input_gradient_cosine_similarity": 0.0033674477599561214,
          "input_gradient_l2_distance": -0.034657951444387436,
          "input_gradient_dot_product": -0.007312857545912266
        }
      }
    ],
    "optimization_params": {
      "lambda_l1": 0.3,
      "n_iterations": 2000,
      "learning_rate": 0.01,
      "patience": 100,
      "convergence_threshold": 1e-05
    }
  }
}