{
  "aggregate_metrics": {
    "train_r": 0.5926168702577306,
    "train_p": 7.56942168062438e-305,
    "val_r": 0.4396257068269801,
    "val_p": 2.3738329626086106e-18
  },
  "per_fold_stats": {
    "train_r_mean": 0.7471577939569263,
    "train_r_std": 0.027050015865128108,
    "val_r_mean": 0.6253752447783778,
    "val_r_std": 0.16719451651075096,
    "n_nonzero_mean": 21.25,
    "n_nonzero_std": 3.207413287993925
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.013724428601562977,
    "right_subspace_overlap_bottom_k": -0.017672907561063766,
    "interaction_matrix_overlap_top_k": 0.0005202004685997963,
    "interaction_matrix_overlap_bottom_k": 0.0018436642130836844,
    "effective_rank": -0.0007864800281822681,
    "effective_rank_mergeability_score": 0.0009055379778146744,
    "stable_rank": -0.0012206590035930276,
    "spectral_gap": 4.150969471083954e-05,
    "singular_value_ratio": 4.0163868106901646e-06,
    "layerwise_effective_rank": -0.0017830576980486512,
    "layerwise_effective_rank_mergeability_score": 0.001600724644958973,
    "task_vector_cosine_similarity": -0.000994836213067174,
    "task_vector_l2_distance": -0.008177132345736027,
    "task_vector_dot_product": -0.0024344122502952814,
    "weight_space_angle": 0.0016768056666478515,
    "task_vector_magnitude_ratio": -0.0007848691311664879,
    "singular_value_overlap": 0.00024485308676958084,
    "subspace_overlap": -0.0008565217140130699,
    "right_subspace_overlap": 0.01227252185344696,
    "activation_l2_distance": -0.002632628194987774,
    "activation_cosine_similarity": 0.01959354244172573,
    "activation_magnitude_ratio": -0.004180660471320152,
    "activation_dot_product": 0.005457724444568157,
    "encoder_gradient_cosine_similarity": 0.004266757518053055,
    "encoder_gradient_l2_distance": -0.044720977544784546,
    "encoder_gradient_dot_product": 0.0013078686315566301,
    "input_gradient_cosine_similarity": 0.0021346337161958218,
    "input_gradient_l2_distance": -0.03384353220462799,
    "input_gradient_dot_product": -0.007391627877950668
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.007847652770578861,
    "right_subspace_overlap_bottom_k": 0.005689507350325584,
    "interaction_matrix_overlap_top_k": 0.0020071661565452814,
    "interaction_matrix_overlap_bottom_k": 0.0028948558028787374,
    "effective_rank": 0.0013003022177144885,
    "effective_rank_mergeability_score": 0.0013669293839484453,
    "stable_rank": 0.0015239563072100282,
    "spectral_gap": 0.0012949913507327437,
    "singular_value_ratio": 0.0013379754964262247,
    "layerwise_effective_rank": 0.0012649433920159936,
    "layerwise_effective_rank_mergeability_score": 0.0014054446946829557,
    "task_vector_cosine_similarity": 0.0044459449127316475,
    "task_vector_l2_distance": 0.007551178336143494,
    "task_vector_dot_product": 0.0018911801744252443,
    "weight_space_angle": 0.0033015210647135973,
    "task_vector_magnitude_ratio": 0.0012510051019489765,
    "singular_value_overlap": 0.0032466573175042868,
    "subspace_overlap": 0.0015549649251624942,
    "right_subspace_overlap": 0.006801805924624205,
    "activation_l2_distance": 0.004796684253960848,
    "activation_cosine_similarity": 0.007266839034855366,
    "activation_magnitude_ratio": 0.0023644070606678724,
    "activation_dot_product": 0.010821906849741936,
    "encoder_gradient_cosine_similarity": 0.002439163625240326,
    "encoder_gradient_l2_distance": 0.018027573823928833,
    "encoder_gradient_dot_product": 0.0019537152256816626,
    "input_gradient_cosine_similarity": 0.002079788828268647,
    "input_gradient_l2_distance": 0.015846868976950645,
    "input_gradient_dot_product": 0.0038701763842254877
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 1.0,
    "right_subspace_overlap_bottom_k": 1.0,
    "interaction_matrix_overlap_top_k": 0.55,
    "interaction_matrix_overlap_bottom_k": 0.65,
    "effective_rank": 0.35,
    "effective_rank_mergeability_score": 0.4,
    "stable_rank": 0.55,
    "spectral_gap": 0.45,
    "singular_value_ratio": 0.45,
    "layerwise_effective_rank": 0.8,
    "layerwise_effective_rank_mergeability_score": 0.75,
    "task_vector_cosine_similarity": 0.55,
    "task_vector_l2_distance": 0.85,
    "task_vector_dot_product": 0.75,
    "weight_space_angle": 0.8,
    "task_vector_magnitude_ratio": 0.6,
    "singular_value_overlap": 0.55,
    "subspace_overlap": 0.4,
    "right_subspace_overlap": 0.95,
    "activation_l2_distance": 0.85,
    "activation_cosine_similarity": 1.0,
    "activation_magnitude_ratio": 0.95,
    "activation_dot_product": 0.8,
    "encoder_gradient_cosine_similarity": 0.95,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.55,
    "input_gradient_cosine_similarity": 0.8,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.95
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7641664039687966,
      "val_r": 0.6153039611742014,
      "n_iterations": 268,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009024444036185741,
        "right_subspace_overlap_bottom_k": -0.008244887925684452,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0019921937491744757,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.003889478277415037,
        "task_vector_dot_product": -0.0032076286152005196,
        "weight_space_angle": 0.0021412780042737722,
        "task_vector_magnitude_ratio": -0.0025716102682054043,
        "singular_value_overlap": -0.003299061441794038,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.005398551467806101,
        "activation_l2_distance": 0.0030883632134646177,
        "activation_cosine_similarity": 0.0194547101855278,
        "activation_magnitude_ratio": -0.004809306003153324,
        "activation_dot_product": -0.003896509064361453,
        "encoder_gradient_cosine_similarity": 0.0013710171915590763,
        "encoder_gradient_l2_distance": -0.023211752995848656,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0019323891028761864,
        "input_gradient_l2_distance": -0.014405721798539162,
        "input_gradient_dot_product": -0.00660921772941947
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.730118415975912,
      "val_r": 0.8074247432351749,
      "n_iterations": 363,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.01893748715519905,
        "right_subspace_overlap_bottom_k": -0.022701263427734375,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0012041323352605104,
        "stable_rank": -0.00200723041780293,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0019095820607617497,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0028800847940146923,
        "task_vector_l2_distance": -0.01565822958946228,
        "task_vector_dot_product": -0.0032834301237016916,
        "weight_space_angle": -0.0028945463709533215,
        "task_vector_magnitude_ratio": -0.001960551831871271,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.023850498721003532,
        "activation_l2_distance": -0.010261435061693192,
        "activation_cosine_similarity": 0.027808653190732002,
        "activation_magnitude_ratio": -0.009713947772979736,
        "activation_dot_product": 0.002853161422535777,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0780031606554985,
        "encoder_gradient_dot_product": 0.0011548787588253617,
        "input_gradient_cosine_similarity": 0.003538701683282852,
        "input_gradient_l2_distance": -0.055419743061065674,
        "input_gradient_dot_product": -0.007235167548060417
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.754263263771205,
      "val_r": 0.7039496065953981,
      "n_iterations": 251,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.010079054161906242,
        "right_subspace_overlap_bottom_k": -0.01398113090544939,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.004095263779163361,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0014630267396569252,
        "singular_value_ratio": 0.0011625145561993122,
        "layerwise_effective_rank": -0.0014414484612643719,
        "layerwise_effective_rank_mergeability_score": 0.0023569809272885323,
        "task_vector_cosine_similarity": -0.002901046071201563,
        "task_vector_l2_distance": -0.003846214385703206,
        "task_vector_dot_product": -0.0013853444252163172,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0033738981001079082,
        "subspace_overlap": -0.0014376253820955753,
        "right_subspace_overlap": 0.013598824851214886,
        "activation_l2_distance": -0.0026845026295632124,
        "activation_cosine_similarity": 0.011262585408985615,
        "activation_magnitude_ratio": -0.004477307666093111,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0035502049140632153,
        "encoder_gradient_l2_distance": -0.027852047234773636,
        "encoder_gradient_dot_product": 0.0013247421011328697,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.021327678114175797,
        "input_gradient_dot_product": -0.004185395315289497
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7196474653919857,
      "val_r": 0.6810674152992265,
      "n_iterations": 352,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02211422473192215,
        "right_subspace_overlap_bottom_k": -0.019439078867435455,
        "interaction_matrix_overlap_top_k": 0.001992088044062257,
        "interaction_matrix_overlap_bottom_k": 0.0015709990402683616,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0016915041487663984,
        "singular_value_ratio": 0.001967239659279585,
        "layerwise_effective_rank": -0.0013050900306552649,
        "layerwise_effective_rank_mergeability_score": 0.0023458702489733696,
        "task_vector_cosine_similarity": -0.004860764369368553,
        "task_vector_l2_distance": -0.005447322968393564,
        "task_vector_dot_product": -0.003574846312403679,
        "weight_space_angle": 0.004859617445617914,
        "task_vector_magnitude_ratio": 0.0011478158412501216,
        "singular_value_overlap": 0.0010869349353015423,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.012776152230799198,
        "activation_l2_distance": -0.004869913682341576,
        "activation_cosine_similarity": 0.01670333370566368,
        "activation_magnitude_ratio": -0.0033908402547240257,
        "activation_dot_product": 0.010115502402186394,
        "encoder_gradient_cosine_similarity": 0.0034999498166143894,
        "encoder_gradient_l2_distance": -0.041647572070360184,
        "encoder_gradient_dot_product": 0.006208838429301977,
        "input_gradient_cosine_similarity": 0.0010595244821161032,
        "input_gradient_l2_distance": -0.046172238886356354,
        "input_gradient_dot_product": -0.01623384840786457
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7462125872818015,
      "val_r": 0.7514684124466295,
      "n_iterations": 440,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.004185941070318222,
        "right_subspace_overlap_bottom_k": -0.013581870123744011,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0010601093526929617,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0038691931404173374,
        "task_vector_dot_product": -0.005899668671190739,
        "weight_space_angle": -0.001241954043507576,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.015142606571316719,
        "activation_l2_distance": 0.004897105973213911,
        "activation_cosine_similarity": 0.01942877098917961,
        "activation_magnitude_ratio": -0.001824579550884664,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0038254931569099426,
        "encoder_gradient_l2_distance": -0.03272353112697601,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0038864687085151672,
        "input_gradient_l2_distance": -0.014108595438301563,
        "input_gradient_dot_product": -0.004445265047252178
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7525996654142924,
      "val_r": 0.7391552716275007,
      "n_iterations": 478,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014290638267993927,
        "right_subspace_overlap_bottom_k": -0.017581820487976074,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.004876903723925352,
        "effective_rank": -0.0015727923018857837,
        "effective_rank_mergeability_score": 0.0023316596634685993,
        "stable_rank": -0.002273554913699627,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0014160670107230544,
        "layerwise_effective_rank": -0.004074912052601576,
        "layerwise_effective_rank_mergeability_score": 0.003375114407390356,
        "task_vector_cosine_similarity": -0.004311664029955864,
        "task_vector_l2_distance": -0.018005521968007088,
        "task_vector_dot_product": -0.002802510280162096,
        "weight_space_angle": 0.002506366465240717,
        "task_vector_magnitude_ratio": -0.0015196388121694326,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0018256640760228038,
        "right_subspace_overlap": 0.017304373905062675,
        "activation_l2_distance": -0.005916747730225325,
        "activation_cosine_similarity": 0.025627408176660538,
        "activation_magnitude_ratio": -0.0027990953531116247,
        "activation_dot_product": 0.01228634174913168,
        "encoder_gradient_cosine_similarity": 0.00622007017955184,
        "encoder_gradient_l2_distance": -0.0587986521422863,
        "encoder_gradient_dot_product": 0.0020890221931040287,
        "input_gradient_cosine_similarity": -0.00152248190715909,
        "input_gradient_l2_distance": -0.043945275247097015,
        "input_gradient_dot_product": -0.00805825088173151
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7259063729155306,
      "val_r": 0.49780274754581244,
      "n_iterations": 304,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.009785105474293232,
        "right_subspace_overlap_bottom_k": -0.0200701504945755,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.006183536723256111,
        "effective_rank": -0.0012233412126079202,
        "effective_rank_mergeability_score": 0.0012737842043861747,
        "stable_rank": -0.0013075992465019226,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0012396026868373156,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0015219768974930048,
        "task_vector_dot_product": -0.0026822444051504135,
        "weight_space_angle": -0.0012440318241715431,
        "task_vector_magnitude_ratio": -0.00120331603102386,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0034993065055459738,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.016480136662721634,
        "activation_magnitude_ratio": -0.0015140390023589134,
        "activation_dot_product": 0.003780159866437316,
        "encoder_gradient_cosine_similarity": 0.005221265833824873,
        "encoder_gradient_l2_distance": -0.01721865125000477,
        "encoder_gradient_dot_product": 0.0022854001726955175,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0179677065461874,
        "input_gradient_dot_product": -0.006860287860035896
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7060389098640025,
      "val_r": 0.2722380462033936,
      "n_iterations": 479,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.030054859817028046,
        "right_subspace_overlap_bottom_k": -0.02478799968957901,
        "interaction_matrix_overlap_top_k": -0.002422543242573738,
        "interaction_matrix_overlap_bottom_k": 0.004152490757405758,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0017252020770683885,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.001073662657290697,
        "layerwise_effective_rank_mergeability_score": 0.0021859491243958473,
        "task_vector_cosine_similarity": -0.010733035393059254,
        "task_vector_l2_distance": -0.014200001955032349,
        "task_vector_dot_product": -0.002910345559939742,
        "weight_space_angle": 0.010968262329697609,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0043721566908061504,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.024936897680163383,
        "activation_l2_distance": -0.011034197174012661,
        "activation_cosine_similarity": 0.029618892818689346,
        "activation_magnitude_ratio": -0.004215111956000328,
        "activation_dot_product": -0.0042027672752738,
        "encoder_gradient_cosine_similarity": 0.010568803176283836,
        "encoder_gradient_l2_distance": -0.06069960072636604,
        "encoder_gradient_dot_product": 0.0020332925487309694,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.038265760987997055,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7591427971681964,
      "val_r": 0.6189433560218425,
      "n_iterations": 187,
      "n_nonzero_coefficients": 22,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.017747929319739342,
        "right_subspace_overlap_bottom_k": -0.021278705447912216,
        "interaction_matrix_overlap_top_k": 0.0021786759607493877,
        "interaction_matrix_overlap_bottom_k": 0.0065699415281414986,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.001526752021163702,
        "spectral_gap": -0.0031862056348472834,
        "singular_value_ratio": 0.0027245250530540943,
        "layerwise_effective_rank": -0.004383462481200695,
        "layerwise_effective_rank_mergeability_score": 0.003994102589786053,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.004722667392343283,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0012491440866142511,
        "task_vector_magnitude_ratio": 0.0019025335786864161,
        "singular_value_overlap": -0.0019733207300305367,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.006208611186593771,
        "activation_l2_distance": -0.0044011203572154045,
        "activation_cosine_similarity": 0.017060110345482826,
        "activation_magnitude_ratio": -0.005756118334829807,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.004744283854961395,
        "encoder_gradient_l2_distance": -0.02991599589586258,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.004956371150910854,
        "input_gradient_l2_distance": -0.02839987352490425,
        "input_gradient_dot_product": -0.007848180830478668
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7349620442817367,
      "val_r": 0.6152144310905914,
      "n_iterations": 254,
      "n_nonzero_coefficients": 24,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.014216461218893528,
        "right_subspace_overlap_bottom_k": -0.023823179304599762,
        "interaction_matrix_overlap_top_k": 0.003184329252690077,
        "interaction_matrix_overlap_bottom_k": 0.003712557489052415,
        "effective_rank": -0.0033978791907429695,
        "effective_rank_mergeability_score": 0.0024487380869686604,
        "stable_rank": -0.0020762972999364138,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.002724051009863615,
        "layerwise_effective_rank_mergeability_score": 0.0033531985245645046,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.012868841178715229,
        "task_vector_dot_product": -0.006415230222046375,
        "weight_space_angle": -0.0022127665579319,
        "task_vector_magnitude_ratio": -0.0013413499109447002,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.022689227014780045,
        "activation_l2_distance": 0.00134569825604558,
        "activation_cosine_similarity": -0.0021292383316904306,
        "activation_magnitude_ratio": -0.005899706389755011,
        "activation_dot_product": -0.010568046011030674,
        "encoder_gradient_cosine_similarity": 0.008499148301780224,
        "encoder_gradient_l2_distance": -0.05076603963971138,
        "encoder_gradient_dot_product": 0.0010547306155785918,
        "input_gradient_cosine_similarity": 0.004541718401014805,
        "input_gradient_l2_distance": -0.053588271141052246,
        "input_gradient_dot_product": -0.002088692970573902
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7054484165480448,
      "val_r": 0.26136735414719764,
      "n_iterations": 310,
      "n_nonzero_coefficients": 27,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.012821526266634464,
        "right_subspace_overlap_bottom_k": -0.022019999101758003,
        "interaction_matrix_overlap_top_k": 0.005976258777081966,
        "interaction_matrix_overlap_bottom_k": -0.004340771585702896,
        "effective_rank": -0.004729022271931171,
        "effective_rank_mergeability_score": 0.005406461656093597,
        "stable_rank": -0.006539618596434593,
        "spectral_gap": 0.0023966648150235415,
        "singular_value_ratio": -0.003477207152172923,
        "layerwise_effective_rank": -0.0026298908051103354,
        "layerwise_effective_rank_mergeability_score": 0.002686650026589632,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.004734812304377556,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0020765839144587517,
        "task_vector_magnitude_ratio": -0.0030663474462926388,
        "singular_value_overlap": 0.0060920435935258865,
        "subspace_overlap": -0.002572115743532777,
        "right_subspace_overlap": 0.008638577535748482,
        "activation_l2_distance": -0.008787206374108791,
        "activation_cosine_similarity": 0.03005586937069893,
        "activation_magnitude_ratio": -0.005545899737626314,
        "activation_dot_product": 0.029498688876628876,
        "encoder_gradient_cosine_similarity": 0.00320868450216949,
        "encoder_gradient_l2_distance": -0.0375351645052433,
        "encoder_gradient_dot_product": 0.005873317830264568,
        "input_gradient_cosine_similarity": 0.0014119953848421574,
        "input_gradient_l2_distance": -0.041166406124830246,
        "input_gradient_dot_product": -0.009113937616348267
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.757778231678134,
      "val_r": 0.7140636247528799,
      "n_iterations": 209,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.016635656356811523,
        "right_subspace_overlap_bottom_k": -0.015986386686563492,
        "interaction_matrix_overlap_top_k": 0.00211039325222373,
        "interaction_matrix_overlap_bottom_k": 0.007080634590238333,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.001175688928924501,
        "task_vector_cosine_similarity": -0.008779001422226429,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.00446076737716794,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0011676839785650373,
        "right_subspace_overlap": 0.004299739375710487,
        "activation_l2_distance": 0.0038857818581163883,
        "activation_cosine_similarity": 0.016197286546230316,
        "activation_magnitude_ratio": -0.003487923415377736,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.002721168100833893,
        "encoder_gradient_l2_distance": -0.018344474956393242,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0018111434765160084,
        "input_gradient_l2_distance": -0.012977203354239464,
        "input_gradient_dot_product": -0.0054010022431612015
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7278187325872895,
      "val_r": 0.8183353100284848,
      "n_iterations": 362,
      "n_nonzero_coefficients": 21,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006364190950989723,
        "right_subspace_overlap_bottom_k": -0.019425740465521812,
        "interaction_matrix_overlap_top_k": 0.0018334193155169487,
        "interaction_matrix_overlap_bottom_k": 0.0016667958116158843,
        "effective_rank": -0.001490980852395296,
        "effective_rank_mergeability_score": 0.0015422215219587088,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.003506589448079467,
        "layerwise_effective_rank_mergeability_score": 0.0010039167245849967,
        "task_vector_cosine_similarity": 0.012441861443221569,
        "task_vector_l2_distance": -0.004098247736692429,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.008566705510020256,
        "activation_l2_distance": -0.007735807914286852,
        "activation_cosine_similarity": 0.023099595680832863,
        "activation_magnitude_ratio": -0.0028621808160096407,
        "activation_dot_product": 0.008074057288467884,
        "encoder_gradient_cosine_similarity": 0.0051712230779230595,
        "encoder_gradient_l2_distance": -0.058995574712753296,
        "encoder_gradient_dot_product": -0.0010496970498934388,
        "input_gradient_cosine_similarity": 0.0033295771572738886,
        "input_gradient_l2_distance": -0.043086856603622437,
        "input_gradient_dot_product": -0.007075058296322823
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7492601739327347,
      "val_r": 0.7859336855668348,
      "n_iterations": 253,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.021160941570997238,
        "right_subspace_overlap_bottom_k": -0.015317363664507866,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.001307524275034666,
        "layerwise_effective_rank": -0.002226038370281458,
        "layerwise_effective_rank_mergeability_score": 0.0021475672256201506,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.005956275388598442,
        "task_vector_dot_product": -0.0013219465035945177,
        "weight_space_angle": 0.002626296365633607,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0014109014300629497,
        "subspace_overlap": -0.0035646886099129915,
        "right_subspace_overlap": 0.009010427631437778,
        "activation_l2_distance": -0.007929421029984951,
        "activation_cosine_similarity": 0.021180855110287666,
        "activation_magnitude_ratio": -0.007386836223304272,
        "activation_dot_product": 0.0031920447945594788,
        "encoder_gradient_cosine_similarity": 0.0028589414432644844,
        "encoder_gradient_l2_distance": -0.06026922166347504,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0022507542744278908,
        "input_gradient_l2_distance": -0.028379365801811218,
        "input_gradient_dot_product": -0.00940703321248293
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.746111195906735,
      "val_r": 0.7806589203106321,
      "n_iterations": 341,
      "n_nonzero_coefficients": 18,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.006757151335477829,
        "right_subspace_overlap_bottom_k": -0.019720816984772682,
        "interaction_matrix_overlap_top_k": -0.00109042227268219,
        "interaction_matrix_overlap_bottom_k": 0.0011011767201125622,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010852421401068568,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.003485080087557435,
        "weight_space_angle": 0.0017584264278411865,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.0,
        "subspace_overlap": -0.0015870778588578105,
        "right_subspace_overlap": 0.018559304997324944,
        "activation_l2_distance": 0.0010629722382873297,
        "activation_cosine_similarity": 0.0188126303255558,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.002221245551481843,
        "encoder_gradient_cosine_similarity": 0.005323193501681089,
        "encoder_gradient_l2_distance": -0.03288792446255684,
        "encoder_gradient_dot_product": 0.0010024562943726778,
        "input_gradient_cosine_similarity": 0.0017165795434266329,
        "input_gradient_l2_distance": -0.01384043786674738,
        "input_gradient_dot_product": -0.008036444894969463
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7525361574010614,
      "val_r": 0.42756164255633106,
      "n_iterations": 423,
      "n_nonzero_coefficients": 26,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.005229653790593147,
        "right_subspace_overlap_bottom_k": -0.01776239648461342,
        "interaction_matrix_overlap_top_k": 0.0016371412202715874,
        "interaction_matrix_overlap_bottom_k": -0.0017884373664855957,
        "effective_rank": -0.0021998626179993153,
        "effective_rank_mergeability_score": 0.0018167418893426657,
        "stable_rank": -0.0017287026857957244,
        "spectral_gap": 0.0017883226973935962,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.001267933053895831,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.008537495508790016,
        "task_vector_dot_product": -0.00513132568448782,
        "weight_space_angle": 0.005972873419523239,
        "task_vector_magnitude_ratio": -0.0016035446897149086,
        "singular_value_overlap": 0.009759016335010529,
        "subspace_overlap": -0.0016931984573602676,
        "right_subspace_overlap": 0.017752300947904587,
        "activation_l2_distance": 0.00311657995916903,
        "activation_cosine_similarity": 0.015923980623483658,
        "activation_magnitude_ratio": -0.005429686047136784,
        "activation_dot_product": 0.004836803302168846,
        "encoder_gradient_cosine_similarity": 0.0027307490818202496,
        "encoder_gradient_l2_distance": -0.02157631143927574,
        "encoder_gradient_dot_product": 0.004180391319096088,
        "input_gradient_cosine_similarity": 0.0022879166062921286,
        "input_gradient_l2_distance": -0.03157041594386101,
        "input_gradient_dot_product": -0.01736190728843212
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7518049289246553,
      "val_r": 0.7278667931551717,
      "n_iterations": 206,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.016549212858080864,
        "right_subspace_overlap_bottom_k": -0.013803927227854729,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0010129817528650165,
        "spectral_gap": 0.0012918879510834813,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0015972958644852042,
        "layerwise_effective_rank_mergeability_score": 0.0014201197773218155,
        "task_vector_cosine_similarity": -0.002141362288966775,
        "task_vector_l2_distance": -0.010634166188538074,
        "task_vector_dot_product": -0.001959742046892643,
        "weight_space_angle": 0.005505270790308714,
        "task_vector_magnitude_ratio": -0.001316078007221222,
        "singular_value_overlap": 0.0,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.01093937549740076,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.020296644419431686,
        "activation_magnitude_ratio": -0.007883104495704174,
        "activation_dot_product": 0.006282632239162922,
        "encoder_gradient_cosine_similarity": 0.006608420517295599,
        "encoder_gradient_l2_distance": -0.05440318211913109,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.027965735644102097,
        "input_gradient_dot_product": -0.007845163345336914
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7394327794364381,
      "val_r": 0.6074179170427889,
      "n_iterations": 196,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.015506061725318432,
        "right_subspace_overlap_bottom_k": -0.016460388898849487,
        "interaction_matrix_overlap_top_k": -0.0016651960322633386,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": -0.001115723280236125,
        "effective_rank_mergeability_score": 0.002087018918246031,
        "stable_rank": -0.0019379123114049435,
        "spectral_gap": 0.001872456632554531,
        "singular_value_ratio": -0.0013450533151626587,
        "layerwise_effective_rank": -0.002345075597986579,
        "layerwise_effective_rank_mergeability_score": 0.0033561561722308397,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.014298549853265285,
        "task_vector_dot_product": -0.002441608114168048,
        "weight_space_angle": 0.0011576928663998842,
        "task_vector_magnitude_ratio": -0.001702269073575735,
        "singular_value_overlap": 0.003908418584614992,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.010884804651141167,
        "activation_l2_distance": -0.004723794758319855,
        "activation_cosine_similarity": 0.02964034304022789,
        "activation_magnitude_ratio": -0.0020637144334614277,
        "activation_dot_product": 0.00542818196117878,
        "encoder_gradient_cosine_similarity": 0.00177172408439219,
        "encoder_gradient_l2_distance": -0.06673489511013031,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0018217565957456827,
        "input_gradient_l2_distance": -0.06397051364183426,
        "input_gradient_dot_product": -0.005294123664498329
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.793324840347617,
      "val_r": 0.3752508647756753,
      "n_iterations": 348,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.02648795396089554,
        "right_subspace_overlap_bottom_k": -0.026196200400590897,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": -0.0015534237027168274,
        "singular_value_ratio": 0.0011891598114743829,
        "layerwise_effective_rank": -0.0025411027017980814,
        "layerwise_effective_rank_mergeability_score": 0.0017523241695016623,
        "task_vector_cosine_similarity": -0.0014325263909995556,
        "task_vector_l2_distance": 0.0,
        "task_vector_dot_product": -0.0021872972138226032,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": 0.001958777429535985,
        "subspace_overlap": -0.0056177470833063126,
        "right_subspace_overlap": 0.011394129134714603,
        "activation_l2_distance": -0.0017049160087481141,
        "activation_cosine_similarity": 0.02136583812534809,
        "activation_magnitude_ratio": -0.0014903763076290488,
        "activation_dot_product": 0.005718467757105827,
        "encoder_gradient_cosine_similarity": 0.005513570737093687,
        "encoder_gradient_l2_distance": -0.05814121663570404,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0018379519460722804,
        "input_gradient_l2_distance": -0.022040730342268944,
        "input_gradient_dot_product": -0.008500522933900356
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8265824963423563,
      "val_r": 0.7064807919917905,
      "n_iterations": 248,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.003459973493590951,
        "right_subspace_overlap_bottom_k": -0.0012748793233186007,
        "interaction_matrix_overlap_top_k": -0.003330135252326727,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.002277329796925187,
        "spectral_gap": 0.0013750221114605665,
        "singular_value_ratio": -0.002032308140769601,
        "layerwise_effective_rank": -0.001395418425090611,
        "layerwise_effective_rank_mergeability_score": 0.002152122324332595,
        "task_vector_cosine_similarity": -0.001144513487815857,
        "task_vector_l2_distance": -0.0312536396086216,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.002463025040924549,
        "singular_value_overlap": -0.0034787904005497694,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.013982431031763554,
        "activation_magnitude_ratio": -0.003063442185521126,
        "activation_dot_product": 0.037977010011672974,
        "encoder_gradient_cosine_similarity": 0.0019272355129942298,
        "encoder_gradient_l2_distance": -0.06469450145959854,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.007832312025129795,
        "input_gradient_l2_distance": -0.058272115886211395,
        "input_gradient_dot_product": -0.0062330723740160465
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 0.3,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}