{
  "aggregate_metrics": {
    "train_r": 0.06762073080938706,
    "train_p": 0.00012241410671881924,
    "val_r": 0.20929188183147265,
    "val_p": 6.595653214996166e-05
  },
  "per_fold_stats": {
    "train_r_mean": 0.6733626207018186,
    "train_r_std": 0.1340944270521072,
    "val_r_mean": 0.5248547802954963,
    "val_r_std": 0.193619978441789
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 24.884315490722656,
    "right_subspace_overlap_bottom_k": -21.459972381591797,
    "interaction_matrix_overlap_top_k": 3.0477170944213867,
    "interaction_matrix_overlap_bottom_k": -7.693885803222656,
    "effective_rank": -15.861124038696289,
    "effective_rank_mergeability_score": -22.590986251831055,
    "stable_rank": -9.087815284729004,
    "spectral_gap": 7.006402492523193,
    "singular_value_ratio": -26.1436824798584,
    "layerwise_effective_rank": -11.62832260131836,
    "layerwise_effective_rank_mergeability_score": 7.374472618103027,
    "task_vector_cosine_similarity": 25.76519775390625,
    "task_vector_l2_distance": 7.5434722900390625,
    "task_vector_dot_product": 32.70201110839844,
    "weight_space_angle": 9.043668746948242,
    "task_vector_magnitude_ratio": 3.6100687980651855,
    "singular_value_overlap": 11.629496574401855,
    "subspace_overlap": -2.5813746452331543,
    "right_subspace_overlap": 41.547061920166016,
    "activation_l2_distance": -30.619190216064453,
    "activation_cosine_similarity": -1.3738325834274292,
    "activation_magnitude_ratio": -44.809852600097656,
    "activation_dot_product": 21.184139251708984,
    "encoder_gradient_cosine_similarity": -5.065914154052734,
    "encoder_gradient_l2_distance": -13.815847396850586,
    "encoder_gradient_dot_product": 21.24355697631836,
    "input_gradient_cosine_similarity": 44.986507415771484,
    "input_gradient_l2_distance": -38.55215072631836,
    "input_gradient_dot_product": -9.289923667907715
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 32.95955276489258,
    "right_subspace_overlap_bottom_k": 46.44782257080078,
    "interaction_matrix_overlap_top_k": 29.44813346862793,
    "interaction_matrix_overlap_bottom_k": 16.816421508789062,
    "effective_rank": 77.27819061279297,
    "effective_rank_mergeability_score": 63.721981048583984,
    "stable_rank": 31.414268493652344,
    "spectral_gap": 56.62427520751953,
    "singular_value_ratio": 115.57380676269531,
    "layerwise_effective_rank": 24.987619400024414,
    "layerwise_effective_rank_mergeability_score": 23.349567413330078,
    "task_vector_cosine_similarity": 59.6183967590332,
    "task_vector_l2_distance": 48.96830749511719,
    "task_vector_dot_product": 126.74755859375,
    "weight_space_angle": 87.50823211669922,
    "task_vector_magnitude_ratio": 36.96215057373047,
    "singular_value_overlap": 25.20598793029785,
    "subspace_overlap": 52.123573303222656,
    "right_subspace_overlap": 128.97915649414062,
    "activation_l2_distance": 87.27774810791016,
    "activation_cosine_similarity": 50.63249969482422,
    "activation_magnitude_ratio": 132.56715393066406,
    "activation_dot_product": 36.0350341796875,
    "encoder_gradient_cosine_similarity": 53.05628967285156,
    "encoder_gradient_l2_distance": 23.703792572021484,
    "encoder_gradient_dot_product": 74.05584716796875,
    "input_gradient_cosine_similarity": 157.1617431640625,
    "input_gradient_l2_distance": 66.33950805664062,
    "input_gradient_dot_product": 79.544677734375
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.23925290602500116,
      "val_r": 0.2247516161460303,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 127.35424041748047,
        "right_subspace_overlap_bottom_k": -182.4384307861328,
        "interaction_matrix_overlap_top_k": -111.6633529663086,
        "interaction_matrix_overlap_bottom_k": 36.77713394165039,
        "effective_rank": -343.91339111328125,
        "effective_rank_mergeability_score": -260.2033996582031,
        "stable_rank": -131.6728515625,
        "spectral_gap": -115.93846893310547,
        "singular_value_ratio": -527.0239868164062,
        "layerwise_effective_rank": -101.80789947509766,
        "layerwise_effective_rank_mergeability_score": 62.307769775390625,
        "task_vector_cosine_similarity": 216.36102294921875,
        "task_vector_l2_distance": 214.16128540039062,
        "task_vector_dot_product": 579.715576171875,
        "weight_space_angle": 367.043212890625,
        "task_vector_magnitude_ratio": -79.28584289550781,
        "singular_value_overlap": 74.56094360351562,
        "subspace_overlap": -204.81365966796875,
        "right_subspace_overlap": 598.2108764648438,
        "activation_l2_distance": -394.7183532714844,
        "activation_cosine_similarity": -216.69154357910156,
        "activation_magnitude_ratio": -607.103271484375,
        "activation_dot_product": 113.10712432861328,
        "encoder_gradient_cosine_similarity": -155.06605529785156,
        "encoder_gradient_l2_distance": -20.031641006469727,
        "encoder_gradient_dot_product": 319.9499206542969,
        "input_gradient_cosine_similarity": 725.0942993164062,
        "input_gradient_l2_distance": -279.2798156738281,
        "input_gradient_dot_product": 298.00927734375
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6434745784728482,
      "val_r": 0.6722095547466627,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 64.07221984863281,
        "right_subspace_overlap_bottom_k": -40.30537796020508,
        "interaction_matrix_overlap_top_k": -3.7938578128814697,
        "interaction_matrix_overlap_bottom_k": -50.694480895996094,
        "effective_rank": 13.6593599319458,
        "effective_rank_mergeability_score": 32.96051788330078,
        "stable_rank": 35.16752243041992,
        "spectral_gap": 8.17874526977539,
        "singular_value_ratio": -1.4566837549209595,
        "layerwise_effective_rank": -25.090978622436523,
        "layerwise_effective_rank_mergeability_score": -23.205686569213867,
        "task_vector_cosine_similarity": 30.59787940979004,
        "task_vector_l2_distance": -7.457367897033691,
        "task_vector_dot_product": -15.233421325683594,
        "weight_space_angle": -28.223712921142578,
        "task_vector_magnitude_ratio": -17.350400924682617,
        "singular_value_overlap": 63.35697937011719,
        "subspace_overlap": 14.083162307739258,
        "right_subspace_overlap": 55.71683883666992,
        "activation_l2_distance": -30.248741149902344,
        "activation_cosine_similarity": 29.277217864990234,
        "activation_magnitude_ratio": -52.70260238647461,
        "activation_dot_product": 41.99921798706055,
        "encoder_gradient_cosine_similarity": 39.02511978149414,
        "encoder_gradient_l2_distance": -80.88614654541016,
        "encoder_gradient_dot_product": 73.18103790283203,
        "input_gradient_cosine_similarity": -14.276061058044434,
        "input_gradient_l2_distance": -61.58708572387695,
        "input_gradient_dot_product": -47.76481628417969
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6226408182523073,
      "val_r": 0.5024401938820509,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 69.56302642822266,
        "right_subspace_overlap_bottom_k": -99.68254852294922,
        "interaction_matrix_overlap_top_k": 27.145750045776367,
        "interaction_matrix_overlap_bottom_k": -17.08823585510254,
        "effective_rank": 41.72834396362305,
        "effective_rank_mergeability_score": -52.991943359375,
        "stable_rank": -25.806425094604492,
        "spectral_gap": 48.041969299316406,
        "singular_value_ratio": -38.59965896606445,
        "layerwise_effective_rank": -43.602691650390625,
        "layerwise_effective_rank_mergeability_score": -18.60411834716797,
        "task_vector_cosine_similarity": 20.29659080505371,
        "task_vector_l2_distance": 4.696615695953369,
        "task_vector_dot_product": 66.8129653930664,
        "weight_space_angle": -2.364809513092041,
        "task_vector_magnitude_ratio": 20.20966339111328,
        "singular_value_overlap": -8.018401145935059,
        "subspace_overlap": 25.586151123046875,
        "right_subspace_overlap": 53.13404846191406,
        "activation_l2_distance": -47.604488372802734,
        "activation_cosine_similarity": 22.591943740844727,
        "activation_magnitude_ratio": -52.48531723022461,
        "activation_dot_product": 42.28086471557617,
        "encoder_gradient_cosine_similarity": 54.90537643432617,
        "encoder_gradient_l2_distance": 11.237345695495605,
        "encoder_gradient_dot_product": 6.233688831329346,
        "input_gradient_cosine_similarity": 75.55892944335938,
        "input_gradient_l2_distance": -91.04486846923828,
        "input_gradient_dot_product": -91.13141632080078
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6857949778779433,
      "val_r": 0.5982993708474039,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 54.303401947021484,
        "right_subspace_overlap_bottom_k": -34.52175521850586,
        "interaction_matrix_overlap_top_k": 18.29440689086914,
        "interaction_matrix_overlap_bottom_k": -25.952613830566406,
        "effective_rank": 7.1328959465026855,
        "effective_rank_mergeability_score": -11.335429191589355,
        "stable_rank": -41.482852935791016,
        "spectral_gap": -0.6595717072486877,
        "singular_value_ratio": -5.565253257751465,
        "layerwise_effective_rank": 22.524808883666992,
        "layerwise_effective_rank_mergeability_score": 16.07476043701172,
        "task_vector_cosine_similarity": 21.609130859375,
        "task_vector_l2_distance": 5.992469310760498,
        "task_vector_dot_product": 7.159867286682129,
        "weight_space_angle": 9.77334213256836,
        "task_vector_magnitude_ratio": 13.98493480682373,
        "singular_value_overlap": 1.298306941986084,
        "subspace_overlap": -8.99168586730957,
        "right_subspace_overlap": 14.102063179016113,
        "activation_l2_distance": -29.341039657592773,
        "activation_cosine_similarity": 8.842524528503418,
        "activation_magnitude_ratio": -16.824228286743164,
        "activation_dot_product": 20.071557998657227,
        "encoder_gradient_cosine_similarity": 24.13075065612793,
        "encoder_gradient_l2_distance": -22.68610191345215,
        "encoder_gradient_dot_product": 30.538715362548828,
        "input_gradient_cosine_similarity": 13.41684341430664,
        "input_gradient_l2_distance": -43.50356674194336,
        "input_gradient_dot_product": -47.3882942199707
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6873814037134065,
      "val_r": 0.6221196247903374,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 31.05036163330078,
        "right_subspace_overlap_bottom_k": -24.545482635498047,
        "interaction_matrix_overlap_top_k": -0.6448614001274109,
        "interaction_matrix_overlap_bottom_k": -29.190765380859375,
        "effective_rank": -6.48896598815918,
        "effective_rank_mergeability_score": 33.11677169799805,
        "stable_rank": 9.82072925567627,
        "spectral_gap": -1.0253126621246338,
        "singular_value_ratio": 17.996749877929688,
        "layerwise_effective_rank": -26.231990814208984,
        "layerwise_effective_rank_mergeability_score": -10.92776870727539,
        "task_vector_cosine_similarity": 18.35593032836914,
        "task_vector_l2_distance": -19.402463912963867,
        "task_vector_dot_product": -32.04058837890625,
        "weight_space_angle": -30.47498321533203,
        "task_vector_magnitude_ratio": 14.213591575622559,
        "singular_value_overlap": 0.7868310213088989,
        "subspace_overlap": 38.73748779296875,
        "right_subspace_overlap": 26.283674240112305,
        "activation_l2_distance": -0.7049641013145447,
        "activation_cosine_similarity": 16.665109634399414,
        "activation_magnitude_ratio": -7.323365211486816,
        "activation_dot_product": 31.524412155151367,
        "encoder_gradient_cosine_similarity": 37.9456672668457,
        "encoder_gradient_l2_distance": -66.07475280761719,
        "encoder_gradient_dot_product": 16.59861946105957,
        "input_gradient_cosine_similarity": 45.00920867919922,
        "input_gradient_l2_distance": -41.56461715698242,
        "input_gradient_dot_product": -40.46586227416992
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7076448078980143,
      "val_r": 0.6935167600691494,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 8.636240005493164,
        "right_subspace_overlap_bottom_k": 0.4280291199684143,
        "interaction_matrix_overlap_top_k": 7.078511714935303,
        "interaction_matrix_overlap_bottom_k": -16.5725040435791,
        "effective_rank": 11.125869750976562,
        "effective_rank_mergeability_score": 0.33992800116539,
        "stable_rank": -15.522315979003906,
        "spectral_gap": 1.6963428258895874,
        "singular_value_ratio": -6.607046604156494,
        "layerwise_effective_rank": 5.2742462158203125,
        "layerwise_effective_rank_mergeability_score": 6.326724529266357,
        "task_vector_cosine_similarity": -10.926033020019531,
        "task_vector_l2_distance": -2.955540895462036,
        "task_vector_dot_product": 5.441878795623779,
        "weight_space_angle": 0.6186132431030273,
        "task_vector_magnitude_ratio": 11.8377103805542,
        "singular_value_overlap": -0.5274502635002136,
        "subspace_overlap": -0.8194308280944824,
        "right_subspace_overlap": 9.36811351776123,
        "activation_l2_distance": -2.959779977798462,
        "activation_cosine_similarity": 11.335348129272461,
        "activation_magnitude_ratio": -4.032323360443115,
        "activation_dot_product": 0.07700438797473907,
        "encoder_gradient_cosine_similarity": 6.834955215454102,
        "encoder_gradient_l2_distance": -8.793572425842285,
        "encoder_gradient_dot_product": 5.3961873054504395,
        "input_gradient_cosine_similarity": 4.8656463623046875,
        "input_gradient_l2_distance": -21.58478546142578,
        "input_gradient_dot_product": -4.381931781768799
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.73981379173495,
      "val_r": 0.45242760597835013,
      "n_iterations": 141,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.7699074745178223,
        "right_subspace_overlap_bottom_k": -1.1173579692840576,
        "interaction_matrix_overlap_top_k": 0.5349670052528381,
        "interaction_matrix_overlap_bottom_k": -0.5510883331298828,
        "effective_rank": 0.13293275237083435,
        "effective_rank_mergeability_score": 0.7911407351493835,
        "stable_rank": 0.6953656077384949,
        "spectral_gap": 0.020535891875624657,
        "singular_value_ratio": 0.06829451769590378,
        "layerwise_effective_rank": -0.48424237966537476,
        "layerwise_effective_rank_mergeability_score": -0.1809912770986557,
        "task_vector_cosine_similarity": -0.26550188660621643,
        "task_vector_l2_distance": -0.26322105526924133,
        "task_vector_dot_product": 0.45814943313598633,
        "weight_space_angle": 0.8337037563323975,
        "task_vector_magnitude_ratio": -0.24711397290229797,
        "singular_value_overlap": 0.2662428021430969,
        "subspace_overlap": 0.4299635589122772,
        "right_subspace_overlap": 1.0451297760009766,
        "activation_l2_distance": -0.28075966238975525,
        "activation_cosine_similarity": 0.7884235978126526,
        "activation_magnitude_ratio": 0.18076208233833313,
        "activation_dot_product": 0.6293318271636963,
        "encoder_gradient_cosine_similarity": 0.5946068167686462,
        "encoder_gradient_l2_distance": -2.039778232574463,
        "encoder_gradient_dot_product": 0.6790871620178223,
        "input_gradient_cosine_similarity": 0.09091829508543015,
        "input_gradient_l2_distance": -1.4285989999771118,
        "input_gradient_dot_product": -1.1611617803573608
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7041155419836922,
      "val_r": 0.18917142295978331,
      "n_iterations": 59,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9155734777450562,
        "right_subspace_overlap_bottom_k": -0.8275137543678284,
        "interaction_matrix_overlap_top_k": 0.8991342782974243,
        "interaction_matrix_overlap_bottom_k": -0.19357751309871674,
        "effective_rank": 0.16907311975955963,
        "effective_rank_mergeability_score": -0.06883111596107483,
        "stable_rank": -0.12730573117733002,
        "spectral_gap": 0.05041274428367615,
        "singular_value_ratio": -0.07511613517999649,
        "layerwise_effective_rank": -0.43417420983314514,
        "layerwise_effective_rank_mergeability_score": 0.003245874308049679,
        "task_vector_cosine_similarity": -0.27134817838668823,
        "task_vector_l2_distance": -0.36441361904144287,
        "task_vector_dot_product": -0.092891626060009,
        "weight_space_angle": 0.7087284326553345,
        "task_vector_magnitude_ratio": 0.19382190704345703,
        "singular_value_overlap": 0.05160750076174736,
        "subspace_overlap": 0.020392518490552902,
        "right_subspace_overlap": 0.2828637659549713,
        "activation_l2_distance": 0.09882120043039322,
        "activation_cosine_similarity": 0.6887824535369873,
        "activation_magnitude_ratio": -0.1404074728488922,
        "activation_dot_product": 0.43366768956184387,
        "encoder_gradient_cosine_similarity": 0.5866646766662598,
        "encoder_gradient_l2_distance": -1.4749444723129272,
        "encoder_gradient_dot_product": 0.0059649888426065445,
        "input_gradient_cosine_similarity": 0.389996200799942,
        "input_gradient_l2_distance": -0.867777943611145,
        "input_gradient_dot_product": 0.41774997115135193
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6611514993942484,
      "val_r": 0.2845317481808859,
      "n_iterations": 65,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9032111167907715,
        "right_subspace_overlap_bottom_k": -0.7185025811195374,
        "interaction_matrix_overlap_top_k": 0.4112814962863922,
        "interaction_matrix_overlap_bottom_k": -1.789451003074646,
        "effective_rank": -0.661988377571106,
        "effective_rank_mergeability_score": 0.43908771872520447,
        "stable_rank": -0.30945417284965515,
        "spectral_gap": 0.26203370094299316,
        "singular_value_ratio": -0.2572682201862335,
        "layerwise_effective_rank": -0.07503525912761688,
        "layerwise_effective_rank_mergeability_score": 0.43358877301216125,
        "task_vector_cosine_similarity": 1.0728563070297241,
        "task_vector_l2_distance": -0.24519076943397522,
        "task_vector_dot_product": 1.182340383529663,
        "weight_space_angle": -0.7361633777618408,
        "task_vector_magnitude_ratio": 1.0100852251052856,
        "singular_value_overlap": 1.012120246887207,
        "subspace_overlap": 0.48019614815711975,
        "right_subspace_overlap": 0.10240466147661209,
        "activation_l2_distance": -0.715368926525116,
        "activation_cosine_similarity": 0.8281897306442261,
        "activation_magnitude_ratio": -0.30201515555381775,
        "activation_dot_product": 0.3277387320995331,
        "encoder_gradient_cosine_similarity": 1.6306371688842773,
        "encoder_gradient_l2_distance": -1.9469280242919922,
        "encoder_gradient_dot_product": 0.262407511472702,
        "input_gradient_cosine_similarity": 0.8292235136032104,
        "input_gradient_l2_distance": -1.0104800462722778,
        "input_gradient_dot_product": -1.435254693031311
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6874796835288821,
      "val_r": 0.3035074977116192,
      "n_iterations": 115,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.6008601188659668,
        "right_subspace_overlap_bottom_k": -1.5680617094039917,
        "interaction_matrix_overlap_top_k": 2.22902512550354,
        "interaction_matrix_overlap_bottom_k": -0.572513997554779,
        "effective_rank": -0.08868866413831711,
        "effective_rank_mergeability_score": 0.081169992685318,
        "stable_rank": 0.14697659015655518,
        "spectral_gap": -0.3211546540260315,
        "singular_value_ratio": 0.554809033870697,
        "layerwise_effective_rank": -0.5035936832427979,
        "layerwise_effective_rank_mergeability_score": 0.6278828382492065,
        "task_vector_cosine_similarity": -0.25908026099205017,
        "task_vector_l2_distance": -0.2426154613494873,
        "task_vector_dot_product": -0.6649947762489319,
        "weight_space_angle": -0.2186991423368454,
        "task_vector_magnitude_ratio": -0.36448797583580017,
        "singular_value_overlap": 0.13284309208393097,
        "subspace_overlap": 0.4471115171909332,
        "right_subspace_overlap": 1.0604121685028076,
        "activation_l2_distance": 1.0661523342132568,
        "activation_cosine_similarity": -0.23339277505874634,
        "activation_magnitude_ratio": -0.09616749733686447,
        "activation_dot_product": -0.08327040076255798,
        "encoder_gradient_cosine_similarity": 1.1260625123977661,
        "encoder_gradient_l2_distance": -0.9648225903511047,
        "encoder_gradient_dot_product": 0.5627781748771667,
        "input_gradient_cosine_similarity": 1.192668080329895,
        "input_gradient_l2_distance": -1.409943699836731,
        "input_gradient_dot_product": -1.2500451803207397
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7075210981913744,
      "val_r": 0.6494772937232739,
      "n_iterations": 71,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.849783718585968,
        "right_subspace_overlap_bottom_k": -1.6811699867248535,
        "interaction_matrix_overlap_top_k": 0.608317494392395,
        "interaction_matrix_overlap_bottom_k": 0.1609870344400406,
        "effective_rank": 0.14913706481456757,
        "effective_rank_mergeability_score": 0.9470020532608032,
        "stable_rank": -0.5667574405670166,
        "spectral_gap": -0.6961559057235718,
        "singular_value_ratio": 0.2968251705169678,
        "layerwise_effective_rank": 0.08221685886383057,
        "layerwise_effective_rank_mergeability_score": -0.7092695236206055,
        "task_vector_cosine_similarity": 0.7764800786972046,
        "task_vector_l2_distance": -0.16994552314281464,
        "task_vector_dot_product": 0.0558515228331089,
        "weight_space_angle": 0.27493831515312195,
        "task_vector_magnitude_ratio": -0.6638532280921936,
        "singular_value_overlap": 0.3797178864479065,
        "subspace_overlap": -0.9994086623191833,
        "right_subspace_overlap": 1.3085006475448608,
        "activation_l2_distance": -0.2176164984703064,
        "activation_cosine_similarity": 0.15761955082416534,
        "activation_magnitude_ratio": 0.2751356065273285,
        "activation_dot_product": 1.6723816394805908,
        "encoder_gradient_cosine_similarity": 0.8058951497077942,
        "encoder_gradient_l2_distance": -1.243109941482544,
        "encoder_gradient_dot_product": 0.8674684762954712,
        "input_gradient_cosine_similarity": 0.853083610534668,
        "input_gradient_l2_distance": -1.7242416143417358,
        "input_gradient_dot_product": -0.8681021928787231
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7591502907654646,
      "val_r": 0.7680740780244809,
      "n_iterations": 91,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.3437700867652893,
        "right_subspace_overlap_bottom_k": -0.3975973129272461,
        "interaction_matrix_overlap_top_k": 0.04639299213886261,
        "interaction_matrix_overlap_bottom_k": -0.01765214093029499,
        "effective_rank": -0.20751510560512543,
        "effective_rank_mergeability_score": 0.3763871192932129,
        "stable_rank": 0.21192635595798492,
        "spectral_gap": 0.07759561389684677,
        "singular_value_ratio": 0.09700508415699005,
        "layerwise_effective_rank": 0.15822294354438782,
        "layerwise_effective_rank_mergeability_score": -0.2302260547876358,
        "task_vector_cosine_similarity": 0.06512743979692459,
        "task_vector_l2_distance": -0.10832186043262482,
        "task_vector_dot_product": -0.13964006304740906,
        "weight_space_angle": 0.7257473468780518,
        "task_vector_magnitude_ratio": -0.08121373504400253,
        "singular_value_overlap": 0.033313628286123276,
        "subspace_overlap": 0.1466786116361618,
        "right_subspace_overlap": 0.5023790001869202,
        "activation_l2_distance": 0.12574809789657593,
        "activation_cosine_similarity": 0.3623616397380829,
        "activation_magnitude_ratio": -0.11612977832555771,
        "activation_dot_product": 0.30725398659706116,
        "encoder_gradient_cosine_similarity": 0.1683080494403839,
        "encoder_gradient_l2_distance": -0.8285135626792908,
        "encoder_gradient_dot_product": 0.02580903470516205,
        "input_gradient_cosine_similarity": 0.10953158140182495,
        "input_gradient_l2_distance": -0.48981863260269165,
        "input_gradient_dot_product": -0.26951852440834045
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7473277970129775,
      "val_r": 0.679194889843433,
      "n_iterations": 975,
      "coefficients": {
        "right_subspace_overlap_top_k": 39.09723663330078,
        "right_subspace_overlap_bottom_k": -41.8505859375,
        "interaction_matrix_overlap_top_k": 17.23818588256836,
        "interaction_matrix_overlap_bottom_k": -2.5497007369995117,
        "effective_rank": 16.29368782043457,
        "effective_rank_mergeability_score": -55.64943313598633,
        "stable_rank": 1.7963417768478394,
        "spectral_gap": -11.262704849243164,
        "singular_value_ratio": 15.086113929748535,
        "layerwise_effective_rank": -14.251962661743164,
        "layerwise_effective_rank_mergeability_score": 60.53445816040039,
        "task_vector_cosine_similarity": 14.993026733398438,
        "task_vector_l2_distance": 9.654321670532227,
        "task_vector_dot_product": 10.492091178894043,
        "weight_space_angle": 4.8175859451293945,
        "task_vector_magnitude_ratio": -32.16069793701172,
        "singular_value_overlap": 2.1692898273468018,
        "subspace_overlap": -28.220413208007812,
        "right_subspace_overlap": 7.142767906188965,
        "activation_l2_distance": 3.9579951763153076,
        "activation_cosine_similarity": 35.98514175415039,
        "activation_magnitude_ratio": -0.12744836509227753,
        "activation_dot_product": 9.646368026733398,
        "encoder_gradient_cosine_similarity": 23.600717544555664,
        "encoder_gradient_l2_distance": -47.62245559692383,
        "encoder_gradient_dot_product": 26.780574798583984,
        "input_gradient_cosine_similarity": 8.144096374511719,
        "input_gradient_l2_distance": -31.991838455200195,
        "input_gradient_dot_product": -40.74441909790039
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5610457450708299,
      "val_r": 0.6616948031047553,
      "n_iterations": 440,
      "coefficients": {
        "right_subspace_overlap_top_k": 29.46262550354004,
        "right_subspace_overlap_bottom_k": -26.764965057373047,
        "interaction_matrix_overlap_top_k": 35.585716247558594,
        "interaction_matrix_overlap_bottom_k": -16.548751831054688,
        "effective_rank": 0.27155590057373047,
        "effective_rank_mergeability_score": -7.145925045013428,
        "stable_rank": -5.016761779785156,
        "spectral_gap": 1.5819792747497559,
        "singular_value_ratio": -1.421423316001892,
        "layerwise_effective_rank": -23.068140029907227,
        "layerwise_effective_rank_mergeability_score": -9.470718383789062,
        "task_vector_cosine_similarity": 27.943889617919922,
        "task_vector_l2_distance": 3.8456673622131348,
        "task_vector_dot_product": 2.9749977588653564,
        "weight_space_angle": -20.799686431884766,
        "task_vector_magnitude_ratio": 6.798483371734619,
        "singular_value_overlap": 16.29107093811035,
        "subspace_overlap": 13.301338195800781,
        "right_subspace_overlap": -3.0214078426361084,
        "activation_l2_distance": -5.665212631225586,
        "activation_cosine_similarity": 20.00644302368164,
        "activation_magnitude_ratio": -19.5922794342041,
        "activation_dot_product": 12.691991806030273,
        "encoder_gradient_cosine_similarity": 11.600971221923828,
        "encoder_gradient_l2_distance": -20.144163131713867,
        "encoder_gradient_dot_product": 17.672109603881836,
        "input_gradient_cosine_similarity": 13.05931568145752,
        "input_gradient_l2_distance": -6.367824554443359,
        "input_gradient_dot_product": -47.06427764892578
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.41140657017776056,
      "val_r": 0.6016504052129641,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 46.497135162353516,
        "right_subspace_overlap_bottom_k": 52.526817321777344,
        "interaction_matrix_overlap_top_k": 41.252864837646484,
        "interaction_matrix_overlap_bottom_k": -21.712142944335938,
        "effective_rank": -61.31068801879883,
        "effective_rank_mergeability_score": -123.95664978027344,
        "stable_rank": -7.672507286071777,
        "spectral_gap": 221.31942749023438,
        "singular_value_ratio": 29.602807998657227,
        "layerwise_effective_rank": -9.665542602539062,
        "layerwise_effective_rank_mergeability_score": 54.69191360473633,
        "task_vector_cosine_similarity": 184.9276885986328,
        "task_vector_l2_distance": -51.021270751953125,
        "task_vector_dot_product": 26.30358123779297,
        "weight_space_angle": -132.95205688476562,
        "task_vector_magnitude_ratio": 137.67288208007812,
        "singular_value_overlap": 73.9106216430664,
        "subspace_overlap": 95.34403991699219,
        "right_subspace_overlap": 45.410213470458984,
        "activation_l2_distance": -105.80281066894531,
        "activation_cosine_similarity": 23.224315643310547,
        "activation_magnitude_ratio": -129.4638671875,
        "activation_dot_product": 128.7861785888672,
        "encoder_gradient_cosine_similarity": -159.32366943359375,
        "encoder_gradient_l2_distance": 7.980257034301758,
        "encoder_gradient_dot_product": -91.63580322265625,
        "input_gradient_cosine_similarity": 15.446955680847168,
        "input_gradient_l2_distance": -144.76321411132812,
        "input_gradient_dot_product": -144.61917114257812
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7493999374509545,
      "val_r": 0.16978391550272715,
      "n_iterations": 72,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.119483470916748,
        "right_subspace_overlap_bottom_k": -0.3556704819202423,
        "interaction_matrix_overlap_top_k": 0.2422262281179428,
        "interaction_matrix_overlap_bottom_k": -0.6515368819236755,
        "effective_rank": -0.10158874839544296,
        "effective_rank_mergeability_score": -0.26464492082595825,
        "stable_rank": 0.42719271779060364,
        "spectral_gap": -0.2526293992996216,
        "singular_value_ratio": -0.2091764658689499,
        "layerwise_effective_rank": 0.19430990517139435,
        "layerwise_effective_rank_mergeability_score": 1.0957192182540894,
        "task_vector_cosine_similarity": -1.2836675643920898,
        "task_vector_l2_distance": -0.3903203308582306,
        "task_vector_dot_product": 0.18650932610034943,
        "weight_space_angle": 0.2522994577884674,
        "task_vector_magnitude_ratio": -0.06457820534706116,
        "singular_value_overlap": 0.5337981581687927,
        "subspace_overlap": -0.16396547853946686,
        "right_subspace_overlap": 0.7830299139022827,
        "activation_l2_distance": 0.4578520953655243,
        "activation_cosine_similarity": 0.5662717223167419,
        "activation_magnitude_ratio": -0.23622985184192657,
        "activation_dot_product": 0.659055769443512,
        "encoder_gradient_cosine_similarity": 0.34124255180358887,
        "encoder_gradient_l2_distance": -0.7962387204170227,
        "encoder_gradient_dot_product": 0.2908035218715668,
        "input_gradient_cosine_similarity": 0.12650062143802643,
        "input_gradient_l2_distance": -0.5496680736541748,
        "input_gradient_dot_product": -0.9707018136978149
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8026072038539378,
      "val_r": 0.7377123302860715,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9032939672470093,
        "right_subspace_overlap_bottom_k": -2.4874258041381836,
        "interaction_matrix_overlap_top_k": -1.2124449014663696,
        "interaction_matrix_overlap_bottom_k": 2.323878288269043,
        "effective_rank": 0.1543564349412918,
        "effective_rank_mergeability_score": -0.6518359780311584,
        "stable_rank": -0.590928316116333,
        "spectral_gap": 0.40852922201156616,
        "singular_value_ratio": 1.0182034969329834,
        "layerwise_effective_rank": 0.09897878021001816,
        "layerwise_effective_rank_mergeability_score": 0.4616360366344452,
        "task_vector_cosine_similarity": 0.38520750403404236,
        "task_vector_l2_distance": -0.032960232347249985,
        "task_vector_dot_product": 0.10436335951089859,
        "weight_space_angle": 0.24889568984508514,
        "task_vector_magnitude_ratio": -0.49951064586639404,
        "singular_value_overlap": -0.07896458357572556,
        "subspace_overlap": 0.0336008183658123,
        "right_subspace_overlap": 0.301971435546875,
        "activation_l2_distance": 0.4175616204738617,
        "activation_cosine_similarity": 0.8361676931381226,
        "activation_magnitude_ratio": -0.037523671984672546,
        "activation_dot_product": -0.17516113817691803,
        "encoder_gradient_cosine_similarity": 0.10250120609998703,
        "encoder_gradient_l2_distance": -0.5326786041259766,
        "encoder_gradient_dot_product": 0.07825181633234024,
        "input_gradient_cosine_similarity": 0.07171262055635452,
        "input_gradient_l2_distance": -0.4895794093608856,
        "input_gradient_dot_product": -0.16245177388191223
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7233172155163802,
      "val_r": 0.5492343754722641,
      "n_iterations": 795,
      "coefficients": {
        "right_subspace_overlap_top_k": 19.872190475463867,
        "right_subspace_overlap_bottom_k": -21.850849151611328,
        "interaction_matrix_overlap_top_k": 25.49608612060547,
        "interaction_matrix_overlap_bottom_k": -7.842594146728516,
        "effective_rank": 4.820370674133301,
        "effective_rank_mergeability_score": -8.692955017089844,
        "stable_rank": -1.1797090768814087,
        "spectral_gap": -13.141901016235352,
        "singular_value_ratio": -7.901671409606934,
        "layerwise_effective_rank": -15.60545825958252,
        "layerwise_effective_rank_mergeability_score": 7.6750102043151855,
        "task_vector_cosine_similarity": -8.517085075378418,
        "task_vector_l2_distance": -4.495692253112793,
        "task_vector_dot_product": 0.7370977997779846,
        "weight_space_angle": 10.342206954956055,
        "task_vector_magnitude_ratio": -3.740631341934204,
        "singular_value_overlap": 6.065938949584961,
        "subspace_overlap": 4.526862144470215,
        "right_subspace_overlap": 18.568073272705078,
        "activation_l2_distance": 0.3794146776199341,
        "activation_cosine_similarity": 16.29234504699707,
        "activation_magnitude_ratio": -5.894582748413086,
        "activation_dot_product": 18.973072052001953,
        "encoder_gradient_cosine_similarity": 8.900983810424805,
        "encoder_gradient_l2_distance": -16.430513381958008,
        "encoder_gradient_dot_product": 16.82478141784668,
        "input_gradient_cosine_similarity": 9.440776824951172,
        "input_gradient_l2_distance": -39.3199577331543,
        "input_gradient_dot_product": -13.30354118347168
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7903641853827186,
      "val_r": 0.38080333691621676,
      "n_iterations": 248,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.0775235891342163,
        "right_subspace_overlap_bottom_k": -0.8233262896537781,
        "interaction_matrix_overlap_top_k": 0.9351122975349426,
        "interaction_matrix_overlap_bottom_k": -1.391465187072754,
        "effective_rank": -0.5199460387229919,
        "effective_rank_mergeability_score": 0.2458709329366684,
        "stable_rank": 0.0974542498588562,
        "spectral_gap": 1.1277797222137451,
        "singular_value_ratio": 0.7689056396484375,
        "layerwise_effective_rank": 0.18816423416137695,
        "layerwise_effective_rank_mergeability_score": 0.33364054560661316,
        "task_vector_cosine_similarity": -0.46185269951820374,
        "task_vector_l2_distance": 0.15712344646453857,
        "task_vector_dot_product": 0.12731827795505524,
        "weight_space_angle": 0.4547654390335083,
        "task_vector_magnitude_ratio": 0.9358758926391602,
        "singular_value_overlap": 0.42950740456581116,
        "subspace_overlap": -0.931079089641571,
        "right_subspace_overlap": 1.3593658208847046,
        "activation_l2_distance": -0.7377641201019287,
        "activation_cosine_similarity": 0.6567741632461548,
        "activation_magnitude_ratio": -0.1435939073562622,
        "activation_dot_product": 0.38473695516586304,
        "encoder_gradient_cosine_similarity": 0.6903642416000366,
        "encoder_gradient_l2_distance": -2.1602578163146973,
        "encoder_gradient_dot_product": 0.4673323631286621,
        "input_gradient_cosine_similarity": 0.2165251225233078,
        "input_gradient_l2_distance": -1.4631825685501099,
        "input_gradient_dot_product": -1.0229651927947998
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8363623617326801,
      "val_r": 0.7564947825114654,
      "n_iterations": 105,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.2942681908607483,
        "right_subspace_overlap_bottom_k": -0.21764899790287018,
        "interaction_matrix_overlap_top_k": 0.27088025212287903,
        "interaction_matrix_overlap_bottom_k": 0.17935308814048767,
        "effective_rank": 0.4327010214328766,
        "effective_rank_mergeability_score": -0.15656694769859314,
        "stable_rank": -0.17196537554264069,
        "spectral_gap": 0.6606085300445557,
        "singular_value_ratio": 0.7539445757865906,
        "layerwise_effective_rank": -0.2656777501106262,
        "layerwise_effective_rank_mergeability_score": 0.2518918812274933,
        "task_vector_cosine_similarity": -0.09627532958984375,
        "task_vector_l2_distance": -0.48871326446533203,
        "task_vector_dot_product": 0.4591405689716339,
        "weight_space_angle": 0.5493859648704529,
        "task_vector_magnitude_ratio": -0.19735020399093628,
        "singular_value_overlap": -0.06437613070011139,
        "subspace_overlap": 0.17517097294330597,
        "right_subspace_overlap": -0.7199625372886658,
        "activation_l2_distance": 0.10963189601898193,
        "activation_cosine_similarity": 0.34328606724739075,
        "activation_magnitude_ratio": -0.031597089022397995,
        "activation_dot_product": 0.36921846866607666,
        "encoder_gradient_cosine_similarity": 0.08062632381916046,
        "encoder_gradient_l2_distance": -0.8779696226119995,
        "encoder_gradient_dot_product": 0.09136928617954254,
        "input_gradient_cosine_similarity": 0.08969268947839737,
        "input_gradient_l2_distance": -0.6021395325660706,
        "input_gradient_dot_product": -0.22155240178108215
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}