{
  "aggregate_metrics": {
    "train_r": 0.22974179740781905,
    "train_p": 7.400838778789625e-40,
    "val_r": 0.27209185097452504,
    "val_p": 1.702454796883292e-07
  },
  "per_fold_stats": {
    "train_r_mean": 0.6451938590727094,
    "train_r_std": 0.14919151351573262,
    "val_r_mean": 0.48773271075779434,
    "val_r_std": 0.26144315300897647
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 33.950279235839844,
    "right_subspace_overlap_bottom_k": -17.783538818359375,
    "interaction_matrix_overlap_top_k": 48.71793746948242,
    "interaction_matrix_overlap_bottom_k": -8.814979553222656,
    "task_vector_cosine_similarity": -1.3593978881835938,
    "task_vector_l2_distance": -7.100573539733887,
    "task_vector_dot_product": 30.62314224243164,
    "weight_space_angle": -8.538134574890137,
    "task_vector_magnitude_ratio": -16.049406051635742,
    "singular_value_overlap": 12.186305046081543,
    "subspace_overlap": -11.193406105041504,
    "right_subspace_overlap": 10.792043685913086,
    "activation_l2_distance": -6.5288519859313965,
    "activation_cosine_similarity": 14.103507995605469,
    "activation_magnitude_ratio": -16.455167770385742,
    "activation_dot_product": 7.570091247558594,
    "encoder_gradient_cosine_similarity": 17.183712005615234,
    "encoder_gradient_l2_distance": -36.80042266845703,
    "encoder_gradient_dot_product": 36.35559844970703,
    "input_gradient_cosine_similarity": 1.4777672290802002,
    "input_gradient_l2_distance": -55.502906799316406,
    "input_gradient_dot_product": -25.8313045501709
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 40.347293853759766,
    "right_subspace_overlap_bottom_k": 41.0671272277832,
    "interaction_matrix_overlap_top_k": 97.51153564453125,
    "interaction_matrix_overlap_bottom_k": 32.18950271606445,
    "task_vector_cosine_similarity": 29.362781524658203,
    "task_vector_l2_distance": 19.96870231628418,
    "task_vector_dot_product": 104.41273498535156,
    "weight_space_angle": 34.0318489074707,
    "task_vector_magnitude_ratio": 26.889514923095703,
    "singular_value_overlap": 31.34313201904297,
    "subspace_overlap": 34.50360870361328,
    "right_subspace_overlap": 25.973804473876953,
    "activation_l2_distance": 15.462276458740234,
    "activation_cosine_similarity": 28.894412994384766,
    "activation_magnitude_ratio": 92.08470916748047,
    "activation_dot_product": 51.79677963256836,
    "encoder_gradient_cosine_similarity": 27.16464614868164,
    "encoder_gradient_l2_distance": 30.68996238708496,
    "encoder_gradient_dot_product": 61.57847213745117,
    "input_gradient_cosine_similarity": 31.25309944152832,
    "input_gradient_l2_distance": 79.43519592285156,
    "input_gradient_dot_product": 51.625282287597656
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7505913488204051,
      "val_r": 0.5989720237959691,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 3.8102262020111084,
        "right_subspace_overlap_bottom_k": -6.361344814300537,
        "interaction_matrix_overlap_top_k": 4.477158546447754,
        "interaction_matrix_overlap_bottom_k": -0.2586662173271179,
        "task_vector_cosine_similarity": -0.7769419550895691,
        "task_vector_l2_distance": -5.91281795501709,
        "task_vector_dot_product": 9.365723609924316,
        "weight_space_angle": 16.583740234375,
        "task_vector_magnitude_ratio": -2.8890128135681152,
        "singular_value_overlap": -1.6909910440444946,
        "subspace_overlap": 2.2128615379333496,
        "right_subspace_overlap": 6.3783440589904785,
        "activation_l2_distance": -1.694830298423767,
        "activation_cosine_similarity": 10.049234390258789,
        "activation_magnitude_ratio": -4.082810401916504,
        "activation_dot_product": 1.5564026832580566,
        "encoder_gradient_cosine_similarity": 3.6470186710357666,
        "encoder_gradient_l2_distance": -18.09011459350586,
        "encoder_gradient_dot_product": 0.8859654664993286,
        "input_gradient_cosine_similarity": 3.687772274017334,
        "input_gradient_l2_distance": -10.041714668273926,
        "input_gradient_dot_product": -9.856491088867188
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.716950676166492,
      "val_r": 0.7572301873415309,
      "n_iterations": 834,
      "coefficients": {
        "right_subspace_overlap_top_k": -1.298088550567627,
        "right_subspace_overlap_bottom_k": -4.489099502563477,
        "interaction_matrix_overlap_top_k": 18.567678451538086,
        "interaction_matrix_overlap_bottom_k": -5.656981945037842,
        "task_vector_cosine_similarity": 4.827300071716309,
        "task_vector_l2_distance": -5.800776958465576,
        "task_vector_dot_product": -16.15580940246582,
        "weight_space_angle": 13.60468578338623,
        "task_vector_magnitude_ratio": -2.6266307830810547,
        "singular_value_overlap": 4.399844169616699,
        "subspace_overlap": 11.832809448242188,
        "right_subspace_overlap": 6.776604652404785,
        "activation_l2_distance": -1.216385006904602,
        "activation_cosine_similarity": 4.396315097808838,
        "activation_magnitude_ratio": -3.1611688137054443,
        "activation_dot_product": 21.06572914123535,
        "encoder_gradient_cosine_similarity": 5.93954610824585,
        "encoder_gradient_l2_distance": -34.266502380371094,
        "encoder_gradient_dot_product": 9.472441673278809,
        "input_gradient_cosine_similarity": 4.399372577667236,
        "input_gradient_l2_distance": -19.95555877685547,
        "input_gradient_dot_product": -9.657050132751465
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7473707481149658,
      "val_r": 0.713873678168662,
      "n_iterations": 722,
      "coefficients": {
        "right_subspace_overlap_top_k": 23.66701889038086,
        "right_subspace_overlap_bottom_k": -37.36814498901367,
        "interaction_matrix_overlap_top_k": 7.643301963806152,
        "interaction_matrix_overlap_bottom_k": 9.348860740661621,
        "task_vector_cosine_similarity": -3.2035818099975586,
        "task_vector_l2_distance": -2.5108463764190674,
        "task_vector_dot_product": 4.976145267486572,
        "weight_space_angle": 13.21749496459961,
        "task_vector_magnitude_ratio": -7.235226631164551,
        "singular_value_overlap": 0.5767754316329956,
        "subspace_overlap": -7.335672378540039,
        "right_subspace_overlap": 23.784364700317383,
        "activation_l2_distance": -0.020873362198472023,
        "activation_cosine_similarity": 19.055889129638672,
        "activation_magnitude_ratio": -5.719112396240234,
        "activation_dot_product": 13.686820983886719,
        "encoder_gradient_cosine_similarity": 5.180025100708008,
        "encoder_gradient_l2_distance": -28.22057342529297,
        "encoder_gradient_dot_product": 11.448887825012207,
        "input_gradient_cosine_similarity": 12.000341415405273,
        "input_gradient_l2_distance": -30.51711082458496,
        "input_gradient_dot_product": -21.456893920898438
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7166183518934206,
      "val_r": 0.6010250595802255,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.778152942657471,
        "right_subspace_overlap_bottom_k": -13.173110961914062,
        "interaction_matrix_overlap_top_k": 3.5830748081207275,
        "interaction_matrix_overlap_bottom_k": 1.4129283428192139,
        "task_vector_cosine_similarity": -11.238423347473145,
        "task_vector_l2_distance": -5.4589338302612305,
        "task_vector_dot_product": 4.465466022491455,
        "weight_space_angle": 12.473247528076172,
        "task_vector_magnitude_ratio": -4.604199409484863,
        "singular_value_overlap": 2.0102481842041016,
        "subspace_overlap": 16.977521896362305,
        "right_subspace_overlap": 6.0330939292907715,
        "activation_l2_distance": -1.7165884971618652,
        "activation_cosine_similarity": 3.9045629501342773,
        "activation_magnitude_ratio": -4.313821315765381,
        "activation_dot_product": 13.939785957336426,
        "encoder_gradient_cosine_similarity": 6.970749855041504,
        "encoder_gradient_l2_distance": -18.380895614624023,
        "encoder_gradient_dot_product": 6.014134883880615,
        "input_gradient_cosine_similarity": 2.931403875350952,
        "input_gradient_l2_distance": -15.0398530960083,
        "input_gradient_dot_product": -12.570005416870117
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6844025430859713,
      "val_r": 0.6320073638194925,
      "n_iterations": 796,
      "coefficients": {
        "right_subspace_overlap_top_k": 53.47934341430664,
        "right_subspace_overlap_bottom_k": -0.6473646759986877,
        "interaction_matrix_overlap_top_k": 14.266457557678223,
        "interaction_matrix_overlap_bottom_k": -42.38640213012695,
        "task_vector_cosine_similarity": 19.77264976501465,
        "task_vector_l2_distance": 1.6798286437988281,
        "task_vector_dot_product": -29.35982322692871,
        "weight_space_angle": 6.604082107543945,
        "task_vector_magnitude_ratio": -1.9359562397003174,
        "singular_value_overlap": 6.371695041656494,
        "subspace_overlap": 9.777937889099121,
        "right_subspace_overlap": -5.0625786781311035,
        "activation_l2_distance": -28.26997184753418,
        "activation_cosine_similarity": -10.944194793701172,
        "activation_magnitude_ratio": -5.466084003448486,
        "activation_dot_product": 39.028629302978516,
        "encoder_gradient_cosine_similarity": 9.97741413116455,
        "encoder_gradient_l2_distance": -23.395605087280273,
        "encoder_gradient_dot_product": 15.982771873474121,
        "input_gradient_cosine_similarity": 17.05313491821289,
        "input_gradient_l2_distance": -48.65727233886719,
        "input_gradient_dot_product": 3.1293563842773438
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6399170133786273,
      "val_r": 0.6659539200422926,
      "n_iterations": 428,
      "coefficients": {
        "right_subspace_overlap_top_k": 95.41029357910156,
        "right_subspace_overlap_bottom_k": -28.983749389648438,
        "interaction_matrix_overlap_top_k": -91.65504455566406,
        "interaction_matrix_overlap_bottom_k": 17.21993064880371,
        "task_vector_cosine_similarity": 2.170220136642456,
        "task_vector_l2_distance": -21.84624481201172,
        "task_vector_dot_product": 74.40544891357422,
        "weight_space_angle": -96.62154388427734,
        "task_vector_magnitude_ratio": -43.08372497558594,
        "singular_value_overlap": 69.31826782226562,
        "subspace_overlap": -16.2528133392334,
        "right_subspace_overlap": -11.32079792022705,
        "activation_l2_distance": -46.663055419921875,
        "activation_cosine_similarity": 4.848827362060547,
        "activation_magnitude_ratio": -15.537663459777832,
        "activation_dot_product": 79.1104965209961,
        "encoder_gradient_cosine_similarity": 63.429931640625,
        "encoder_gradient_l2_distance": -140.52076721191406,
        "encoder_gradient_dot_product": 64.68806457519531,
        "input_gradient_cosine_similarity": 42.76042938232422,
        "input_gradient_l2_distance": 3.889709949493408,
        "input_gradient_dot_product": -3.7695767879486084
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.7369612055278016,
      "val_r": 0.4181599204969697,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.6765313148498535,
        "right_subspace_overlap_bottom_k": -4.9078826904296875,
        "interaction_matrix_overlap_top_k": 9.233120918273926,
        "interaction_matrix_overlap_bottom_k": -12.625664710998535,
        "task_vector_cosine_similarity": 7.473623752593994,
        "task_vector_l2_distance": 5.892350673675537,
        "task_vector_dot_product": -13.567787170410156,
        "weight_space_angle": 5.316024303436279,
        "task_vector_magnitude_ratio": -0.15027806162834167,
        "singular_value_overlap": 3.271383762359619,
        "subspace_overlap": -0.20396292209625244,
        "right_subspace_overlap": 4.740888595581055,
        "activation_l2_distance": 3.332427501678467,
        "activation_cosine_similarity": 14.530776023864746,
        "activation_magnitude_ratio": 0.12807561457157135,
        "activation_dot_product": 2.3505187034606934,
        "encoder_gradient_cosine_similarity": 5.418540000915527,
        "encoder_gradient_l2_distance": -19.129823684692383,
        "encoder_gradient_dot_product": 5.021763801574707,
        "input_gradient_cosine_similarity": 0.15317751467227936,
        "input_gradient_l2_distance": -12.486756324768066,
        "input_gradient_dot_product": -9.4684476852417
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6791246347356255,
      "val_r": 0.26942702203088764,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 17.27609634399414,
        "right_subspace_overlap_bottom_k": -22.3763484954834,
        "interaction_matrix_overlap_top_k": 13.945241928100586,
        "interaction_matrix_overlap_bottom_k": -5.082146167755127,
        "task_vector_cosine_similarity": -15.205528259277344,
        "task_vector_l2_distance": -2.1956276893615723,
        "task_vector_dot_product": -14.155679702758789,
        "weight_space_angle": -9.333772659301758,
        "task_vector_magnitude_ratio": -3.2993195056915283,
        "singular_value_overlap": 3.4496114253997803,
        "subspace_overlap": 3.7085483074188232,
        "right_subspace_overlap": 15.954246520996094,
        "activation_l2_distance": 0.3817000091075897,
        "activation_cosine_similarity": 26.395992279052734,
        "activation_magnitude_ratio": -5.3686418533325195,
        "activation_dot_product": 5.482141494750977,
        "encoder_gradient_cosine_similarity": 2.779071092605591,
        "encoder_gradient_l2_distance": -10.561683654785156,
        "encoder_gradient_dot_product": 13.621830940246582,
        "input_gradient_cosine_similarity": 11.652874946594238,
        "input_gradient_l2_distance": -29.847021102905273,
        "input_gradient_dot_product": 3.7768568992614746
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5443892976292029,
      "val_r": 0.3065363712801866,
      "n_iterations": 509,
      "coefficients": {
        "right_subspace_overlap_top_k": 94.37712097167969,
        "right_subspace_overlap_bottom_k": -0.0807805210351944,
        "interaction_matrix_overlap_top_k": 390.8424377441406,
        "interaction_matrix_overlap_bottom_k": -51.89961624145508,
        "task_vector_cosine_similarity": -102.9283218383789,
        "task_vector_l2_distance": -41.46145248413086,
        "task_vector_dot_product": 94.45954895019531,
        "weight_space_angle": -52.270530700683594,
        "task_vector_magnitude_ratio": -77.20448303222656,
        "singular_value_overlap": -39.81800079345703,
        "subspace_overlap": -115.1559829711914,
        "right_subspace_overlap": 61.43876266479492,
        "activation_l2_distance": -31.06015396118164,
        "activation_cosine_similarity": 35.843284606933594,
        "activation_magnitude_ratio": 89.4886474609375,
        "activation_dot_product": 81.37606811523438,
        "encoder_gradient_cosine_similarity": -49.6968994140625,
        "encoder_gradient_l2_distance": -61.56748580932617,
        "encoder_gradient_dot_product": 95.05403137207031,
        "input_gradient_cosine_similarity": -35.92709732055664,
        "input_gradient_l2_distance": -199.13497924804688,
        "input_gradient_dot_product": -83.67707824707031
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6472455955246739,
      "val_r": 0.40088273116808193,
      "n_iterations": 700,
      "coefficients": {
        "right_subspace_overlap_top_k": 57.59071350097656,
        "right_subspace_overlap_bottom_k": -85.13201904296875,
        "interaction_matrix_overlap_top_k": 92.20976257324219,
        "interaction_matrix_overlap_bottom_k": -13.610946655273438,
        "task_vector_cosine_similarity": 12.448874473571777,
        "task_vector_l2_distance": -3.678985595703125,
        "task_vector_dot_product": -40.39897918701172,
        "weight_space_angle": -52.27225112915039,
        "task_vector_magnitude_ratio": -5.136332988739014,
        "singular_value_overlap": 0.7151194214820862,
        "subspace_overlap": -42.2841911315918,
        "right_subspace_overlap": 34.54517364501953,
        "activation_l2_distance": 11.474379539489746,
        "activation_cosine_similarity": -2.9402759075164795,
        "activation_magnitude_ratio": 0.7459346055984497,
        "activation_dot_product": 11.627599716186523,
        "encoder_gradient_cosine_similarity": 46.22101974487305,
        "encoder_gradient_l2_distance": -36.79020690917969,
        "encoder_gradient_dot_product": 28.825105667114258,
        "input_gradient_cosine_similarity": 34.26630401611328,
        "input_gradient_l2_distance": -44.66729736328125,
        "input_gradient_dot_product": -2.7606964111328125
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7637187083445846,
      "val_r": 0.34349261749175236,
      "n_iterations": 974,
      "coefficients": {
        "right_subspace_overlap_top_k": 9.397551536560059,
        "right_subspace_overlap_bottom_k": -3.794452428817749,
        "interaction_matrix_overlap_top_k": 0.708276629447937,
        "interaction_matrix_overlap_bottom_k": -4.702842712402344,
        "task_vector_cosine_similarity": -3.570497512817383,
        "task_vector_l2_distance": -0.5823037028312683,
        "task_vector_dot_product": 0.22758464515209198,
        "weight_space_angle": 4.7182207107543945,
        "task_vector_magnitude_ratio": -1.5435324907302856,
        "singular_value_overlap": 1.5958775281906128,
        "subspace_overlap": -1.6008906364440918,
        "right_subspace_overlap": 4.484089374542236,
        "activation_l2_distance": 0.4520987868309021,
        "activation_cosine_similarity": 10.817652702331543,
        "activation_magnitude_ratio": -1.823311686515808,
        "activation_dot_product": 0.9976910352706909,
        "encoder_gradient_cosine_similarity": 1.4811335802078247,
        "encoder_gradient_l2_distance": -9.427518844604492,
        "encoder_gradient_dot_product": 1.780987024307251,
        "input_gradient_cosine_similarity": 2.0050673484802246,
        "input_gradient_l2_distance": -7.831904888153076,
        "input_gradient_dot_product": -2.790363073348999
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7212206759747927,
      "val_r": 0.7530035395094167,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.695312976837158,
        "right_subspace_overlap_bottom_k": -9.46136474609375,
        "interaction_matrix_overlap_top_k": 3.5966691970825195,
        "interaction_matrix_overlap_bottom_k": -10.928403854370117,
        "task_vector_cosine_similarity": 1.6056245565414429,
        "task_vector_l2_distance": 2.6754603385925293,
        "task_vector_dot_product": 0.25353917479515076,
        "weight_space_angle": 4.557237148284912,
        "task_vector_magnitude_ratio": -1.0890388488769531,
        "singular_value_overlap": 1.9636282920837402,
        "subspace_overlap": 4.6203107833862305,
        "right_subspace_overlap": 11.04019546508789,
        "activation_l2_distance": -0.9205092191696167,
        "activation_cosine_similarity": 11.563774108886719,
        "activation_magnitude_ratio": -2.8356528282165527,
        "activation_dot_product": 3.8429558277130127,
        "encoder_gradient_cosine_similarity": 6.811646461486816,
        "encoder_gradient_l2_distance": -19.455005645751953,
        "encoder_gradient_dot_product": 4.503942012786865,
        "input_gradient_cosine_similarity": 5.201081275939941,
        "input_gradient_l2_distance": -7.712102890014648,
        "input_gradient_dot_product": -15.530701637268066
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.695594680215909,
      "val_r": 0.6808578231482735,
      "n_iterations": 925,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.80201530456543,
        "right_subspace_overlap_bottom_k": -24.042341232299805,
        "interaction_matrix_overlap_top_k": 19.944475173950195,
        "interaction_matrix_overlap_bottom_k": -26.62889289855957,
        "task_vector_cosine_similarity": 22.465633392333984,
        "task_vector_l2_distance": 12.178237915039062,
        "task_vector_dot_product": 1.8972179889678955,
        "weight_space_angle": -19.866491317749023,
        "task_vector_magnitude_ratio": 2.7154757976531982,
        "singular_value_overlap": -5.882471084594727,
        "subspace_overlap": -3.2456154823303223,
        "right_subspace_overlap": 23.053895950317383,
        "activation_l2_distance": -6.219295978546143,
        "activation_cosine_similarity": 26.888256072998047,
        "activation_magnitude_ratio": -6.583544731140137,
        "activation_dot_product": 6.39982795715332,
        "encoder_gradient_cosine_similarity": 27.76132583618164,
        "encoder_gradient_l2_distance": -39.56723403930664,
        "encoder_gradient_dot_product": 14.548344612121582,
        "input_gradient_cosine_similarity": 13.271079063415527,
        "input_gradient_l2_distance": -16.525127410888672,
        "input_gradient_dot_product": -27.366371154785156
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6668096760071844,
      "val_r": 0.6611376716162819,
      "n_iterations": 865,
      "coefficients": {
        "right_subspace_overlap_top_k": 108.79694366455078,
        "right_subspace_overlap_bottom_k": -90.462158203125,
        "interaction_matrix_overlap_top_k": 152.4482421875,
        "interaction_matrix_overlap_bottom_k": -61.562496185302734,
        "task_vector_cosine_similarity": 18.261974334716797,
        "task_vector_l2_distance": 32.63134002685547,
        "task_vector_dot_product": -32.64080810546875,
        "weight_space_angle": 3.021188497543335,
        "task_vector_magnitude_ratio": -15.377510070800781,
        "singular_value_overlap": 26.30729103088379,
        "subspace_overlap": -19.799423217773438,
        "right_subspace_overlap": 0.2899068593978882,
        "activation_l2_distance": -21.78692054748535,
        "activation_cosine_similarity": 21.764785766601562,
        "activation_magnitude_ratio": -1.4741145372390747,
        "activation_dot_product": -7.117275238037109,
        "encoder_gradient_cosine_similarity": 67.53377532958984,
        "encoder_gradient_l2_distance": -57.415191650390625,
        "encoder_gradient_dot_product": 71.28239440917969,
        "input_gradient_cosine_similarity": -1.2648494243621826,
        "input_gradient_l2_distance": -98.01637268066406,
        "input_gradient_dot_product": -94.42255401611328
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7023490193121238,
      "val_r": 0.7815510301776321,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.545825481414795,
        "right_subspace_overlap_bottom_k": -93.10386657714844,
        "interaction_matrix_overlap_top_k": 49.1506462097168,
        "interaction_matrix_overlap_bottom_k": 17.927261352539062,
        "task_vector_cosine_similarity": -36.358421325683594,
        "task_vector_l2_distance": -5.98569393157959,
        "task_vector_dot_product": 20.49833106994629,
        "weight_space_angle": 7.617325305938721,
        "task_vector_magnitude_ratio": -3.104628801345825,
        "singular_value_overlap": -9.865991592407227,
        "subspace_overlap": 2.872134208679199,
        "right_subspace_overlap": 58.937015533447266,
        "activation_l2_distance": -3.4256646633148193,
        "activation_cosine_similarity": 43.31726837158203,
        "activation_magnitude_ratio": -13.777647972106934,
        "activation_dot_product": 8.549173355102539,
        "encoder_gradient_cosine_similarity": 29.72620964050293,
        "encoder_gradient_l2_distance": -58.668556213378906,
        "encoder_gradient_dot_product": -2.698103904724121,
        "input_gradient_cosine_similarity": 25.48798942565918,
        "input_gradient_l2_distance": -18.497133255004883,
        "input_gradient_dot_product": -24.14511489868164
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.6098315803371015,
      "val_r": -0.12319652117002146,
      "n_iterations": 625,
      "coefficients": {
        "right_subspace_overlap_top_k": 131.86871337890625,
        "right_subspace_overlap_bottom_k": 17.94883918762207,
        "interaction_matrix_overlap_top_k": 65.70741271972656,
        "interaction_matrix_overlap_bottom_k": -52.196659088134766,
        "task_vector_cosine_similarity": 56.684104919433594,
        "task_vector_l2_distance": -70.6355209350586,
        "task_vector_dot_product": 105.12051391601562,
        "weight_space_angle": -76.97846984863281,
        "task_vector_magnitude_ratio": -44.13400650024414,
        "singular_value_overlap": 78.13487243652344,
        "subspace_overlap": 27.07286834716797,
        "right_subspace_overlap": -62.923248291015625,
        "activation_l2_distance": 16.947465896606445,
        "activation_cosine_similarity": 100.714599609375,
        "activation_magnitude_ratio": 59.2536735534668,
        "activation_dot_product": 8.887857437133789,
        "encoder_gradient_cosine_similarity": 70.1084976196289,
        "encoder_gradient_l2_distance": -78.22362518310547,
        "encoder_gradient_dot_product": 69.8319091796875,
        "input_gradient_cosine_similarity": -18.682451248168945,
        "input_gradient_l2_distance": -197.8305206298828,
        "input_gradient_dot_product": -205.6792449951172
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7106093093150716,
      "val_r": 0.637757226311704,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 24.228700637817383,
        "right_subspace_overlap_bottom_k": -14.964607238769531,
        "interaction_matrix_overlap_top_k": 27.06208610534668,
        "interaction_matrix_overlap_bottom_k": -33.71259689331055,
        "task_vector_cosine_similarity": -13.157169342041016,
        "task_vector_l2_distance": -8.810546875,
        "task_vector_dot_product": -12.526957511901855,
        "weight_space_angle": -14.25656509399414,
        "task_vector_magnitude_ratio": -5.357580661773682,
        "singular_value_overlap": 1.3996573686599731,
        "subspace_overlap": 12.231139183044434,
        "right_subspace_overlap": 18.240537643432617,
        "activation_l2_distance": 8.574241638183594,
        "activation_cosine_similarity": 22.373371124267578,
        "activation_magnitude_ratio": -3.157649040222168,
        "activation_dot_product": 26.82332420349121,
        "encoder_gradient_cosine_similarity": 19.026641845703125,
        "encoder_gradient_l2_distance": -21.2540340423584,
        "encoder_gradient_dot_product": 29.88410186767578,
        "input_gradient_cosine_similarity": 17.4019718170166,
        "input_gradient_l2_distance": -42.97782516479492,
        "input_gradient_dot_product": -36.07186508178711
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.719288991828857,
      "val_r": 0.5484409138861812,
      "n_iterations": 973,
      "coefficients": {
        "right_subspace_overlap_top_k": 8.07430362701416,
        "right_subspace_overlap_bottom_k": -35.16704559326172,
        "interaction_matrix_overlap_top_k": 4.407222747802734,
        "interaction_matrix_overlap_bottom_k": 9.118378639221191,
        "task_vector_cosine_similarity": 10.936543464660645,
        "task_vector_l2_distance": -5.756160259246826,
        "task_vector_dot_product": 1.6360971927642822,
        "weight_space_angle": 21.94829559326172,
        "task_vector_magnitude_ratio": -8.022037506103516,
        "singular_value_overlap": 5.428079128265381,
        "subspace_overlap": -16.4368953704834,
        "right_subspace_overlap": 32.8929557800293,
        "activation_l2_distance": -2.9468564987182617,
        "activation_cosine_similarity": 1.0355738401412964,
        "activation_magnitude_ratio": -1.5883303880691528,
        "activation_dot_product": 27.634353637695312,
        "encoder_gradient_cosine_similarity": 10.386699676513672,
        "encoder_gradient_l2_distance": -38.09364318847656,
        "encoder_gradient_dot_product": 9.17848014831543,
        "input_gradient_cosine_similarity": 8.034920692443848,
        "input_gradient_l2_distance": -15.207566261291504,
        "input_gradient_dot_product": -26.494956970214844
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.1897115178044858,
      "val_r": 0.21451735074619446,
      "n_iterations": 51,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.5949852466583252,
        "right_subspace_overlap_bottom_k": -1.5399143695831299,
        "interaction_matrix_overlap_top_k": -1.3050588369369507,
        "interaction_matrix_overlap_bottom_k": -0.03322002291679382,
        "task_vector_cosine_similarity": 0.010007228702306747,
        "task_vector_l2_distance": -0.005756378173828125,
        "task_vector_dot_product": -0.3120032846927643,
        "weight_space_angle": -0.7241764664649963,
        "task_vector_magnitude_ratio": -0.12122195959091187,
        "singular_value_overlap": 0.28013697266578674,
        "subspace_overlap": 1.0450923442840576,
        "right_subspace_overlap": 1.122762680053711,
        "activation_l2_distance": -0.3641226291656494,
        "activation_cosine_similarity": 0.6107821464538574,
        "activation_magnitude_ratio": -0.2831885814666748,
        "activation_dot_product": 0.21950630843639374,
        "encoder_gradient_cosine_similarity": -0.20483994483947754,
        "encoder_gradient_l2_distance": 1.0580296516418457,
        "encoder_gradient_dot_product": 1.52706778049469,
        "input_gradient_cosine_similarity": -0.42985227704048157,
        "input_gradient_l2_distance": 0.19062195718288422,
        "input_gradient_dot_product": -0.2539065182209015
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.26117160743689316,
      "val_r": -0.10697571428582726,
      "n_iterations": 626,
      "coefficients": {
        "right_subspace_overlap_top_k": 19.233863830566406,
        "right_subspace_overlap_bottom_k": 102.43596649169922,
        "interaction_matrix_overlap_top_k": 189.52557373046875,
        "interaction_matrix_overlap_bottom_k": 89.95858001708984,
        "task_vector_cosine_similarity": 2.5943691730499268,
        "task_vector_l2_distance": -16.42700958251953,
        "task_vector_dot_product": 454.2750549316406,
        "weight_space_angle": 41.89957046508789,
        "task_vector_magnitude_ratio": -96.78889465332031,
        "singular_value_overlap": 95.76107025146484,
        "subspace_overlap": -93.90388488769531,
        "right_subspace_overlap": -14.565308570861816,
        "activation_l2_distance": -25.434123992919922,
        "activation_cosine_similarity": -62.15634536743164,
        "activation_magnitude_ratio": -403.5469665527344,
        "activation_dot_product": -194.059814453125,
        "encoder_gradient_cosine_similarity": 11.176733016967773,
        "encoder_gradient_l2_distance": -24.03805923461914,
        "encoder_gradient_dot_product": 276.2577819824219,
        "input_gradient_cosine_similarity": -114.44734191894531,
        "input_gradient_l2_distance": -299.1922607421875,
        "input_gradient_dot_product": 62.43899154663086
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}