{
  "aggregate_metrics": {
    "train_r": 0.2573278249815707,
    "train_p": 6.7788408964568495e-50,
    "val_r": 0.2648724232717321,
    "val_p": 3.672310723845613e-07
  },
  "per_fold_stats": {
    "train_r_mean": 0.49923363930807396,
    "train_r_std": 0.10276393826231098,
    "val_r_mean": 0.3630630682396062,
    "val_r_std": 0.1855509870916421
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 34.82499694824219,
    "right_subspace_overlap_bottom_k": 8.984418869018555,
    "interaction_matrix_overlap_top_k": 19.01105308532715,
    "interaction_matrix_overlap_bottom_k": 17.853384017944336,
    "task_vector_cosine_similarity": 2.7257161140441895,
    "task_vector_l2_distance": -24.732288360595703,
    "task_vector_dot_product": -15.735891342163086,
    "weight_space_angle": -13.612360954284668,
    "task_vector_magnitude_ratio": -20.796884536743164,
    "singular_value_overlap": -38.82279586791992,
    "subspace_overlap": 29.999160766601562,
    "right_subspace_overlap": 35.778770446777344,
    "activation_l2_distance": -12.621975898742676,
    "activation_cosine_similarity": 11.303022384643555,
    "activation_magnitude_ratio": -23.947059631347656,
    "activation_dot_product": 34.18110656738281,
    "encoder_gradient_cosine_similarity": 19.547523498535156,
    "encoder_gradient_l2_distance": -32.10605239868164,
    "encoder_gradient_dot_product": 35.70928192138672,
    "input_gradient_cosine_similarity": 14.300585746765137,
    "input_gradient_l2_distance": -44.00261688232422,
    "input_gradient_dot_product": -36.84321975708008
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 39.983760833740234,
    "right_subspace_overlap_bottom_k": 18.112051010131836,
    "interaction_matrix_overlap_top_k": 33.78462219238281,
    "interaction_matrix_overlap_bottom_k": 17.397109985351562,
    "task_vector_cosine_similarity": 29.56171989440918,
    "task_vector_l2_distance": 26.411346435546875,
    "task_vector_dot_product": 24.08144760131836,
    "weight_space_angle": 35.70813751220703,
    "task_vector_magnitude_ratio": 23.009191513061523,
    "singular_value_overlap": 33.14337158203125,
    "subspace_overlap": 31.920808792114258,
    "right_subspace_overlap": 42.73274230957031,
    "activation_l2_distance": 38.830562591552734,
    "activation_cosine_similarity": 24.94234848022461,
    "activation_magnitude_ratio": 36.67430114746094,
    "activation_dot_product": 28.085834503173828,
    "encoder_gradient_cosine_similarity": 19.923139572143555,
    "encoder_gradient_l2_distance": 40.40269470214844,
    "encoder_gradient_dot_product": 32.2113037109375,
    "input_gradient_cosine_similarity": 19.002695083618164,
    "input_gradient_l2_distance": 37.596553802490234,
    "input_gradient_dot_product": 27.03949737548828
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.372940890572132,
      "val_r": 0.38664300628934056,
      "n_iterations": 366,
      "coefficients": {
        "right_subspace_overlap_top_k": 123.85301971435547,
        "right_subspace_overlap_bottom_k": 26.310537338256836,
        "interaction_matrix_overlap_top_k": -36.823081970214844,
        "interaction_matrix_overlap_bottom_k": 6.418450355529785,
        "task_vector_cosine_similarity": -48.26211929321289,
        "task_vector_l2_distance": -33.3289909362793,
        "task_vector_dot_product": 5.79181432723999,
        "weight_space_angle": -21.684961318969727,
        "task_vector_magnitude_ratio": -15.203887939453125,
        "singular_value_overlap": -95.22979736328125,
        "subspace_overlap": 51.54545593261719,
        "right_subspace_overlap": 130.6336212158203,
        "activation_l2_distance": -89.26680755615234,
        "activation_cosine_similarity": -27.646366119384766,
        "activation_magnitude_ratio": -79.4071273803711,
        "activation_dot_product": 80.61736297607422,
        "encoder_gradient_cosine_similarity": 21.898235321044922,
        "encoder_gradient_l2_distance": -44.39839172363281,
        "encoder_gradient_dot_product": 29.807819366455078,
        "input_gradient_cosine_similarity": 33.58523178100586,
        "input_gradient_l2_distance": 27.898345947265625,
        "input_gradient_dot_product": -46.11233901977539
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5314447294939507,
      "val_r": 0.41371194140834994,
      "n_iterations": 731,
      "coefficients": {
        "right_subspace_overlap_top_k": 44.41807556152344,
        "right_subspace_overlap_bottom_k": -12.277024269104004,
        "interaction_matrix_overlap_top_k": 30.254297256469727,
        "interaction_matrix_overlap_bottom_k": 49.448463439941406,
        "task_vector_cosine_similarity": -33.23311996459961,
        "task_vector_l2_distance": -47.76743698120117,
        "task_vector_dot_product": -34.93096923828125,
        "weight_space_angle": -23.650131225585938,
        "task_vector_magnitude_ratio": -37.30000686645508,
        "singular_value_overlap": -37.19862365722656,
        "subspace_overlap": 44.17182540893555,
        "right_subspace_overlap": 17.856346130371094,
        "activation_l2_distance": 35.52651596069336,
        "activation_cosine_similarity": 25.568883895874023,
        "activation_magnitude_ratio": -17.368085861206055,
        "activation_dot_product": 53.17393493652344,
        "encoder_gradient_cosine_similarity": 11.994044303894043,
        "encoder_gradient_l2_distance": -65.42353057861328,
        "encoder_gradient_dot_product": 44.198429107666016,
        "input_gradient_cosine_similarity": 29.435937881469727,
        "input_gradient_l2_distance": -41.67124557495117,
        "input_gradient_dot_product": -34.22873306274414
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5064693176845232,
      "val_r": 0.2881006262192957,
      "n_iterations": 878,
      "coefficients": {
        "right_subspace_overlap_top_k": 26.135374069213867,
        "right_subspace_overlap_bottom_k": 8.549579620361328,
        "interaction_matrix_overlap_top_k": 19.075220108032227,
        "interaction_matrix_overlap_bottom_k": 40.2838249206543,
        "task_vector_cosine_similarity": 23.89651107788086,
        "task_vector_l2_distance": -42.9919319152832,
        "task_vector_dot_product": -8.048917770385742,
        "weight_space_angle": -29.85964584350586,
        "task_vector_magnitude_ratio": -30.04428482055664,
        "singular_value_overlap": -55.048431396484375,
        "subspace_overlap": 47.67090606689453,
        "right_subspace_overlap": -2.5487091541290283,
        "activation_l2_distance": 12.772489547729492,
        "activation_cosine_similarity": 13.799108505249023,
        "activation_magnitude_ratio": -23.24155044555664,
        "activation_dot_product": 27.70517921447754,
        "encoder_gradient_cosine_similarity": 10.239864349365234,
        "encoder_gradient_l2_distance": 15.283894538879395,
        "encoder_gradient_dot_product": 41.823917388916016,
        "input_gradient_cosine_similarity": 34.432064056396484,
        "input_gradient_l2_distance": -69.06494140625,
        "input_gradient_dot_product": -59.82134246826172
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5963313523129803,
      "val_r": 0.3873667578999923,
      "n_iterations": 847,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.2018014192581177,
        "right_subspace_overlap_bottom_k": 1.3195258378982544,
        "interaction_matrix_overlap_top_k": 1.914667010307312,
        "interaction_matrix_overlap_bottom_k": 11.467379570007324,
        "task_vector_cosine_similarity": 4.231793403625488,
        "task_vector_l2_distance": -10.33932113647461,
        "task_vector_dot_product": -5.702263832092285,
        "weight_space_angle": 4.899712562561035,
        "task_vector_magnitude_ratio": -4.18848180770874,
        "singular_value_overlap": -8.240245819091797,
        "subspace_overlap": 5.421139717102051,
        "right_subspace_overlap": 2.0413360595703125,
        "activation_l2_distance": 8.441825866699219,
        "activation_cosine_similarity": 5.245480060577393,
        "activation_magnitude_ratio": -2.4707303047180176,
        "activation_dot_product": 5.094065189361572,
        "encoder_gradient_cosine_similarity": 1.6337226629257202,
        "encoder_gradient_l2_distance": -11.779268264770508,
        "encoder_gradient_dot_product": 0.20335717499256134,
        "input_gradient_cosine_similarity": 2.818593978881836,
        "input_gradient_l2_distance": -8.875677108764648,
        "input_gradient_dot_product": -3.339653730392456
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4542210760326956,
      "val_r": 0.47373382636941863,
      "n_iterations": 611,
      "coefficients": {
        "right_subspace_overlap_top_k": 65.52606201171875,
        "right_subspace_overlap_bottom_k": -19.87668800354004,
        "interaction_matrix_overlap_top_k": -53.22074508666992,
        "interaction_matrix_overlap_bottom_k": 15.66301155090332,
        "task_vector_cosine_similarity": -9.372942924499512,
        "task_vector_l2_distance": -49.29691696166992,
        "task_vector_dot_product": -19.8725528717041,
        "weight_space_angle": -69.09858703613281,
        "task_vector_magnitude_ratio": -35.652687072753906,
        "singular_value_overlap": -33.92496109008789,
        "subspace_overlap": 83.06783294677734,
        "right_subspace_overlap": 82.18968200683594,
        "activation_l2_distance": -35.15578842163086,
        "activation_cosine_similarity": -24.707115173339844,
        "activation_magnitude_ratio": 12.130548477172852,
        "activation_dot_product": 75.35543060302734,
        "encoder_gradient_cosine_similarity": 52.67279815673828,
        "encoder_gradient_l2_distance": -108.57797241210938,
        "encoder_gradient_dot_product": 79.44489288330078,
        "input_gradient_cosine_similarity": 27.91173553466797,
        "input_gradient_l2_distance": -15.587969779968262,
        "input_gradient_dot_product": -18.619585037231445
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.37633175946796027,
      "val_r": 0.15691582423489117,
      "n_iterations": 626,
      "coefficients": {
        "right_subspace_overlap_top_k": 65.54753112792969,
        "right_subspace_overlap_bottom_k": 16.809614181518555,
        "interaction_matrix_overlap_top_k": 33.31423568725586,
        "interaction_matrix_overlap_bottom_k": 23.620702743530273,
        "task_vector_cosine_similarity": -28.902172088623047,
        "task_vector_l2_distance": 43.989131927490234,
        "task_vector_dot_product": 5.045403003692627,
        "weight_space_angle": -69.47895812988281,
        "task_vector_magnitude_ratio": -55.06404113769531,
        "singular_value_overlap": -55.375553131103516,
        "subspace_overlap": 0.9301422238349915,
        "right_subspace_overlap": 49.61211395263672,
        "activation_l2_distance": -43.80378341674805,
        "activation_cosine_similarity": 15.13074016571045,
        "activation_magnitude_ratio": -46.89213562011719,
        "activation_dot_product": 83.949951171875,
        "encoder_gradient_cosine_similarity": 30.656538009643555,
        "encoder_gradient_l2_distance": 42.19651412963867,
        "encoder_gradient_dot_product": 12.5306396484375,
        "input_gradient_cosine_similarity": 48.66364669799805,
        "input_gradient_l2_distance": -121.17514038085938,
        "input_gradient_dot_product": -50.3076171875
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.44633773758937983,
      "val_r": 0.061477597351377034,
      "n_iterations": 553,
      "coefficients": {
        "right_subspace_overlap_top_k": 5.931107044219971,
        "right_subspace_overlap_bottom_k": 24.324399948120117,
        "interaction_matrix_overlap_top_k": 43.096988677978516,
        "interaction_matrix_overlap_bottom_k": -6.40878438949585,
        "task_vector_cosine_similarity": -53.53227233886719,
        "task_vector_l2_distance": -39.31605911254883,
        "task_vector_dot_product": -32.76606750488281,
        "weight_space_angle": -19.222055435180664,
        "task_vector_magnitude_ratio": -6.8652262687683105,
        "singular_value_overlap": -63.28337097167969,
        "subspace_overlap": 12.39500617980957,
        "right_subspace_overlap": 72.8880615234375,
        "activation_l2_distance": -26.85647201538086,
        "activation_cosine_similarity": 33.36616516113281,
        "activation_magnitude_ratio": 42.107852935791016,
        "activation_dot_product": 12.806112289428711,
        "encoder_gradient_cosine_similarity": 53.44011688232422,
        "encoder_gradient_l2_distance": 9.775944709777832,
        "encoder_gradient_dot_product": 105.8675308227539,
        "input_gradient_cosine_similarity": -8.877823829650879,
        "input_gradient_l2_distance": -81.4509048461914,
        "input_gradient_dot_product": -76.42298126220703
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4052220770750181,
      "val_r": -0.09546641976507002,
      "n_iterations": 656,
      "coefficients": {
        "right_subspace_overlap_top_k": -8.822757720947266,
        "right_subspace_overlap_bottom_k": 25.75605583190918,
        "interaction_matrix_overlap_top_k": 48.79397964477539,
        "interaction_matrix_overlap_bottom_k": -2.8207340240478516,
        "task_vector_cosine_similarity": 12.487719535827637,
        "task_vector_l2_distance": 12.241247177124023,
        "task_vector_dot_product": -23.469501495361328,
        "weight_space_angle": -28.35585594177246,
        "task_vector_magnitude_ratio": -37.444786071777344,
        "singular_value_overlap": -29.160860061645508,
        "subspace_overlap": 70.99272918701172,
        "right_subspace_overlap": 21.210344314575195,
        "activation_l2_distance": -35.74898147583008,
        "activation_cosine_similarity": 63.11220169067383,
        "activation_magnitude_ratio": -38.806884765625,
        "activation_dot_product": -2.1863956451416016,
        "encoder_gradient_cosine_similarity": 29.751676559448242,
        "encoder_gradient_l2_distance": -45.10417938232422,
        "encoder_gradient_dot_product": -1.1599836349487305,
        "input_gradient_cosine_similarity": 8.017830848693848,
        "input_gradient_l2_distance": -49.44239044189453,
        "input_gradient_dot_product": 11.157166481018066
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.6083821297826102,
      "val_r": 0.4580948547519442,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9334504008293152,
        "right_subspace_overlap_bottom_k": -0.25300678610801697,
        "interaction_matrix_overlap_top_k": 0.16223753988742828,
        "interaction_matrix_overlap_bottom_k": 1.9862741231918335,
        "task_vector_cosine_similarity": 1.4177190065383911,
        "task_vector_l2_distance": -2.3735649585723877,
        "task_vector_dot_product": 1.8001773357391357,
        "weight_space_angle": 2.8741531372070312,
        "task_vector_magnitude_ratio": -1.0530223846435547,
        "singular_value_overlap": -1.6601338386535645,
        "subspace_overlap": -0.20601724088191986,
        "right_subspace_overlap": 0.08966109901666641,
        "activation_l2_distance": 1.3900576829910278,
        "activation_cosine_similarity": 2.293238639831543,
        "activation_magnitude_ratio": -0.4793180227279663,
        "activation_dot_product": -0.7808470726013184,
        "encoder_gradient_cosine_similarity": 0.44306039810180664,
        "encoder_gradient_l2_distance": -2.334941864013672,
        "encoder_gradient_dot_product": 0.22513878345489502,
        "input_gradient_cosine_similarity": 0.14706917107105255,
        "input_gradient_l2_distance": -2.4506239891052246,
        "input_gradient_dot_product": -1.1710658073425293
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.565000406383767,
      "val_r": 0.46542523964802807,
      "n_iterations": 871,
      "coefficients": {
        "right_subspace_overlap_top_k": 14.153616905212402,
        "right_subspace_overlap_bottom_k": 7.596770286560059,
        "interaction_matrix_overlap_top_k": 11.84189224243164,
        "interaction_matrix_overlap_bottom_k": 19.928316116333008,
        "task_vector_cosine_similarity": 9.309775352478027,
        "task_vector_l2_distance": -26.407489776611328,
        "task_vector_dot_product": -33.30890655517578,
        "weight_space_angle": 17.359188079833984,
        "task_vector_magnitude_ratio": -10.637012481689453,
        "singular_value_overlap": -20.253673553466797,
        "subspace_overlap": 22.25309944152832,
        "right_subspace_overlap": 2.5865092277526855,
        "activation_l2_distance": 28.045093536376953,
        "activation_cosine_similarity": 13.069108009338379,
        "activation_magnitude_ratio": -0.17268423736095428,
        "activation_dot_product": 10.213367462158203,
        "encoder_gradient_cosine_similarity": 7.500551700592041,
        "encoder_gradient_l2_distance": -40.48328399658203,
        "encoder_gradient_dot_product": -0.706545889377594,
        "input_gradient_cosine_similarity": 0.21309231221675873,
        "input_gradient_l2_distance": -15.421340942382812,
        "input_gradient_dot_product": -15.681140899658203
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.4638674628104591,
      "val_r": 0.27299482996637847,
      "n_iterations": 653,
      "coefficients": {
        "right_subspace_overlap_top_k": 24.733617782592773,
        "right_subspace_overlap_bottom_k": 16.38922882080078,
        "interaction_matrix_overlap_top_k": 26.39352798461914,
        "interaction_matrix_overlap_bottom_k": 22.050067901611328,
        "task_vector_cosine_similarity": 7.72293758392334,
        "task_vector_l2_distance": -33.046356201171875,
        "task_vector_dot_product": -13.461002349853516,
        "weight_space_angle": -36.235206604003906,
        "task_vector_magnitude_ratio": -3.987459659576416,
        "singular_value_overlap": -16.521148681640625,
        "subspace_overlap": 25.32036018371582,
        "right_subspace_overlap": 19.023921966552734,
        "activation_l2_distance": -19.057750701904297,
        "activation_cosine_similarity": 40.185646057128906,
        "activation_magnitude_ratio": -32.253116607666016,
        "activation_dot_product": 41.4730110168457,
        "encoder_gradient_cosine_similarity": 8.709016799926758,
        "encoder_gradient_l2_distance": -42.77109146118164,
        "encoder_gradient_dot_product": 30.363666534423828,
        "input_gradient_cosine_similarity": 47.24449157714844,
        "input_gradient_l2_distance": -52.73764419555664,
        "input_gradient_dot_product": -58.54107666015625
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5257036515666086,
      "val_r": 0.41533834150594934,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 39.4477424621582,
        "right_subspace_overlap_bottom_k": 31.553024291992188,
        "interaction_matrix_overlap_top_k": 5.9698381423950195,
        "interaction_matrix_overlap_bottom_k": 1.228601336479187,
        "task_vector_cosine_similarity": -17.81903839111328,
        "task_vector_l2_distance": -42.60700225830078,
        "task_vector_dot_product": 4.808671951293945,
        "weight_space_angle": 9.921765327453613,
        "task_vector_magnitude_ratio": -16.473520278930664,
        "singular_value_overlap": -35.781578063964844,
        "subspace_overlap": -3.6980719566345215,
        "right_subspace_overlap": 23.398836135864258,
        "activation_l2_distance": 25.361751556396484,
        "activation_cosine_similarity": 5.8326287269592285,
        "activation_magnitude_ratio": -10.045767784118652,
        "activation_dot_product": 29.929973602294922,
        "encoder_gradient_cosine_similarity": 12.174893379211426,
        "encoder_gradient_l2_distance": -16.543277740478516,
        "encoder_gradient_dot_product": 11.257586479187012,
        "input_gradient_cosine_similarity": 19.55518341064453,
        "input_gradient_l2_distance": -26.11595916748047,
        "input_gradient_dot_product": -50.357810974121094
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5270272731095305,
      "val_r": 0.39632205809643395,
      "n_iterations": 694,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.9841307401657104,
        "right_subspace_overlap_bottom_k": -3.9965758323669434,
        "interaction_matrix_overlap_top_k": 2.2697551250457764,
        "interaction_matrix_overlap_bottom_k": 25.31260871887207,
        "task_vector_cosine_similarity": 15.597921371459961,
        "task_vector_l2_distance": -32.52819061279297,
        "task_vector_dot_product": 7.823009490966797,
        "weight_space_angle": -2.3679864406585693,
        "task_vector_magnitude_ratio": -16.90312957763672,
        "singular_value_overlap": -38.59067153930664,
        "subspace_overlap": -12.461709976196289,
        "right_subspace_overlap": 58.51307678222656,
        "activation_l2_distance": 11.040985107421875,
        "activation_cosine_similarity": 7.884982585906982,
        "activation_magnitude_ratio": -6.164466857910156,
        "activation_dot_product": 19.523422241210938,
        "encoder_gradient_cosine_similarity": 21.43155288696289,
        "encoder_gradient_l2_distance": -22.580581665039062,
        "encoder_gradient_dot_product": 30.148183822631836,
        "input_gradient_cosine_similarity": 19.528614044189453,
        "input_gradient_l2_distance": -40.84307861328125,
        "input_gradient_dot_product": -42.62407684326172
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3959149570993129,
      "val_r": 0.7252818729208397,
      "n_iterations": 536,
      "coefficients": {
        "right_subspace_overlap_top_k": 124.4487075805664,
        "right_subspace_overlap_bottom_k": 16.040910720825195,
        "interaction_matrix_overlap_top_k": 79.89936065673828,
        "interaction_matrix_overlap_bottom_k": 48.4962272644043,
        "task_vector_cosine_similarity": -17.251953125,
        "task_vector_l2_distance": 15.683171272277832,
        "task_vector_dot_product": -65.50006103515625,
        "weight_space_angle": -99.30530548095703,
        "task_vector_magnitude_ratio": -54.156288146972656,
        "singular_value_overlap": -118.78386688232422,
        "subspace_overlap": 36.262123107910156,
        "right_subspace_overlap": 58.28957748413086,
        "activation_l2_distance": 27.80995750427246,
        "activation_cosine_similarity": 28.254077911376953,
        "activation_magnitude_ratio": -32.2790412902832,
        "activation_dot_product": 39.73994445800781,
        "encoder_gradient_cosine_similarity": -0.16069121658802032,
        "encoder_gradient_l2_distance": -87.05819702148438,
        "encoder_gradient_dot_product": 57.62298583984375,
        "input_gradient_cosine_similarity": 18.801210403442383,
        "input_gradient_l2_distance": -16.42667579650879,
        "input_gradient_dot_product": -59.42897415161133
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.3561680824459107,
      "val_r": 0.4988293265186892,
      "n_iterations": 801,
      "coefficients": {
        "right_subspace_overlap_top_k": 60.37119674682617,
        "right_subspace_overlap_bottom_k": -30.56692123413086,
        "interaction_matrix_overlap_top_k": 36.02169418334961,
        "interaction_matrix_overlap_bottom_k": -1.0193748474121094,
        "task_vector_cosine_similarity": 25.198827743530273,
        "task_vector_l2_distance": -17.316532135009766,
        "task_vector_dot_product": -50.57025146484375,
        "weight_space_angle": -13.981269836425781,
        "task_vector_magnitude_ratio": -57.22166442871094,
        "singular_value_overlap": 21.278154373168945,
        "subspace_overlap": 77.70414733886719,
        "right_subspace_overlap": 102.94650268554688,
        "activation_l2_distance": -42.82109451293945,
        "activation_cosine_similarity": 34.96208953857422,
        "activation_magnitude_ratio": -138.71673583984375,
        "activation_dot_product": 27.832365036010742,
        "encoder_gradient_cosine_similarity": 18.783559799194336,
        "encoder_gradient_l2_distance": -8.602293968200684,
        "encoder_gradient_dot_product": 106.18730926513672,
        "input_gradient_cosine_similarity": -4.959243297576904,
        "input_gradient_l2_distance": -55.93180465698242,
        "input_gradient_dot_product": -88.58064270019531
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5371017364505424,
      "val_r": 0.41615979498016753,
      "n_iterations": 683,
      "coefficients": {
        "right_subspace_overlap_top_k": 82.10346984863281,
        "right_subspace_overlap_bottom_k": 18.20338249206543,
        "interaction_matrix_overlap_top_k": -5.2871856689453125,
        "interaction_matrix_overlap_bottom_k": 21.02267074584961,
        "task_vector_cosine_similarity": 46.80506134033203,
        "task_vector_l2_distance": -45.797080993652344,
        "task_vector_dot_product": -23.344722747802734,
        "weight_space_angle": 31.100704193115234,
        "task_vector_magnitude_ratio": -51.54487228393555,
        "singular_value_overlap": -17.723682403564453,
        "subspace_overlap": -21.992982864379883,
        "right_subspace_overlap": 65.1648941040039,
        "activation_l2_distance": 2.662261962890625,
        "activation_cosine_similarity": -2.360407590866089,
        "activation_magnitude_ratio": -33.78129959106445,
        "activation_dot_product": 65.39219665527344,
        "encoder_gradient_cosine_similarity": -7.605556488037109,
        "encoder_gradient_l2_distance": -42.05016326904297,
        "encoder_gradient_dot_product": 43.948970794677734,
        "input_gradient_cosine_similarity": 0.6602802276611328,
        "input_gradient_l2_distance": -116.44046783447266,
        "input_gradient_dot_product": -8.137721061706543
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4396876756064741,
      "val_r": 0.19819438215342597,
      "n_iterations": 570,
      "coefficients": {
        "right_subspace_overlap_top_k": 26.688026428222656,
        "right_subspace_overlap_bottom_k": 6.457052230834961,
        "interaction_matrix_overlap_top_k": 90.92847442626953,
        "interaction_matrix_overlap_bottom_k": 24.436368942260742,
        "task_vector_cosine_similarity": 69.19943237304688,
        "task_vector_l2_distance": -55.697574615478516,
        "task_vector_dot_product": 34.005149841308594,
        "weight_space_angle": 57.20878601074219,
        "task_vector_magnitude_ratio": 34.25043869018555,
        "singular_value_overlap": -77.22864532470703,
        "subspace_overlap": 70.60289764404297,
        "right_subspace_overlap": -52.77300262451172,
        "activation_l2_distance": -119.03766632080078,
        "activation_cosine_similarity": -51.5002555847168,
        "activation_magnitude_ratio": -34.57675552368164,
        "activation_dot_product": 57.20264434814453,
        "encoder_gradient_cosine_similarity": 68.83868408203125,
        "encoder_gradient_l2_distance": -122.73629760742188,
        "encoder_gradient_dot_product": 26.375181198120117,
        "input_gradient_cosine_similarity": 20.27614974975586,
        "input_gradient_l2_distance": -33.583072662353516,
        "input_gradient_dot_product": -38.338653564453125
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.48970427358476704,
      "val_r": 0.27912156751527223,
      "n_iterations": 452,
      "coefficients": {
        "right_subspace_overlap_top_k": 13.632281303405762,
        "right_subspace_overlap_bottom_k": 49.04977035522461,
        "interaction_matrix_overlap_top_k": 0.5101363658905029,
        "interaction_matrix_overlap_bottom_k": 48.71220779418945,
        "task_vector_cosine_similarity": 26.102182388305664,
        "task_vector_l2_distance": -60.319366455078125,
        "task_vector_dot_product": -56.40859603881836,
        "weight_space_angle": -7.076048374176025,
        "task_vector_magnitude_ratio": -0.7800998687744141,
        "singular_value_overlap": -67.19249725341797,
        "subspace_overlap": 69.52140045166016,
        "right_subspace_overlap": 65.7823257446289,
        "activation_l2_distance": 4.506665229797363,
        "activation_cosine_similarity": 23.2895565032959,
        "activation_magnitude_ratio": -41.86920166015625,
        "activation_dot_product": 55.87702560424805,
        "encoder_gradient_cosine_similarity": 37.42495346069336,
        "encoder_gradient_l2_distance": -46.2615966796875,
        "encoder_gradient_dot_product": 59.63665771484375,
        "input_gradient_cosine_similarity": -27.91969871520996,
        "input_gradient_l2_distance": -80.4905014038086,
        "input_gradient_dot_product": -64.73080444335938
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8060815434448672,
      "val_r": 0.6870949060816748,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.414272308349609,
        "right_subspace_overlap_bottom_k": -3.574713945388794,
        "interaction_matrix_overlap_top_k": -3.5673444271087646,
        "interaction_matrix_overlap_bottom_k": 0.9291860461235046,
        "task_vector_cosine_similarity": 2.155277729034424,
        "task_vector_l2_distance": -0.5236181616783142,
        "task_vector_dot_product": 0.15415498614311218,
        "weight_space_angle": 5.0136399269104,
        "task_vector_magnitude_ratio": -0.9119338393211365,
        "singular_value_overlap": -0.4713329076766968,
        "subspace_overlap": 0.15780413150787354,
        "right_subspace_overlap": 4.590461730957031,
        "activation_l2_distance": 0.2568400204181671,
        "activation_cosine_similarity": 2.655496120452881,
        "activation_magnitude_ratio": -0.7244681715965271,
        "activation_dot_product": 1.2765123844146729,
        "encoder_gradient_cosine_similarity": 0.93659907579422,
        "encoder_gradient_l2_distance": -6.509300708770752,
        "encoder_gradient_dot_product": 1.1095741987228394,
        "input_gradient_cosine_similarity": 0.07986429333686829,
        "input_gradient_l2_distance": -4.9913458824157715,
        "input_gradient_dot_product": -1.4560811519622803
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5807346536479896,
      "val_r": 0.3759210306457248,
      "n_iterations": 968,
      "coefficients": {
        "right_subspace_overlap_top_k": -19.20079231262207,
        "right_subspace_overlap_bottom_k": 1.8734393119812012,
        "interaction_matrix_overlap_top_k": 48.67311096191406,
        "interaction_matrix_overlap_bottom_k": 6.312231063842773,
        "task_vector_cosine_similarity": 18.762765884399414,
        "task_vector_l2_distance": -26.901885986328125,
        "task_vector_dot_product": -6.76241397857666,
        "weight_space_angle": 19.69084358215332,
        "task_vector_magnitude_ratio": -14.75572395324707,
        "singular_value_overlap": -26.06504249572754,
        "subspace_overlap": 20.325063705444336,
        "right_subspace_overlap": -5.9201250076293945,
        "activation_l2_distance": 1.49440336227417,
        "activation_cosine_similarity": 17.625211715698242,
        "activation_magnitude_ratio": 6.069802761077881,
        "activation_dot_product": -0.57303386926651,
        "encoder_gradient_cosine_similarity": 10.186891555786133,
        "encoder_gradient_l2_distance": 3.8369951248168945,
        "encoder_gradient_dot_product": 35.300323486328125,
        "input_gradient_cosine_similarity": 16.397462844848633,
        "input_gradient_l2_distance": -75.2499008178711,
        "input_gradient_dot_product": -30.121227264404297
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}