{
  "aggregate_metrics": {
    "train_r": 0.22220084657269074,
    "train_p": 2.482273791210613e-37,
    "val_r": 0.2967493011021166,
    "val_p": 1.0368983310196897e-08
  },
  "per_fold_stats": {
    "train_r_mean": 0.7351355459825684,
    "train_r_std": 0.09186829122009306,
    "val_r_mean": 0.6026536589895402,
    "val_r_std": 0.21018584140999014
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 8.964734077453613,
    "right_subspace_overlap_bottom_k": -13.09703540802002,
    "interaction_matrix_overlap_top_k": 10.068421363830566,
    "interaction_matrix_overlap_bottom_k": -10.337394714355469,
    "task_vector_cosine_similarity": 5.036282539367676,
    "task_vector_l2_distance": -9.790189743041992,
    "task_vector_dot_product": 4.110795497894287,
    "weight_space_angle": -9.419816017150879,
    "task_vector_magnitude_ratio": 2.992100954055786,
    "singular_value_overlap": 10.956035614013672,
    "subspace_overlap": 4.772482395172119,
    "right_subspace_overlap": 20.481307983398438,
    "activation_l2_distance": -8.468992233276367,
    "activation_cosine_similarity": 6.356347560882568,
    "activation_magnitude_ratio": -16.329082489013672,
    "activation_dot_product": 17.70657730102539,
    "encoder_gradient_cosine_similarity": 10.545819282531738,
    "encoder_gradient_l2_distance": -15.376062393188477,
    "encoder_gradient_dot_product": 9.504496574401855,
    "input_gradient_cosine_similarity": 2.5283455848693848,
    "input_gradient_l2_distance": -16.381336212158203,
    "input_gradient_dot_product": -13.825215339660645
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 15.383045196533203,
    "right_subspace_overlap_bottom_k": 32.69923400878906,
    "interaction_matrix_overlap_top_k": 23.9586238861084,
    "interaction_matrix_overlap_bottom_k": 25.864200592041016,
    "task_vector_cosine_similarity": 31.20132827758789,
    "task_vector_l2_distance": 21.01969337463379,
    "task_vector_dot_product": 16.678035736083984,
    "weight_space_angle": 20.46914291381836,
    "task_vector_magnitude_ratio": 14.01434326171875,
    "singular_value_overlap": 19.521621704101562,
    "subspace_overlap": 46.30326461791992,
    "right_subspace_overlap": 36.45045471191406,
    "activation_l2_distance": 20.14162254333496,
    "activation_cosine_similarity": 21.525991439819336,
    "activation_magnitude_ratio": 32.64149475097656,
    "activation_dot_product": 31.280494689941406,
    "encoder_gradient_cosine_similarity": 25.674179077148438,
    "encoder_gradient_l2_distance": 17.197668075561523,
    "encoder_gradient_dot_product": 20.013519287109375,
    "input_gradient_cosine_similarity": 33.87791442871094,
    "input_gradient_l2_distance": 23.13755989074707,
    "input_gradient_dot_product": 32.00599670410156
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6064706900787769,
      "val_r": 0.5641097458158857,
      "n_iterations": 753,
      "coefficients": {
        "right_subspace_overlap_top_k": 39.587127685546875,
        "right_subspace_overlap_bottom_k": -118.87415313720703,
        "interaction_matrix_overlap_top_k": 7.388456344604492,
        "interaction_matrix_overlap_bottom_k": 3.343843936920166,
        "task_vector_cosine_similarity": -64.84566497802734,
        "task_vector_l2_distance": -34.315635681152344,
        "task_vector_dot_product": 4.927624225616455,
        "weight_space_angle": -45.51142501831055,
        "task_vector_magnitude_ratio": 22.4473934173584,
        "singular_value_overlap": -20.618711471557617,
        "subspace_overlap": 69.81598663330078,
        "right_subspace_overlap": 142.76986694335938,
        "activation_l2_distance": -74.12049102783203,
        "activation_cosine_similarity": -11.824684143066406,
        "activation_magnitude_ratio": -40.10370635986328,
        "activation_dot_product": 18.571468353271484,
        "encoder_gradient_cosine_similarity": 63.9158935546875,
        "encoder_gradient_l2_distance": -18.001163482666016,
        "encoder_gradient_dot_product": 43.03326416015625,
        "input_gradient_cosine_similarity": 76.7528305053711,
        "input_gradient_l2_distance": -32.48396682739258,
        "input_gradient_dot_product": -30.8562068939209
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7402803306980166,
      "val_r": 0.7147857963614986,
      "n_iterations": 994,
      "coefficients": {
        "right_subspace_overlap_top_k": 24.969905853271484,
        "right_subspace_overlap_bottom_k": -17.324562072753906,
        "interaction_matrix_overlap_top_k": -1.810536503791809,
        "interaction_matrix_overlap_bottom_k": -4.058625221252441,
        "task_vector_cosine_similarity": -23.965293884277344,
        "task_vector_l2_distance": -4.526321887969971,
        "task_vector_dot_product": 1.8062328100204468,
        "weight_space_angle": 1.1728359460830688,
        "task_vector_magnitude_ratio": -4.228585720062256,
        "singular_value_overlap": 12.351829528808594,
        "subspace_overlap": 4.260957717895508,
        "right_subspace_overlap": 8.617717742919922,
        "activation_l2_distance": 10.227856636047363,
        "activation_cosine_similarity": 13.602624893188477,
        "activation_magnitude_ratio": -2.4535393714904785,
        "activation_dot_product": 21.5261287689209,
        "encoder_gradient_cosine_similarity": 6.026854991912842,
        "encoder_gradient_l2_distance": -36.97501754760742,
        "encoder_gradient_dot_product": 1.3732370138168335,
        "input_gradient_cosine_similarity": 3.9308972358703613,
        "input_gradient_l2_distance": -4.825789451599121,
        "input_gradient_dot_product": -8.70036506652832
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.6624195964989904,
      "val_r": 0.621276202766503,
      "n_iterations": 641,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.94480037689209,
        "right_subspace_overlap_bottom_k": -41.484832763671875,
        "interaction_matrix_overlap_top_k": 43.31614303588867,
        "interaction_matrix_overlap_bottom_k": 9.337249755859375,
        "task_vector_cosine_similarity": 11.442689895629883,
        "task_vector_l2_distance": -25.535568237304688,
        "task_vector_dot_product": -3.5673420429229736,
        "weight_space_angle": -49.47127914428711,
        "task_vector_magnitude_ratio": -9.659984588623047,
        "singular_value_overlap": 6.728464603424072,
        "subspace_overlap": 14.162034034729004,
        "right_subspace_overlap": 21.141794204711914,
        "activation_l2_distance": -25.792266845703125,
        "activation_cosine_similarity": -28.174959182739258,
        "activation_magnitude_ratio": -10.743124961853027,
        "activation_dot_product": 64.86920928955078,
        "encoder_gradient_cosine_similarity": 25.00202178955078,
        "encoder_gradient_l2_distance": -57.4838981628418,
        "encoder_gradient_dot_product": 9.76522159576416,
        "input_gradient_cosine_similarity": 44.465431213378906,
        "input_gradient_l2_distance": -25.35070037841797,
        "input_gradient_dot_product": 17.0865421295166
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8269298721363962,
      "val_r": 0.8234490239296105,
      "n_iterations": 640,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.271224021911621,
        "right_subspace_overlap_bottom_k": -5.497565269470215,
        "interaction_matrix_overlap_top_k": -3.2091503143310547,
        "interaction_matrix_overlap_bottom_k": 4.987925052642822,
        "task_vector_cosine_similarity": 1.2105590105056763,
        "task_vector_l2_distance": 0.23734717071056366,
        "task_vector_dot_product": 0.04436783865094185,
        "weight_space_angle": 0.3561307489871979,
        "task_vector_magnitude_ratio": 0.012696713209152222,
        "singular_value_overlap": 0.09131447225809097,
        "subspace_overlap": -0.18984951078891754,
        "right_subspace_overlap": 0.5733010768890381,
        "activation_l2_distance": 0.5045979022979736,
        "activation_cosine_similarity": 1.258027195930481,
        "activation_magnitude_ratio": -0.0077879526652395725,
        "activation_dot_product": -0.30349597334861755,
        "encoder_gradient_cosine_similarity": 0.08094479888677597,
        "encoder_gradient_l2_distance": -0.8101377487182617,
        "encoder_gradient_dot_product": 0.026037273928523064,
        "input_gradient_cosine_similarity": 0.09896373748779297,
        "input_gradient_l2_distance": -0.6049871444702148,
        "input_gradient_dot_product": -0.13166841864585876
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6300064682872082,
      "val_r": 0.5963883411140988,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.3873255252838135,
        "right_subspace_overlap_bottom_k": -30.769582748413086,
        "interaction_matrix_overlap_top_k": 40.2374382019043,
        "interaction_matrix_overlap_bottom_k": -16.85730743408203,
        "task_vector_cosine_similarity": 2.6273059844970703,
        "task_vector_l2_distance": -2.4118127822875977,
        "task_vector_dot_product": 60.361419677734375,
        "weight_space_angle": -39.48272705078125,
        "task_vector_magnitude_ratio": -13.717864036560059,
        "singular_value_overlap": 43.69442367553711,
        "subspace_overlap": -49.584354400634766,
        "right_subspace_overlap": 39.221961975097656,
        "activation_l2_distance": -8.677084922790527,
        "activation_cosine_similarity": 71.1010513305664,
        "activation_magnitude_ratio": -58.91697692871094,
        "activation_dot_product": 25.097936630249023,
        "encoder_gradient_cosine_similarity": 22.777172088623047,
        "encoder_gradient_l2_distance": -31.347299575805664,
        "encoder_gradient_dot_product": -3.0668532848358154,
        "input_gradient_cosine_similarity": 24.250755310058594,
        "input_gradient_l2_distance": -38.81748580932617,
        "input_gradient_dot_product": -36.10901641845703
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7470636939266819,
      "val_r": 0.6950034947230807,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.325977325439453,
        "right_subspace_overlap_bottom_k": -16.718536376953125,
        "interaction_matrix_overlap_top_k": -1.7967344522476196,
        "interaction_matrix_overlap_bottom_k": -5.513145923614502,
        "task_vector_cosine_similarity": -5.321095943450928,
        "task_vector_l2_distance": -5.715384006500244,
        "task_vector_dot_product": 12.829328536987305,
        "weight_space_angle": 2.220716714859009,
        "task_vector_magnitude_ratio": -4.826107501983643,
        "singular_value_overlap": 8.885744094848633,
        "subspace_overlap": 3.0709946155548096,
        "right_subspace_overlap": 11.343734741210938,
        "activation_l2_distance": -1.807984709739685,
        "activation_cosine_similarity": 13.333150863647461,
        "activation_magnitude_ratio": -5.097618579864502,
        "activation_dot_product": 11.464625358581543,
        "encoder_gradient_cosine_similarity": 9.025848388671875,
        "encoder_gradient_l2_distance": -15.03689956665039,
        "encoder_gradient_dot_product": 2.9637646675109863,
        "input_gradient_cosine_similarity": 8.56866455078125,
        "input_gradient_l2_distance": -20.04363441467285,
        "input_gradient_dot_product": -11.156867027282715
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5516878999632435,
      "val_r": 0.5307562774265555,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -23.178144454956055,
        "right_subspace_overlap_bottom_k": 76.39196014404297,
        "interaction_matrix_overlap_top_k": -12.386116981506348,
        "interaction_matrix_overlap_bottom_k": -78.38636016845703,
        "task_vector_cosine_similarity": 59.50223159790039,
        "task_vector_l2_distance": -45.5788688659668,
        "task_vector_dot_product": -25.787721633911133,
        "weight_space_angle": -37.587310791015625,
        "task_vector_magnitude_ratio": 39.89311218261719,
        "singular_value_overlap": 61.9228401184082,
        "subspace_overlap": 166.42567443847656,
        "right_subspace_overlap": 13.56334400177002,
        "activation_l2_distance": -21.22174072265625,
        "activation_cosine_similarity": 44.67184829711914,
        "activation_magnitude_ratio": -67.61686706542969,
        "activation_dot_product": 125.56551361083984,
        "encoder_gradient_cosine_similarity": -31.53959083557129,
        "encoder_gradient_l2_distance": -54.07314682006836,
        "encoder_gradient_dot_product": 69.27957153320312,
        "input_gradient_cosine_similarity": -10.547005653381348,
        "input_gradient_l2_distance": -104.66464233398438,
        "input_gradient_dot_product": -143.6501007080078
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7700043765024934,
      "val_r": 0.33662626175708893,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.238802909851074,
        "right_subspace_overlap_bottom_k": -3.491987705230713,
        "interaction_matrix_overlap_top_k": -0.7030606269836426,
        "interaction_matrix_overlap_bottom_k": -1.8622695207595825,
        "task_vector_cosine_similarity": 0.03689584508538246,
        "task_vector_l2_distance": 0.008571439422667027,
        "task_vector_dot_product": -1.1950315237045288,
        "weight_space_angle": 1.8346959352493286,
        "task_vector_magnitude_ratio": -0.14668430387973785,
        "singular_value_overlap": 1.289555549621582,
        "subspace_overlap": 0.34849780797958374,
        "right_subspace_overlap": 4.998836040496826,
        "activation_l2_distance": 0.33996182680130005,
        "activation_cosine_similarity": 5.94489860534668,
        "activation_magnitude_ratio": -1.0070618391036987,
        "activation_dot_product": -1.3789606094360352,
        "encoder_gradient_cosine_similarity": 1.23407781124115,
        "encoder_gradient_l2_distance": -5.466862678527832,
        "encoder_gradient_dot_product": 0.24952243268489838,
        "input_gradient_cosine_similarity": 0.9479163289070129,
        "input_gradient_l2_distance": -3.522059679031372,
        "input_gradient_dot_product": 0.30140697956085205
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.7070442072921976,
      "val_r": 0.7187500413942585,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.2652280628681183,
        "right_subspace_overlap_bottom_k": -11.503569602966309,
        "interaction_matrix_overlap_top_k": 10.341582298278809,
        "interaction_matrix_overlap_bottom_k": -16.169687271118164,
        "task_vector_cosine_similarity": 30.69856834411621,
        "task_vector_l2_distance": 2.4831628799438477,
        "task_vector_dot_product": 5.128949165344238,
        "weight_space_angle": 16.04767417907715,
        "task_vector_magnitude_ratio": -2.9280970096588135,
        "singular_value_overlap": 14.112335205078125,
        "subspace_overlap": -6.2087016105651855,
        "right_subspace_overlap": 11.066863059997559,
        "activation_l2_distance": -18.78141212463379,
        "activation_cosine_similarity": -4.300518035888672,
        "activation_magnitude_ratio": -3.6357202529907227,
        "activation_dot_product": 16.258472442626953,
        "encoder_gradient_cosine_similarity": -3.8194580078125,
        "encoder_gradient_l2_distance": -29.004772186279297,
        "encoder_gradient_dot_product": -5.557531833648682,
        "input_gradient_cosine_similarity": 9.21386432647705,
        "input_gradient_l2_distance": -11.740523338317871,
        "input_gradient_dot_product": -0.43747061491012573
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7437696277842853,
      "val_r": 0.44992279865121815,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 10.923087120056152,
        "right_subspace_overlap_bottom_k": -12.868194580078125,
        "interaction_matrix_overlap_top_k": 10.881758689880371,
        "interaction_matrix_overlap_bottom_k": -10.035015106201172,
        "task_vector_cosine_similarity": -5.208014965057373,
        "task_vector_l2_distance": -2.877157688140869,
        "task_vector_dot_product": 0.5582937598228455,
        "weight_space_angle": 5.190859794616699,
        "task_vector_magnitude_ratio": -3.9388933181762695,
        "singular_value_overlap": 6.708451271057129,
        "subspace_overlap": -0.612207293510437,
        "right_subspace_overlap": 13.711387634277344,
        "activation_l2_distance": 7.008294105529785,
        "activation_cosine_similarity": 1.0703636407852173,
        "activation_magnitude_ratio": 1.3914363384246826,
        "activation_dot_product": -2.214320421218872,
        "encoder_gradient_cosine_similarity": 7.714527130126953,
        "encoder_gradient_l2_distance": -10.381087303161621,
        "encoder_gradient_dot_product": 4.930715560913086,
        "input_gradient_cosine_similarity": 2.714151620864868,
        "input_gradient_l2_distance": -14.62371826171875,
        "input_gradient_dot_product": -9.046195983886719
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8226288184723018,
      "val_r": 0.40855916646625423,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 4.124943733215332,
        "right_subspace_overlap_bottom_k": -8.834747314453125,
        "interaction_matrix_overlap_top_k": -0.03916019946336746,
        "interaction_matrix_overlap_bottom_k": 4.476210594177246,
        "task_vector_cosine_similarity": -0.020377997308969498,
        "task_vector_l2_distance": 1.1776378154754639,
        "task_vector_dot_product": -1.1455668210983276,
        "weight_space_angle": 0.45663607120513916,
        "task_vector_magnitude_ratio": 0.04193712770938873,
        "singular_value_overlap": 1.7542753219604492,
        "subspace_overlap": -2.787355661392212,
        "right_subspace_overlap": 2.4975740909576416,
        "activation_l2_distance": 0.5355664491653442,
        "activation_cosine_similarity": 5.133324146270752,
        "activation_magnitude_ratio": -0.4873967468738556,
        "activation_dot_product": -0.5257183313369751,
        "encoder_gradient_cosine_similarity": 0.2962820827960968,
        "encoder_gradient_l2_distance": -3.520446538925171,
        "encoder_gradient_dot_product": 0.002028319053351879,
        "input_gradient_cosine_similarity": 0.5876772403717041,
        "input_gradient_l2_distance": -2.2294366359710693,
        "input_gradient_dot_product": -0.49480679631233215
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8370098896898324,
      "val_r": 0.8517326178929981,
      "n_iterations": 789,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.3848310708999634,
        "right_subspace_overlap_bottom_k": -2.8865904808044434,
        "interaction_matrix_overlap_top_k": -1.3570460081100464,
        "interaction_matrix_overlap_bottom_k": 2.60048246383667,
        "task_vector_cosine_similarity": 0.39771589636802673,
        "task_vector_l2_distance": 0.10834603756666183,
        "task_vector_dot_product": 0.16703486442565918,
        "weight_space_angle": 0.340107262134552,
        "task_vector_magnitude_ratio": 0.02380652166903019,
        "singular_value_overlap": 0.04484318569302559,
        "subspace_overlap": 0.1348983347415924,
        "right_subspace_overlap": 0.7562817931175232,
        "activation_l2_distance": 0.364621639251709,
        "activation_cosine_similarity": 0.7768614888191223,
        "activation_magnitude_ratio": 0.0072567276656627655,
        "activation_dot_product": -0.21044136583805084,
        "encoder_gradient_cosine_similarity": 0.038754675537347794,
        "encoder_gradient_l2_distance": -0.37444257736206055,
        "encoder_gradient_dot_product": -0.022102709859609604,
        "input_gradient_cosine_similarity": 0.05702677741646767,
        "input_gradient_l2_distance": -0.30388501286506653,
        "input_gradient_dot_product": -0.049891602247953415
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.7831387054035719,
      "val_r": 0.7731543147427657,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 2.3695690631866455,
        "right_subspace_overlap_bottom_k": -2.4536635875701904,
        "interaction_matrix_overlap_top_k": -0.14743682742118835,
        "interaction_matrix_overlap_bottom_k": -0.0672307088971138,
        "task_vector_cosine_similarity": 1.9129635095596313,
        "task_vector_l2_distance": 0.48511967062950134,
        "task_vector_dot_product": -1.089677095413208,
        "weight_space_angle": 0.1002640426158905,
        "task_vector_magnitude_ratio": 0.0822291225194931,
        "singular_value_overlap": 0.7629808783531189,
        "subspace_overlap": -2.0264976024627686,
        "right_subspace_overlap": 1.4513187408447266,
        "activation_l2_distance": 1.0987303256988525,
        "activation_cosine_similarity": 2.810861110687256,
        "activation_magnitude_ratio": -0.18937359750270844,
        "activation_dot_product": -0.050494205206632614,
        "encoder_gradient_cosine_similarity": 0.6160839200019836,
        "encoder_gradient_l2_distance": -2.6516988277435303,
        "encoder_gradient_dot_product": 0.21757157146930695,
        "input_gradient_cosine_similarity": 0.3647516071796417,
        "input_gradient_l2_distance": -1.673959732055664,
        "input_gradient_dot_product": -0.9219530820846558
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7818548362877998,
      "val_r": 0.7303006407572976,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 18.677345275878906,
        "right_subspace_overlap_bottom_k": -11.349041938781738,
        "interaction_matrix_overlap_top_k": -3.7350993156433105,
        "interaction_matrix_overlap_bottom_k": -1.6441330909729004,
        "task_vector_cosine_similarity": 3.811042070388794,
        "task_vector_l2_distance": 1.8552998304367065,
        "task_vector_dot_product": -10.193337440490723,
        "weight_space_angle": 3.798065185546875,
        "task_vector_magnitude_ratio": -0.24818943440914154,
        "singular_value_overlap": 5.00038480758667,
        "subspace_overlap": -3.029571771621704,
        "right_subspace_overlap": 7.840240478515625,
        "activation_l2_distance": 3.582352638244629,
        "activation_cosine_similarity": 14.325505256652832,
        "activation_magnitude_ratio": -2.407200574874878,
        "activation_dot_product": 2.7011189460754395,
        "encoder_gradient_cosine_similarity": 2.738706588745117,
        "encoder_gradient_l2_distance": -14.84951114654541,
        "encoder_gradient_dot_product": 1.918343186378479,
        "input_gradient_cosine_similarity": 1.970139741897583,
        "input_gradient_l2_distance": -14.18893051147461,
        "input_gradient_dot_product": -5.574773788452148
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7498335522047939,
      "val_r": 0.7498991816100405,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.344101905822754,
        "right_subspace_overlap_bottom_k": -29.611614227294922,
        "interaction_matrix_overlap_top_k": 12.874199867248535,
        "interaction_matrix_overlap_bottom_k": -0.12185218185186386,
        "task_vector_cosine_similarity": -11.481728553771973,
        "task_vector_l2_distance": 1.712143898010254,
        "task_vector_dot_product": 7.93785285949707,
        "weight_space_angle": -1.367104411125183,
        "task_vector_magnitude_ratio": -2.3851828575134277,
        "singular_value_overlap": 10.176033973693848,
        "subspace_overlap": -5.043203353881836,
        "right_subspace_overlap": 16.495820999145508,
        "activation_l2_distance": -3.3141298294067383,
        "activation_cosine_similarity": 10.153569221496582,
        "activation_magnitude_ratio": -2.513495922088623,
        "activation_dot_product": 8.47474479675293,
        "encoder_gradient_cosine_similarity": 8.070306777954102,
        "encoder_gradient_l2_distance": -14.96561050415039,
        "encoder_gradient_dot_product": 5.914538860321045,
        "input_gradient_cosine_similarity": 5.082602024078369,
        "input_gradient_l2_distance": -7.639233589172363,
        "input_gradient_dot_product": -13.79436206817627
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.7910742523053762,
      "val_r": 0.20497417386482297,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 6.732938766479492,
        "right_subspace_overlap_bottom_k": -0.282446026802063,
        "interaction_matrix_overlap_top_k": 4.4192070960998535,
        "interaction_matrix_overlap_bottom_k": -6.728020668029785,
        "task_vector_cosine_similarity": -3.3421857357025146,
        "task_vector_l2_distance": -2.1374993324279785,
        "task_vector_dot_product": -0.5924954414367676,
        "weight_space_angle": 1.7194218635559082,
        "task_vector_magnitude_ratio": -0.6119191646575928,
        "singular_value_overlap": 5.228102684020996,
        "subspace_overlap": -1.7214847803115845,
        "right_subspace_overlap": 1.5034428834915161,
        "activation_l2_distance": 2.846754312515259,
        "activation_cosine_similarity": 5.172369956970215,
        "activation_magnitude_ratio": -1.787134051322937,
        "activation_dot_product": 2.0486552715301514,
        "encoder_gradient_cosine_similarity": 1.534339189529419,
        "encoder_gradient_l2_distance": -5.7666850090026855,
        "encoder_gradient_dot_product": 1.3853273391723633,
        "input_gradient_cosine_similarity": 0.5798174738883972,
        "input_gradient_l2_distance": -5.484748840332031,
        "input_gradient_dot_product": -3.716822862625122
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.8339247886326875,
      "val_r": 0.8018146760327679,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 1.01754629611969,
        "right_subspace_overlap_bottom_k": -5.335995197296143,
        "interaction_matrix_overlap_top_k": -2.078066825866699,
        "interaction_matrix_overlap_bottom_k": 4.876316547393799,
        "task_vector_cosine_similarity": 1.1465963125228882,
        "task_vector_l2_distance": 0.20923340320587158,
        "task_vector_dot_product": -0.06038608029484749,
        "weight_space_angle": 0.47142449021339417,
        "task_vector_magnitude_ratio": 0.04569700360298157,
        "singular_value_overlap": 0.0713970735669136,
        "subspace_overlap": -0.25688299536705017,
        "right_subspace_overlap": 1.0354695320129395,
        "activation_l2_distance": 0.2888197600841522,
        "activation_cosine_similarity": 0.9728414416313171,
        "activation_magnitude_ratio": -0.011523979716002941,
        "activation_dot_product": -0.238947331905365,
        "encoder_gradient_cosine_similarity": 0.08989469707012177,
        "encoder_gradient_l2_distance": -0.7109975814819336,
        "encoder_gradient_dot_product": 0.031633466482162476,
        "input_gradient_cosine_similarity": 0.14858274161815643,
        "input_gradient_l2_distance": -0.5744303464889526,
        "input_gradient_dot_product": -0.13938826322555542
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.7581263207314988,
      "val_r": 0.6718023651773614,
      "n_iterations": 1000,
      "coefficients": {
        "right_subspace_overlap_top_k": 7.73997688293457,
        "right_subspace_overlap_bottom_k": -7.687014579772949,
        "interaction_matrix_overlap_top_k": 4.575259685516357,
        "interaction_matrix_overlap_bottom_k": -6.237167835235596,
        "task_vector_cosine_similarity": -0.5760515928268433,
        "task_vector_l2_distance": 1.0787895917892456,
        "task_vector_dot_product": -2.4030706882476807,
        "weight_space_angle": -0.6496420502662659,
        "task_vector_magnitude_ratio": -0.7465716004371643,
        "singular_value_overlap": 4.723801612854004,
        "subspace_overlap": -1.7076458930969238,
        "right_subspace_overlap": 2.2223153114318848,
        "activation_l2_distance": 5.173887729644775,
        "activation_cosine_similarity": 13.730263710021973,
        "activation_magnitude_ratio": -1.3749322891235352,
        "activation_dot_product": -0.14736291766166687,
        "encoder_gradient_cosine_similarity": 2.683270215988159,
        "encoder_gradient_l2_distance": -6.123068332672119,
        "encoder_gradient_dot_product": 3.365597724914551,
        "input_gradient_cosine_similarity": 0.8801652193069458,
        "input_gradient_l2_distance": -12.682602882385254,
        "input_gradient_dot_product": -4.839468002319336
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.8366909906303619,
      "val_r": 0.7595054659264292,
      "n_iterations": 524,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.3913932740688324,
        "right_subspace_overlap_bottom_k": -3.3666281700134277,
        "interaction_matrix_overlap_top_k": -2.002469539642334,
        "interaction_matrix_overlap_bottom_k": 2.993035316467285,
        "task_vector_cosine_similarity": 0.9305042028427124,
        "task_vector_l2_distance": 0.15294381976127625,
        "task_vector_dot_product": 0.0784420520067215,
        "weight_space_angle": 0.4338989555835724,
        "task_vector_magnitude_ratio": 0.011349677108228207,
        "singular_value_overlap": 0.07408799976110458,
        "subspace_overlap": -0.24142789840698242,
        "right_subspace_overlap": 1.4923418760299683,
        "activation_l2_distance": 0.2476939558982849,
        "activation_cosine_similarity": 0.7099765539169312,
        "activation_magnitude_ratio": 0.024628903716802597,
        "activation_dot_product": -0.15026967227458954,
        "encoder_gradient_cosine_similarity": 0.05044812709093094,
        "encoder_gradient_l2_distance": -0.49949172139167786,
        "encoder_gradient_dot_product": 0.027367806062102318,
        "input_gradient_cosine_similarity": 0.08740367740392685,
        "input_gradient_l2_distance": -0.3629624843597412,
        "input_gradient_dot_product": -0.08382727205753326
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5227520021248523,
      "val_r": 0.05026259338026957,
      "n_iterations": 532,
      "coefficients": {
        "right_subspace_overlap_top_k": 52.30712890625,
        "right_subspace_overlap_bottom_k": -7.991944789886475,
        "interaction_matrix_overlap_top_k": 96.59927368164062,
        "interaction_matrix_overlap_bottom_k": -91.68213653564453,
        "task_vector_cosine_similarity": 101.76899719238281,
        "task_vector_l2_distance": -82.21415710449219,
        "task_vector_dot_product": 34.410987854003906,
        "weight_space_angle": -48.469539642333984,
        "task_vector_magnitude_ratio": 40.72188186645508,
        "singular_value_overlap": 56.11855697631836,
        "subspace_overlap": -89.3602294921875,
        "right_subspace_overlap": 107.32250213623047,
        "activation_l2_distance": -47.88388442993164,
        "activation_cosine_similarity": -33.34040451049805,
        "activation_magnitude_ratio": -129.65147399902344,
        "activation_dot_product": 62.77375411987305,
        "encoder_gradient_cosine_similarity": 94.37999725341797,
        "encoder_gradient_l2_distance": 0.5210189819335938,
        "encoder_gradient_dot_product": 54.2526741027832,
        "input_gradient_cosine_similarity": -119.58772277832031,
        "input_gradient_l2_distance": -25.809022903442383,
        "input_gradient_dot_product": -24.189056396484375
      }
    }
  ],
  "optimization_params": {
    "n_iterations": 1000,
    "learning_rate": 0.01,
    "patience": 50,
    "convergence_threshold": 0.0001
  }
}