{
  "aggregate_metrics": {
    "train_r": 0.421620837883215,
    "train_p": 4.64161144617585e-139,
    "val_r": 0.1070809943945154,
    "val_p": 0.04288718413441424
  },
  "per_fold_stats": {
    "train_r_mean": 0.5024487030867464,
    "train_r_std": 0.05680290509516255,
    "val_r_mean": 0.4055317888759008,
    "val_r_std": 0.14569052101049115,
    "n_nonzero_mean": 16.15,
    "n_nonzero_std": 4.065402809070707
  },
  "average_coefficients": {
    "right_subspace_overlap_top_k": 0.000805655843578279,
    "right_subspace_overlap_bottom_k": 0.002635219134390354,
    "interaction_matrix_overlap_top_k": 3.265680425101891e-05,
    "interaction_matrix_overlap_bottom_k": 0.014827171340584755,
    "effective_rank": -0.00045544159365817904,
    "effective_rank_mergeability_score": 0.0003584517980925739,
    "stable_rank": -0.0006458301795646548,
    "spectral_gap": 0.0005114486557431519,
    "singular_value_ratio": -0.0005408239085227251,
    "layerwise_effective_rank": -0.00045433081686496735,
    "layerwise_effective_rank_mergeability_score": 0.0001990750606637448,
    "task_vector_cosine_similarity": 0.00024969756486825645,
    "task_vector_l2_distance": -0.009389296174049377,
    "task_vector_dot_product": -0.00043643469689413905,
    "weight_space_angle": 0.0001781316677806899,
    "task_vector_magnitude_ratio": -0.0010780319571495056,
    "singular_value_overlap": -0.009563101455569267,
    "subspace_overlap": 0.0007844320498406887,
    "right_subspace_overlap": -9.37360746320337e-05,
    "activation_l2_distance": -0.00047822119086049497,
    "activation_cosine_similarity": -0.0001839774486143142,
    "activation_magnitude_ratio": -0.0023684550542384386,
    "activation_dot_product": -0.0010212415363639593,
    "encoder_gradient_cosine_similarity": -0.00016947943367995322,
    "encoder_gradient_l2_distance": -0.005303363315761089,
    "encoder_gradient_dot_product": 0.00012993000564165413,
    "input_gradient_cosine_similarity": 0.0007108992431312799,
    "input_gradient_l2_distance": -0.011019079945981503,
    "input_gradient_dot_product": -0.0021924260072410107
  },
  "coefficient_std": {
    "right_subspace_overlap_top_k": 0.0020825702231377363,
    "right_subspace_overlap_bottom_k": 0.003239803947508335,
    "interaction_matrix_overlap_top_k": 0.0010138218058273196,
    "interaction_matrix_overlap_bottom_k": 0.004454140551388264,
    "effective_rank": 0.0006450212677009404,
    "effective_rank_mergeability_score": 0.000757409434299916,
    "stable_rank": 0.0007352279499173164,
    "spectral_gap": 0.0008289241814054549,
    "singular_value_ratio": 0.0009193870355375111,
    "layerwise_effective_rank": 0.0007528779678978026,
    "layerwise_effective_rank_mergeability_score": 0.0008836191846057773,
    "task_vector_cosine_similarity": 0.0013643766287714243,
    "task_vector_l2_distance": 0.003601330565288663,
    "task_vector_dot_product": 0.0020834757015109062,
    "weight_space_angle": 0.0015238921623677015,
    "task_vector_magnitude_ratio": 0.000996178132481873,
    "singular_value_overlap": 0.0022803270258009434,
    "subspace_overlap": 0.0011169963981956244,
    "right_subspace_overlap": 0.0011875246418640018,
    "activation_l2_distance": 0.0019319171551615,
    "activation_cosine_similarity": 0.0007783207111060619,
    "activation_magnitude_ratio": 0.0008975396049208939,
    "activation_dot_product": 0.001674165716394782,
    "encoder_gradient_cosine_similarity": 0.000848659488838166,
    "encoder_gradient_l2_distance": 0.002117765136063099,
    "encoder_gradient_dot_product": 0.0012944330228492618,
    "input_gradient_cosine_similarity": 0.000991123029962182,
    "input_gradient_l2_distance": 0.0027732413727790117,
    "input_gradient_dot_product": 0.0015784751158207655
  },
  "nonzero_frequency": {
    "right_subspace_overlap_top_k": 0.35,
    "right_subspace_overlap_bottom_k": 0.85,
    "interaction_matrix_overlap_top_k": 0.4,
    "interaction_matrix_overlap_bottom_k": 0.95,
    "effective_rank": 0.35,
    "effective_rank_mergeability_score": 0.35,
    "stable_rank": 0.45,
    "spectral_gap": 0.45,
    "singular_value_ratio": 0.3,
    "layerwise_effective_rank": 0.3,
    "layerwise_effective_rank_mergeability_score": 0.25,
    "task_vector_cosine_similarity": 0.4,
    "task_vector_l2_distance": 1.0,
    "task_vector_dot_product": 0.5,
    "weight_space_angle": 0.55,
    "task_vector_magnitude_ratio": 0.65,
    "singular_value_overlap": 1.0,
    "subspace_overlap": 0.4,
    "right_subspace_overlap": 0.4,
    "activation_l2_distance": 0.6,
    "activation_cosine_similarity": 0.3,
    "activation_magnitude_ratio": 0.95,
    "activation_dot_product": 0.5,
    "encoder_gradient_cosine_similarity": 0.25,
    "encoder_gradient_l2_distance": 1.0,
    "encoder_gradient_dot_product": 0.3,
    "input_gradient_cosine_similarity": 0.55,
    "input_gradient_l2_distance": 1.0,
    "input_gradient_dot_product": 0.8
  },
  "fold_results": [
    {
      "fold": 0,
      "held_out_task": "SUN397",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.44571185559094634,
      "val_r": 0.4222463259977923,
      "n_iterations": 280,
      "n_nonzero_coefficients": 25,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0023203983437269926,
        "right_subspace_overlap_bottom_k": 0.0021194303408265114,
        "interaction_matrix_overlap_top_k": -0.001140923472121358,
        "interaction_matrix_overlap_bottom_k": 0.013346751220524311,
        "effective_rank": -0.0018136712023988366,
        "effective_rank_mergeability_score": 0.0011418345384299755,
        "stable_rank": -0.0016534366877749562,
        "spectral_gap": 0.0022520325146615505,
        "singular_value_ratio": -0.0023279183078557253,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0014915046049281955,
        "task_vector_l2_distance": -0.007901482284069061,
        "task_vector_dot_product": -0.003193603130057454,
        "weight_space_angle": 0.004511088132858276,
        "task_vector_magnitude_ratio": -0.0036335764452815056,
        "singular_value_overlap": -0.011697445064783096,
        "subspace_overlap": 0.0014839833602309227,
        "right_subspace_overlap": 0.0011793591547757387,
        "activation_l2_distance": -0.0035930625163018703,
        "activation_cosine_similarity": 0.0012809396721422672,
        "activation_magnitude_ratio": -0.002092531882226467,
        "activation_dot_product": -0.0033512571826577187,
        "encoder_gradient_cosine_similarity": -0.0014425376430153847,
        "encoder_gradient_l2_distance": -0.006484708283096552,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.007723072078078985,
        "input_gradient_dot_product": -0.005421279463917017
      }
    },
    {
      "fold": 1,
      "held_out_task": "Cars",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.39286968024858393,
      "val_r": 0.4527938212566739,
      "n_iterations": 370,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.002347813919186592,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.011839976534247398,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": -0.0012218230403959751,
        "stable_rank": 0.0,
        "spectral_gap": -0.0011791171273216605,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.0012400668347254395,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.004510622937232256,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0010091352742165327,
        "singular_value_overlap": -0.009576906450092793,
        "subspace_overlap": 0.0019212467595934868,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002894094679504633,
        "activation_dot_product": -0.0026500271633267403,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.008138502016663551,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.001103008515201509,
        "input_gradient_l2_distance": -0.009985480457544327,
        "input_gradient_dot_product": -0.0013316994300112128
      }
    },
    {
      "fold": 2,
      "held_out_task": "RESISC45",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5091263655071478,
      "val_r": 0.48135550710057395,
      "n_iterations": 219,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0011311606504023075,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.015773914754390717,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.003730436787009239,
        "task_vector_l2_distance": -0.008537748828530312,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0019212665501981974,
        "task_vector_magnitude_ratio": -0.0012363189598545432,
        "singular_value_overlap": -0.009208344854414463,
        "subspace_overlap": 0.0011077579110860825,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0017499782843515277,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0017974991351366043,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.005102494265884161,
        "encoder_gradient_dot_product": 0.0014464739942923188,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010709858499467373,
        "input_gradient_dot_product": -0.0020882762037217617
      }
    },
    {
      "fold": 3,
      "held_out_task": "EuroSAT",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.461974952597424,
      "val_r": 0.49440456993283666,
      "n_iterations": 450,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": -0.002531318925321102,
        "interaction_matrix_overlap_top_k": -0.0010171683970838785,
        "interaction_matrix_overlap_bottom_k": 0.018459107726812363,
        "effective_rank": -0.0010221963748335838,
        "effective_rank_mergeability_score": 0.0021201292984187603,
        "stable_rank": -0.0017331361304968596,
        "spectral_gap": 0.0010148759465664625,
        "singular_value_ratio": -0.0017621696460992098,
        "layerwise_effective_rank": -0.0015539826126769185,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.00967493001371622,
        "task_vector_dot_product": -0.0011629078071564436,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0012375029036775231,
        "singular_value_overlap": -0.01061371061950922,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002974801231175661,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.001663600793108344,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010411418043076992,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 4,
      "held_out_task": "SVHN",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5676493249769774,
      "val_r": 0.5996495069981022,
      "n_iterations": 274,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.006091718561947346,
        "interaction_matrix_overlap_top_k": -0.0014750820118933916,
        "interaction_matrix_overlap_bottom_k": 0.01552807167172432,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01384891476482153,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0010690196650102735,
        "singular_value_overlap": -0.010451487265527248,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0018930187216028571,
        "activation_l2_distance": 0.00212780199944973,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002306812908500433,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0014547175960615277,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.0122010363265872,
        "input_gradient_dot_product": -0.002056861063465476
      }
    },
    {
      "fold": 5,
      "held_out_task": "GTSRB",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.44870857452606383,
      "val_r": 0.775132297944561,
      "n_iterations": 170,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0014500803081318736,
        "right_subspace_overlap_bottom_k": 0.004181359428912401,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.022548800334334373,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.001125953858718276,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": -0.001018450129777193,
        "task_vector_cosine_similarity": 0.0035276487469673157,
        "task_vector_l2_distance": -0.011588611640036106,
        "task_vector_dot_product": 0.001334197586402297,
        "weight_space_angle": -0.0010486497776582837,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.010213136672973633,
        "subspace_overlap": 0.0014709761599078774,
        "right_subspace_overlap": 0.0010734976967796683,
        "activation_l2_distance": 0.0011034727795049548,
        "activation_cosine_similarity": -0.0015862511936575174,
        "activation_magnitude_ratio": -0.0023220342118293047,
        "activation_dot_product": 0.0010268723126500845,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.007174415048211813,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0011241178726777434,
        "input_gradient_l2_distance": -0.011929403059184551,
        "input_gradient_dot_product": -0.001540245721116662
      }
    },
    {
      "fold": 6,
      "held_out_task": "MNIST",
      "n_train_pairs": 164,
      "n_val_pairs": 15,
      "train_r": 0.5821125889266203,
      "val_r": 0.14645334625705625,
      "n_iterations": 296,
      "n_nonzero_coefficients": 17,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0012238050112500787,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.015305436216294765,
        "effective_rank": -0.0010979793732985854,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0012277838541194797,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0012690227013081312,
        "task_vector_l2_distance": -0.007482216227799654,
        "task_vector_dot_product": -0.0041897352784872055,
        "weight_space_angle": 0.001013915054500103,
        "task_vector_magnitude_ratio": -0.0015986048383638263,
        "singular_value_overlap": -0.008794387802481651,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0010664567817002535,
        "activation_l2_distance": -0.0037347530014812946,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": 0.0,
        "activation_dot_product": -0.004996657371520996,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.007537780795246363,
        "encoder_gradient_dot_product": 0.001392293837852776,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.010918382555246353,
        "input_gradient_dot_product": -0.0033074317034333944
      }
    },
    {
      "fold": 7,
      "held_out_task": "DTD",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.45684139809392077,
      "val_r": 0.29162013931463054,
      "n_iterations": 346,
      "n_nonzero_coefficients": 11,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0018539070151746273,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.017741352319717407,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010144067928195,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.009122844785451889,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": -0.001834700582548976,
        "activation_magnitude_ratio": -0.0024103899486362934,
        "activation_dot_product": -0.0037911534309387207,
        "encoder_gradient_cosine_similarity": 0.0024318513460457325,
        "encoder_gradient_l2_distance": -0.0044255065731704235,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.006046957802027464,
        "input_gradient_dot_product": -0.0013490698765963316
      }
    },
    {
      "fold": 8,
      "held_out_task": "Flowers102",
      "n_train_pairs": 163,
      "n_val_pairs": 16,
      "train_r": 0.5229965223968887,
      "val_r": 0.4301127952767928,
      "n_iterations": 192,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0050124856643378735,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.01410472672432661,
        "effective_rank": -0.0011550089111551642,
        "effective_rank_mergeability_score": 0.0010081508662551641,
        "stable_rank": -0.0014482707483693957,
        "spectral_gap": 0.0013177110813558102,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0011779589112848043,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": -0.0012908177450299263,
        "task_vector_l2_distance": -0.013642065227031708,
        "task_vector_dot_product": -0.0012243182864040136,
        "weight_space_angle": -0.001292425673455,
        "task_vector_magnitude_ratio": -0.0024761250242590904,
        "singular_value_overlap": -0.010678036138415337,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0012710430892184377,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002535407431423664,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.006084258668124676,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0015526553615927696,
        "input_gradient_l2_distance": -0.012652521952986717,
        "input_gradient_dot_product": -0.001978909131139517
      }
    },
    {
      "fold": 9,
      "held_out_task": "PCAM",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5416763123362207,
      "val_r": 0.12554357039016265,
      "n_iterations": 302,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0,
        "interaction_matrix_overlap_top_k": 0.0011104519944638014,
        "interaction_matrix_overlap_bottom_k": 0.01901133731007576,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009270046837627888,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0010757308918982744,
        "task_vector_magnitude_ratio": -0.0011221537133678794,
        "singular_value_overlap": -0.0117877759039402,
        "subspace_overlap": 0.0011610242072492838,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002654546871781349,
        "activation_dot_product": -0.002929706359282136,
        "encoder_gradient_cosine_similarity": -0.0020852030720561743,
        "encoder_gradient_l2_distance": -0.003764198161661625,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": -0.0016281340504065156,
        "input_gradient_l2_distance": -0.011006636545062065,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 10,
      "held_out_task": "FER2013",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.512786172081922,
      "val_r": 0.40026867601164595,
      "n_iterations": 285,
      "n_nonzero_coefficients": 12,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.004650072194635868,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.01773810014128685,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0013689125189557672,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.013224311172962189,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0011978994589298964,
        "singular_value_overlap": -0.012077565304934978,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.002903333166614175,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0030341418460011482,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.007036716677248478,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0018709942232817411,
        "input_gradient_l2_distance": -0.01156660821288824,
        "input_gradient_dot_product": -0.0018999448511749506
      }
    },
    {
      "fold": 11,
      "held_out_task": "OxfordIIITPet",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.45062470296605384,
      "val_r": 0.31427006149389736,
      "n_iterations": 205,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0019071708666160703,
        "right_subspace_overlap_bottom_k": -0.0013132755411788821,
        "interaction_matrix_overlap_top_k": -0.00224139541387558,
        "interaction_matrix_overlap_bottom_k": 0.012960173189640045,
        "effective_rank": -0.0010479460470378399,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": -0.0013522794470191002,
        "spectral_gap": 0.0014064429560676217,
        "singular_value_ratio": -0.0012832351494580507,
        "layerwise_effective_rank": -0.0010870866244658828,
        "layerwise_effective_rank_mergeability_score": 0.0014384605456143618,
        "task_vector_cosine_similarity": -0.0012599441688507795,
        "task_vector_l2_distance": -0.006917568854987621,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.001555847586132586,
        "singular_value_overlap": -0.00688306475058198,
        "subspace_overlap": 0.0022116354666650295,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0017668663058429956,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.0010943937813863158,
        "encoder_gradient_l2_distance": -0.004904343280941248,
        "encoder_gradient_dot_product": -0.0012080720625817776,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.007916110567748547,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 12,
      "held_out_task": "STL10",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.4531981215851895,
      "val_r": 0.4817735515808811,
      "n_iterations": 296,
      "n_nonzero_coefficients": 13,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0014351021964102983,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.018854252994060516,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.009138327091932297,
        "task_vector_dot_product": 0.003216539043933153,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.010195150040090084,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.001034726737998426,
        "activation_l2_distance": 0.0019723628647625446,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0015764669515192509,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0057089561596512794,
        "encoder_gradient_dot_product": 0.004646002314984798,
        "input_gradient_cosine_similarity": 0.0027144313789904118,
        "input_gradient_l2_distance": -0.0109324986115098,
        "input_gradient_dot_product": -0.002830484649166465
      }
    },
    {
      "fold": 13,
      "held_out_task": "CIFAR100",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5092316254651469,
      "val_r": 0.5570392266193287,
      "n_iterations": 441,
      "n_nonzero_coefficients": 15,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0038765829522162676,
        "interaction_matrix_overlap_top_k": 0.001891683554276824,
        "interaction_matrix_overlap_bottom_k": 0.012549313716590405,
        "effective_rank": -0.0012847371399402618,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0010844095377251506,
        "task_vector_l2_distance": -0.009684487245976925,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": -0.0023163175210356712,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.009575161151587963,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0015075546689331532,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0019793016836047173,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": -0.001199305639602244,
        "encoder_gradient_l2_distance": -0.0048032477498054504,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0013692504726350307,
        "input_gradient_l2_distance": -0.010200755670666695,
        "input_gradient_dot_product": -0.0021259940695017576
      }
    },
    {
      "fold": 14,
      "held_out_task": "CIFAR10",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.453310627391652,
      "val_r": 0.47313669749576975,
      "n_iterations": 223,
      "n_nonzero_coefficients": 14,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0018236563773825765,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.014656581915915012,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010521027259528637,
        "task_vector_dot_product": 0.0010526261758059263,
        "weight_space_angle": -0.0017765236552804708,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.011949615553021431,
        "subspace_overlap": 0.0022469155956059694,
        "right_subspace_overlap": 0.0025337375700473785,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.0025384072214365005,
        "activation_dot_product": -0.0010790566448122263,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0065032243728637695,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0014968190807849169,
        "input_gradient_l2_distance": -0.013079710304737091,
        "input_gradient_dot_product": -0.0036103278398513794
      }
    },
    {
      "fold": 15,
      "held_out_task": "Food101",
      "n_train_pairs": 162,
      "n_val_pairs": 17,
      "train_r": 0.5099625093628805,
      "val_r": 0.3708040488278689,
      "n_iterations": 282,
      "n_nonzero_coefficients": 20,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.002914929296821356,
        "interaction_matrix_overlap_top_k": 0.0016745371976867318,
        "interaction_matrix_overlap_bottom_k": 0.011722266674041748,
        "effective_rank": -0.0016872929409146309,
        "effective_rank_mergeability_score": 0.0012064606416970491,
        "stable_rank": -0.0012113905977457762,
        "spectral_gap": 0.001147003029473126,
        "singular_value_ratio": -0.001252182642929256,
        "layerwise_effective_rank": -0.001244403189048171,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.010555845685303211,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": -0.0014293510466814041,
        "singular_value_overlap": -0.00532348221167922,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0014432856114581227,
        "activation_cosine_similarity": -0.0016111378790810704,
        "activation_magnitude_ratio": -0.00407773582264781,
        "activation_dot_product": -0.0022621818352490664,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.005802331492304802,
        "encoder_gradient_dot_product": -0.001771858660504222,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.01084964070469141,
        "input_gradient_dot_product": -0.003138167317956686
      }
    },
    {
      "fold": 16,
      "held_out_task": "FashionMNIST",
      "n_train_pairs": 160,
      "n_val_pairs": 19,
      "train_r": 0.5089611192108546,
      "val_r": 0.32915354571429495,
      "n_iterations": 237,
      "n_nonzero_coefficients": 9,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.005366808269172907,
        "interaction_matrix_overlap_top_k": 0.0018510326044633985,
        "interaction_matrix_overlap_bottom_k": 0.011521491222083569,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.01029190979897976,
        "task_vector_dot_product": 0.0,
        "weight_space_angle": 0.0,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.009727745316922665,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": 0.0,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.002283476060256362,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0020906743593513966,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0012549696257337928,
        "input_gradient_l2_distance": -0.011020966805517673,
        "input_gradient_dot_product": 0.0
      }
    },
    {
      "fold": 17,
      "held_out_task": "EMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5267837371146333,
      "val_r": 0.2635261604396759,
      "n_iterations": 221,
      "n_nonzero_coefficients": 23,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.0,
        "right_subspace_overlap_bottom_k": 0.0063421051017940044,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.018129749223589897,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0013284790329635143,
        "stable_rank": -0.0018927042838186026,
        "spectral_gap": 0.001919551519677043,
        "singular_value_ratio": -0.003152377437800169,
        "layerwise_effective_rank": -0.0013638725504279137,
        "layerwise_effective_rank_mergeability_score": 0.002056812634691596,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": -0.0070373909547924995,
        "task_vector_dot_product": -0.005632298532873392,
        "weight_space_angle": 0.001785901258699596,
        "task_vector_magnitude_ratio": -0.002646197099238634,
        "singular_value_overlap": -0.009749110788106918,
        "subspace_overlap": 0.004085102118551731,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.003513542003929615,
        "activation_cosine_similarity": 0.001191473682411015,
        "activation_magnitude_ratio": -0.004425188060849905,
        "activation_dot_product": -0.0014854302862659097,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.0027938843704760075,
        "encoder_gradient_dot_product": -0.0019062390783801675,
        "input_gradient_cosine_similarity": 0.001613496569916606,
        "input_gradient_l2_distance": -0.01902633160352707,
        "input_gradient_dot_product": -0.005622257478535175
      }
    },
    {
      "fold": 18,
      "held_out_task": "KMNIST",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.6405888430379537,
      "val_r": 0.35591086836630675,
      "n_iterations": 359,
      "n_nonzero_coefficients": 16,
      "coefficients": {
        "right_subspace_overlap_top_k": 0.008604146540164948,
        "right_subspace_overlap_bottom_k": -0.0011452274629846215,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.0,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0015858043916523457,
        "stable_rank": -0.0010286883916705847,
        "spectral_gap": 0.0012245199177414179,
        "singular_value_ratio": 0.0,
        "layerwise_effective_rank": -0.0026593119837343693,
        "layerwise_effective_rank_mergeability_score": 0.002744744997471571,
        "task_vector_cosine_similarity": 0.0,
        "task_vector_l2_distance": 0.0015563133638352156,
        "task_vector_dot_product": -0.0021564646158367395,
        "weight_space_angle": 0.0015031910734251142,
        "task_vector_magnitude_ratio": 0.0,
        "singular_value_overlap": -0.0024986830540001392,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": 0.0,
        "activation_l2_distance": -0.0035677198320627213,
        "activation_cosine_similarity": 0.0,
        "activation_magnitude_ratio": -0.00196931604295969,
        "activation_dot_product": 0.0,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.009542731568217278,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0,
        "input_gradient_l2_distance": -0.007053387816995382,
        "input_gradient_dot_product": -0.0035294685512781143
      }
    },
    {
      "fold": 19,
      "held_out_task": "RenderedSST2",
      "n_train_pairs": 161,
      "n_val_pairs": 18,
      "train_r": 0.5538590283178486,
      "val_r": 0.3454410604991651,
      "n_iterations": 231,
      "n_nonzero_coefficients": 19,
      "coefficients": {
        "right_subspace_overlap_top_k": -0.0023703977931290865,
        "right_subspace_overlap_bottom_k": 0.011524985544383526,
        "interaction_matrix_overlap_top_k": 0.0,
        "interaction_matrix_overlap_bottom_k": 0.014752030372619629,
        "effective_rank": 0.0,
        "effective_rank_mergeability_score": 0.0,
        "stable_rank": 0.0,
        "spectral_gap": 0.0,
        "singular_value_ratio": -0.0010385948698967695,
        "layerwise_effective_rank": 0.0,
        "layerwise_effective_rank_mergeability_score": 0.0,
        "task_vector_cosine_similarity": 0.001962746027857065,
        "task_vector_l2_distance": -0.015370659530162811,
        "task_vector_dot_product": 0.0032272711396217346,
        "weight_space_angle": 0.00202799029648304,
        "task_vector_magnitude_ratio": -0.0013489078264683485,
        "singular_value_overlap": -0.01113838329911232,
        "subspace_overlap": 0.0,
        "right_subspace_overlap": -0.0034655241761356592,
        "activation_l2_distance": 0.0013434863649308681,
        "activation_cosine_similarity": -0.0011198726715520024,
        "activation_magnitude_ratio": -0.0017300860490649939,
        "activation_dot_product": 0.0010937649058178067,
        "encoder_gradient_cosine_similarity": 0.0,
        "encoder_gradient_l2_distance": -0.005050968378782272,
        "encoder_gradient_dot_product": 0.0,
        "input_gradient_cosine_similarity": 0.0017463758122175932,
        "input_gradient_l2_distance": -0.015150820836424828,
        "input_gradient_dot_product": -0.002018110593780875
      }
    }
  ],
  "optimization_params": {
    "lambda_l1": 1.5,
    "n_iterations": 2000,
    "learning_rate": 0.01,
    "patience": 100,
    "convergence_threshold": 1e-05
  }
}