{
  "coefficients": {
    "right_subspace_overlap_top_k": 0.21237088721513123,
    "right_subspace_overlap_bottom_k": 0.08535094438461933,
    "interaction_matrix_overlap_top_k": -0.6771572991066357,
    "interaction_matrix_overlap_bottom_k": 0.126177422193125,
    "effective_rank": -0.06114983869903536,
    "effective_rank_mergeability_score": 0.3314390194101724,
    "stable_rank": 0.23068320067845344,
    "spectral_gap": 0.09581498144032964,
    "singular_value_ratio": 0.17447278949441977,
    "layerwise_effective_rank": 0.23063835601768362,
    "layerwise_effective_rank_mergeability_score": 0.03965082469345525,
    "task_vector_cosine_similarity": 0.16790097282112007,
    "task_vector_l2_distance": -0.13717934964460046,
    "task_vector_dot_product": 0.0379183201188404,
    "weight_space_angle": 0.03528308271912029,
    "task_vector_magnitude_ratio": -0.1493861106728701,
    "singular_value_overlap": -0.04183694112512797,
    "subspace_overlap": 0.029557059925638094,
    "right_subspace_overlap": 0.2123737118428693,
    "activation_l2_distance": 0.1863456585785412,
    "activation_cosine_similarity": 0.1447388671967402,
    "activation_magnitude_ratio": -0.04394078284560035,
    "activation_dot_product": -0.014579238955547072,
    "encoder_gradient_cosine_similarity": -0.038840509035691737,
    "encoder_gradient_l2_distance": -0.03882847353178189,
    "encoder_gradient_dot_product": -0.028044666736680445,
    "input_gradient_cosine_similarity": 0.008675820895637306,
    "input_gradient_l2_distance": -0.09752472328359045,
    "input_gradient_dot_product": -0.020923985988735044
  },
  "correlation": {
    "train": 0.7113909892481955,
    "train_p_value": 5.134051870773928e-19,
    "validation": 0.14877957011810208,
    "validation_p_value": 0.23316481353033203,
    "full_dataset": 0.5149269663042706,
    "full_dataset_p_value": 1.206538069420809e-13
  },
  "n_pairs": {
    "total": 181,
    "train": 115,
    "validation": 66
  },
  "n_metrics": 29,
  "target_metric": "acc/test/avg",
  "optimization": {
    "n_iterations": 1000,
    "total_iterations": 447,
    "stopped_early": true,
    "learning_rate": 0.01,
    "convergence_threshold": 0.0001,
    "patience": 50,
    "final_loss": -0.7114343674698356,
    "validation_split": 0.2,
    "random_seed": 42
  },
  "normalization": {
    "min_vals": {
      "right_subspace_overlap_top_k": 0.25041620259966396,
      "right_subspace_overlap_bottom_k": 0.2723849411974317,
      "interaction_matrix_overlap_top_k": 0.10403256360792888,
      "interaction_matrix_overlap_bottom_k": 0.14161783274491582,
      "effective_rank": 1.5509037971496582,
      "effective_rank_mergeability_score": 0.0006166696548461914,
      "stable_rank": 1.3663403987884521,
      "spectral_gap": 0.04846324399113655,
      "singular_value_ratio": 0.18976633250713348,
      "layerwise_effective_rank": 1.5061951007544805,
      "layerwise_effective_rank_mergeability_score": 0.05279409214075703,
      "task_vector_cosine_similarity": 0.017599662765860558,
      "task_vector_l2_distance": 1.1018004417419434,
      "task_vector_dot_product": 0.01899923011660576,
      "weight_space_angle": 65.43018249703549,
      "task_vector_magnitude_ratio": 0.19405712933159944,
      "singular_value_overlap": 0.8586736580110946,
      "subspace_overlap": 0.057509828710331105,
      "right_subspace_overlap": 0.07918855210520184,
      "activation_l2_distance": 1.3818771839141846,
      "activation_cosine_similarity": 0.765999436378479,
      "activation_magnitude_ratio": 0.8479683236390776,
      "activation_dot_product": 72.62097930908203,
      "encoder_gradient_cosine_similarity": -0.18100124597549438,
      "encoder_gradient_l2_distance": 0.2646402418613434,
      "encoder_gradient_dot_product": -0.09055434912443161,
      "input_gradient_cosine_similarity": -0.029451850801706314,
      "input_gradient_l2_distance": 0.008532422594726086,
      "input_gradient_dot_product": -0.00016633261111564934
    },
    "max_vals": {
      "right_subspace_overlap_top_k": 0.7592418675200329,
      "right_subspace_overlap_bottom_k": 0.4271782482496782,
      "interaction_matrix_overlap_top_k": 0.5886276431803433,
      "interaction_matrix_overlap_bottom_k": 0.2883538798349997,
      "effective_rank": 1.9993833303451538,
      "effective_rank_mergeability_score": 0.4490962028503418,
      "stable_rank": 1.9987672567367554,
      "spectral_gap": 0.8102336525917053,
      "singular_value_ratio": 0.9515367746353149,
      "layerwise_effective_rank": 1.947205907859243,
      "layerwise_effective_rank_mergeability_score": 0.4938048992455195,
      "task_vector_cosine_similarity": 0.4158017635345459,
      "task_vector_l2_distance": 5.254244804382324,
      "task_vector_dot_product": 2.7083942890167236,
      "weight_space_angle": 88.99156153777179,
      "task_vector_magnitude_ratio": 0.9982956026653382,
      "singular_value_overlap": 0.941358577530339,
      "subspace_overlap": 0.19920345094968686,
      "right_subspace_overlap": 0.24009334951076866,
      "activation_l2_distance": 7.238561630249023,
      "activation_cosine_similarity": 0.9904800057411194,
      "activation_magnitude_ratio": 0.9995727165966162,
      "activation_dot_product": 119.74378204345703,
      "encoder_gradient_cosine_similarity": 0.11323171108961105,
      "encoder_gradient_l2_distance": 2.7120490074157715,
      "encoder_gradient_dot_product": 0.06004917994141579,
      "input_gradient_cosine_similarity": 0.06875480711460114,
      "input_gradient_l2_distance": 0.31483009457588196,
      "input_gradient_dot_product": 0.0003173672594130039
    }
  }
}