{
  "coefficients": {
    "right_subspace_overlap_top_k": 0.15542735038897568,
    "right_subspace_overlap_bottom_k": -0.26997868365761346,
    "interaction_matrix_overlap_top_k": -0.42099377568440144,
    "interaction_matrix_overlap_bottom_k": 0.3036423996582754,
    "effective_rank": 0.22809540963431998,
    "effective_rank_mergeability_score": 0.1040780369501592,
    "stable_rank": -0.183064502681024,
    "spectral_gap": 0.10569376501660466,
    "singular_value_ratio": 0.22647951274223593,
    "layerwise_effective_rank": 0.18081584156928793,
    "layerwise_effective_rank_mergeability_score": 0.1513576050151942,
    "task_vector_cosine_similarity": 0.1471606256938126,
    "task_vector_l2_distance": -0.03266029449518027,
    "task_vector_dot_product": 0.029803280415918034,
    "weight_space_angle": 0.10668476990176536,
    "task_vector_magnitude_ratio": -0.08899343616125323,
    "singular_value_overlap": 0.023436371154823502,
    "subspace_overlap": -0.007129360780304687,
    "right_subspace_overlap": 0.15543449040005278,
    "activation_l2_distance": 0.11597519344229186,
    "activation_cosine_similarity": 0.13582328221716844,
    "activation_magnitude_ratio": -0.009716296995015215,
    "activation_dot_product": -0.006289209768876086,
    "encoder_gradient_cosine_similarity": -0.010653219295694303,
    "encoder_gradient_l2_distance": -0.04850885729819487,
    "encoder_gradient_dot_product": -0.009250609545191524,
    "input_gradient_cosine_similarity": 0.007744335608658921,
    "input_gradient_l2_distance": -0.06694688493051429,
    "input_gradient_dot_product": -0.023467138516281
  },
  "correlation": {
    "train": 0.8549169083912536,
    "train_p_value": 7.449024345359661e-35,
    "validation": 0.44113767219870414,
    "validation_p_value": 0.0001482552405352178,
    "full_dataset": 0.6915561169822046,
    "full_dataset_p_value": 6.176317430353756e-28
  },
  "n_pairs": {
    "total": 187,
    "train": 118,
    "validation": 69
  },
  "n_metrics": 29,
  "target_metric": "acc/test/avg",
  "optimization": {
    "n_iterations": 1000,
    "total_iterations": 719,
    "stopped_early": true,
    "learning_rate": 0.01,
    "convergence_threshold": 0.0001,
    "patience": 50,
    "final_loss": -0.8529176662123873,
    "validation_split": 0.2,
    "random_seed": 42
  },
  "normalization": {
    "min_vals": {
      "right_subspace_overlap_top_k": 0.25041620259966396,
      "right_subspace_overlap_bottom_k": 0.2723849411974317,
      "interaction_matrix_overlap_top_k": 0.10403256360792888,
      "interaction_matrix_overlap_bottom_k": 0.14161783274491582,
      "effective_rank": 1.5310468673706055,
      "effective_rank_mergeability_score": 0.0006166696548461914,
      "stable_rank": 1.3470213413238525,
      "spectral_gap": 0.04846324399113655,
      "singular_value_ratio": 0.17907467484474182,
      "layerwise_effective_rank": 1.4840256127297484,
      "layerwise_effective_rank_mergeability_score": 0.05279409214075703,
      "task_vector_cosine_similarity": 0.017599662765860558,
      "task_vector_l2_distance": 1.1018004417419434,
      "task_vector_dot_product": 0.01899923011660576,
      "weight_space_angle": 65.43018249703549,
      "task_vector_magnitude_ratio": 0.17972049093878661,
      "singular_value_overlap": 0.8586736580110946,
      "subspace_overlap": 0.057509828710331105,
      "right_subspace_overlap": 0.07918855210520184,
      "activation_l2_distance": 1.3818771839141846,
      "activation_cosine_similarity": 0.765999436378479,
      "activation_magnitude_ratio": 0.8479683236390776,
      "activation_dot_product": 72.62097930908203,
      "encoder_gradient_cosine_similarity": -0.18100124597549438,
      "encoder_gradient_l2_distance": 0.2646402418613434,
      "encoder_gradient_dot_product": -0.09055434912443161,
      "input_gradient_cosine_similarity": -0.029451850801706314,
      "input_gradient_l2_distance": 0.008532422594726086,
      "input_gradient_dot_product": -0.00016633261111564934
    },
    "max_vals": {
      "right_subspace_overlap_top_k": 0.7592418675200329,
      "right_subspace_overlap_bottom_k": 0.4271782482496782,
      "interaction_matrix_overlap_top_k": 0.5886276431803433,
      "interaction_matrix_overlap_bottom_k": 0.2883538798349997,
      "effective_rank": 1.9993833303451538,
      "effective_rank_mergeability_score": 0.46895313262939453,
      "stable_rank": 1.9987672567367554,
      "spectral_gap": 0.8209252953529358,
      "singular_value_ratio": 0.9515367746353149,
      "layerwise_effective_rank": 1.947205907859243,
      "layerwise_effective_rank_mergeability_score": 0.5159743872702516,
      "task_vector_cosine_similarity": 0.4158017635345459,
      "task_vector_l2_distance": 5.254244804382324,
      "task_vector_dot_product": 2.7083942890167236,
      "weight_space_angle": 88.99156153777179,
      "task_vector_magnitude_ratio": 0.9982956026653382,
      "singular_value_overlap": 0.941358577530339,
      "subspace_overlap": 0.19920345094968686,
      "right_subspace_overlap": 0.24009334951076866,
      "activation_l2_distance": 7.238561630249023,
      "activation_cosine_similarity": 0.9904800057411194,
      "activation_magnitude_ratio": 0.9995727165966162,
      "activation_dot_product": 119.74378204345703,
      "encoder_gradient_cosine_similarity": 0.11323171108961105,
      "encoder_gradient_l2_distance": 2.7120490074157715,
      "encoder_gradient_dot_product": 0.06004917994141579,
      "input_gradient_cosine_similarity": 0.06875480711460114,
      "input_gradient_l2_distance": 0.31483009457588196,
      "input_gradient_dot_product": 0.0003173672594130039
    }
  }
}