{
  "coefficients": {
    "right_subspace_overlap_top_k": 0.19556430979503944,
    "right_subspace_overlap_bottom_k": 0.044655352485868605,
    "interaction_matrix_overlap_top_k": -0.5937515700437175,
    "interaction_matrix_overlap_bottom_k": 0.129160809506071,
    "effective_rank": -0.013944322929909391,
    "effective_rank_mergeability_score": 0.29874922450179014,
    "stable_rank": 0.07669603156457319,
    "spectral_gap": 0.08560735402744798,
    "singular_value_ratio": 0.19919574079578045,
    "layerwise_effective_rank": 0.2613707706883656,
    "layerwise_effective_rank_mergeability_score": 0.023434130883517357,
    "task_vector_cosine_similarity": 0.19662506122097972,
    "task_vector_l2_distance": -0.13931585995010334,
    "task_vector_dot_product": 0.025740805040546995,
    "weight_space_angle": 0.041505406466240326,
    "task_vector_magnitude_ratio": -0.14287791618486248,
    "singular_value_overlap": -0.00785935549165283,
    "subspace_overlap": 0.004309959535366712,
    "right_subspace_overlap": 0.19556861939220035,
    "activation_l2_distance": 0.21909595364988477,
    "activation_cosine_similarity": 0.17276783283560385,
    "activation_magnitude_ratio": -0.03263350838494625,
    "activation_dot_product": 0.009703971942257517,
    "encoder_gradient_cosine_similarity": -0.03130459119810194,
    "encoder_gradient_l2_distance": -0.06208481053479434,
    "encoder_gradient_dot_product": -0.026130303402278763,
    "input_gradient_cosine_similarity": 0.005842078805262423,
    "input_gradient_l2_distance": -0.10500265760347437,
    "input_gradient_dot_product": -0.030688517412955373
  },
  "correlation": {
    "train": 0.7297950890526047,
    "train_p_value": 6.98713622223781e-21,
    "validation": 0.18117176597024018,
    "validation_p_value": 0.136279083876885,
    "full_dataset": 0.5182213212202322,
    "full_dataset_p_value": 3.048145443875653e-14
  },
  "n_pairs": {
    "total": 187,
    "train": 118,
    "validation": 69
  },
  "n_metrics": 29,
  "target_metric": "acc/test/avg",
  "optimization": {
    "n_iterations": 1000,
    "total_iterations": 471,
    "stopped_early": true,
    "learning_rate": 0.01,
    "convergence_threshold": 0.0001,
    "patience": 50,
    "final_loss": -0.7286163859583226,
    "validation_split": 0.2,
    "random_seed": 42
  },
  "normalization": {
    "min_vals": {
      "right_subspace_overlap_top_k": 0.25041620259966396,
      "right_subspace_overlap_bottom_k": 0.2723849411974317,
      "interaction_matrix_overlap_top_k": 0.10403256360792888,
      "interaction_matrix_overlap_bottom_k": 0.14161783274491582,
      "effective_rank": 1.5310468673706055,
      "effective_rank_mergeability_score": 0.0006166696548461914,
      "stable_rank": 1.3470213413238525,
      "spectral_gap": 0.04846324399113655,
      "singular_value_ratio": 0.17907467484474182,
      "layerwise_effective_rank": 1.4840256127297484,
      "layerwise_effective_rank_mergeability_score": 0.05279409214075703,
      "task_vector_cosine_similarity": 0.017599662765860558,
      "task_vector_l2_distance": 1.1018004417419434,
      "task_vector_dot_product": 0.01899923011660576,
      "weight_space_angle": 65.43018249703549,
      "task_vector_magnitude_ratio": 0.17972049093878661,
      "singular_value_overlap": 0.8586736580110946,
      "subspace_overlap": 0.057509828710331105,
      "right_subspace_overlap": 0.07918855210520184,
      "activation_l2_distance": 1.3818771839141846,
      "activation_cosine_similarity": 0.765999436378479,
      "activation_magnitude_ratio": 0.8479683236390776,
      "activation_dot_product": 72.62097930908203,
      "encoder_gradient_cosine_similarity": -0.18100124597549438,
      "encoder_gradient_l2_distance": 0.2646402418613434,
      "encoder_gradient_dot_product": -0.09055434912443161,
      "input_gradient_cosine_similarity": -0.029451850801706314,
      "input_gradient_l2_distance": 0.008532422594726086,
      "input_gradient_dot_product": -0.00016633261111564934
    },
    "max_vals": {
      "right_subspace_overlap_top_k": 0.7592418675200329,
      "right_subspace_overlap_bottom_k": 0.4271782482496782,
      "interaction_matrix_overlap_top_k": 0.5886276431803433,
      "interaction_matrix_overlap_bottom_k": 0.2883538798349997,
      "effective_rank": 1.9993833303451538,
      "effective_rank_mergeability_score": 0.46895313262939453,
      "stable_rank": 1.9987672567367554,
      "spectral_gap": 0.8209252953529358,
      "singular_value_ratio": 0.9515367746353149,
      "layerwise_effective_rank": 1.947205907859243,
      "layerwise_effective_rank_mergeability_score": 0.5159743872702516,
      "task_vector_cosine_similarity": 0.4158017635345459,
      "task_vector_l2_distance": 5.254244804382324,
      "task_vector_dot_product": 2.7083942890167236,
      "weight_space_angle": 88.99156153777179,
      "task_vector_magnitude_ratio": 0.9982956026653382,
      "singular_value_overlap": 0.941358577530339,
      "subspace_overlap": 0.19920345094968686,
      "right_subspace_overlap": 0.24009334951076866,
      "activation_l2_distance": 7.238561630249023,
      "activation_cosine_similarity": 0.9904800057411194,
      "activation_magnitude_ratio": 0.9995727165966162,
      "activation_dot_product": 119.74378204345703,
      "encoder_gradient_cosine_similarity": 0.11323171108961105,
      "encoder_gradient_l2_distance": 2.7120490074157715,
      "encoder_gradient_dot_product": 0.06004917994141579,
      "input_gradient_cosine_similarity": 0.06875480711460114,
      "input_gradient_l2_distance": 0.31483009457588196,
      "input_gradient_dot_product": 0.0003173672594130039
    }
  }
}