{
  "coefficients": {
    "right_subspace_overlap_top_k": 0.15483502404776378,
    "right_subspace_overlap_bottom_k": -0.3339826081339457,
    "interaction_matrix_overlap_top_k": -0.40137181180232423,
    "interaction_matrix_overlap_bottom_k": 0.3363486248453292,
    "effective_rank": 0.25859879225780813,
    "effective_rank_mergeability_score": 0.049363316793296405,
    "stable_rank": -0.21137073708163467,
    "spectral_gap": 0.13055171863413192,
    "singular_value_ratio": 0.17741042617256178,
    "layerwise_effective_rank": 0.14403882597009177,
    "layerwise_effective_rank_mergeability_score": 0.1639232830810135,
    "task_vector_cosine_similarity": 0.1404837681711003,
    "task_vector_l2_distance": -0.0074521530460567136,
    "task_vector_dot_product": 0.032484980105505566,
    "weight_space_angle": 0.13039183540648577,
    "task_vector_magnitude_ratio": -0.01314740962358913,
    "singular_value_overlap": 0.0302894668807691,
    "subspace_overlap": -0.007969705329811538,
    "right_subspace_overlap": 0.15483912225662924,
    "activation_l2_distance": 0.08907319653575006,
    "activation_cosine_similarity": 0.12867941808801234,
    "activation_magnitude_ratio": -0.008527308397311164,
    "activation_dot_product": -0.01810569842243248,
    "encoder_gradient_cosine_similarity": -0.008809670085715794,
    "encoder_gradient_l2_distance": -0.04062167095331543,
    "encoder_gradient_dot_product": -0.004723592079007911,
    "input_gradient_cosine_similarity": 0.0037103914375470016,
    "input_gradient_l2_distance": -0.05258488467583932,
    "input_gradient_dot_product": -0.016354941052812048
  },
  "correlation": {
    "train": 0.8813444308478118,
    "train_p_value": 6.389062110242499e-39,
    "validation": 0.5344745296565481,
    "validation_p_value": 2.2416093076749635e-06,
    "full_dataset": 0.7522715511307757,
    "full_dataset_p_value": 5.373859433477235e-35
  },
  "n_pairs": {
    "total": 185,
    "train": 116,
    "validation": 69
  },
  "n_metrics": 29,
  "target_metric": "acc/test/avg",
  "optimization": {
    "n_iterations": 1000,
    "total_iterations": 780,
    "stopped_early": true,
    "learning_rate": 0.01,
    "convergence_threshold": 0.0001,
    "patience": 50,
    "final_loss": -0.8804086080662906,
    "validation_split": 0.2,
    "random_seed": 42
  },
  "normalization": {
    "min_vals": {
      "right_subspace_overlap_top_k": 0.25041620259966396,
      "right_subspace_overlap_bottom_k": 0.2723849411974317,
      "interaction_matrix_overlap_top_k": 0.10403256360792888,
      "interaction_matrix_overlap_bottom_k": 0.14161783274491582,
      "effective_rank": 1.5310468673706055,
      "effective_rank_mergeability_score": 0.0006166696548461914,
      "stable_rank": 1.3470213413238525,
      "spectral_gap": 0.04846324399113655,
      "singular_value_ratio": 0.17907467484474182,
      "layerwise_effective_rank": 1.4840256127297484,
      "layerwise_effective_rank_mergeability_score": 0.05279409214075703,
      "task_vector_cosine_similarity": 0.017599662765860558,
      "task_vector_l2_distance": 1.1018004417419434,
      "task_vector_dot_product": 0.01899923011660576,
      "weight_space_angle": 65.43018249703549,
      "task_vector_magnitude_ratio": 0.17972049093878661,
      "singular_value_overlap": 0.8586736580110946,
      "subspace_overlap": 0.057509828710331105,
      "right_subspace_overlap": 0.07918855210520184,
      "activation_l2_distance": 1.3818771839141846,
      "activation_cosine_similarity": 0.765999436378479,
      "activation_magnitude_ratio": 0.8479683236390776,
      "activation_dot_product": 72.62097930908203,
      "encoder_gradient_cosine_similarity": -0.18100124597549438,
      "encoder_gradient_l2_distance": 0.2646402418613434,
      "encoder_gradient_dot_product": -0.09055434912443161,
      "input_gradient_cosine_similarity": -0.02535366825759411,
      "input_gradient_l2_distance": 0.008532422594726086,
      "input_gradient_dot_product": -0.00016633261111564934
    },
    "max_vals": {
      "right_subspace_overlap_top_k": 0.7592418675200329,
      "right_subspace_overlap_bottom_k": 0.4271782482496782,
      "interaction_matrix_overlap_top_k": 0.5886276431803433,
      "interaction_matrix_overlap_bottom_k": 0.2883538798349997,
      "effective_rank": 1.9993833303451538,
      "effective_rank_mergeability_score": 0.46895313262939453,
      "stable_rank": 1.9987672567367554,
      "spectral_gap": 0.8209252953529358,
      "singular_value_ratio": 0.9515367746353149,
      "layerwise_effective_rank": 1.947205907859243,
      "layerwise_effective_rank_mergeability_score": 0.5159743872702516,
      "task_vector_cosine_similarity": 0.4158017635345459,
      "task_vector_l2_distance": 5.254244804382324,
      "task_vector_dot_product": 2.7083942890167236,
      "weight_space_angle": 88.99156153777179,
      "task_vector_magnitude_ratio": 0.9982956026653382,
      "singular_value_overlap": 0.941358577530339,
      "subspace_overlap": 0.19920345094968686,
      "right_subspace_overlap": 0.24009334951076866,
      "activation_l2_distance": 7.238561630249023,
      "activation_cosine_similarity": 0.9904800057411194,
      "activation_magnitude_ratio": 0.9995727165966162,
      "activation_dot_product": 119.74378204345703,
      "encoder_gradient_cosine_similarity": 0.11323171108961105,
      "encoder_gradient_l2_distance": 2.7120490074157715,
      "encoder_gradient_dot_product": 0.06004917994141579,
      "input_gradient_cosine_similarity": 0.06875480711460114,
      "input_gradient_l2_distance": 0.31483009457588196,
      "input_gradient_dot_product": 0.0003173672594130039
    }
  }
}