{
  "weight_avg": {
    "aggregate_metrics": {
      "train": {
        "mse": 0.0031673703984699307,
        "mae": 0.04501044331328168,
        "r2": 0.22406406445069826,
        "pearson_r": 0.48043913857059845,
        "p_value": 9.31836890074701e-186
      },
      "validation": {
        "mse": 0.003380632558039914,
        "mae": 0.04746558161137226,
        "r2": 0.17181953587167975,
        "pearson_r": 0.41715428301016666,
        "p_value": 1.662746004816915e-16
      }
    },
    "per_fold_stats": {
      "train_r_mean": 0.5790587489091321,
      "train_r_std": 0.2860043286058345,
      "val_r_mean": 0.44862754229310225,
      "val_r_std": 0.2342729070818839
    },
    "feature_selection": {
      "n_selected_features": 30,
      "selected_features": [
        "stable_rank \u00d7 singular_value_ratio",
        "interaction_matrix_overlap_top_k \u00d7 singular_value_ratio",
        "task_vector_magnitude_ratio",
        "effective_rank \u00d7 layerwise_effective_rank",
        "activation_magnitude_ratio",
        "activation_dot_product",
        "singular_value_overlap",
        "effective_rank_mergeability_score \u00d7 spectral_gap",
        "activation_l2_distance",
        "encoder_gradient_cosine_similarity",
        "encoder_gradient_dot_product",
        "task_vector_dot_product",
        "right_subspace_overlap_top_k \u00d7 interaction_matrix_overlap_top_k",
        "effective_rank \u00d7 effective_rank_mergeability_score",
        "stable_rank \u00d7 spectral_gap",
        "effective_rank_mergeability_score \u00d7 layerwise_effective_rank",
        "right_subspace_overlap_bottom_k \u00d7 interaction_matrix_overlap_bottom_k",
        "input_gradient_dot_product",
        "layerwise_effective_rank",
        "interaction_matrix_overlap_bottom_k \u00d7 stable_rank",
        "activation_cosine_similarity",
        "right_subspace_overlap_top_k \u00d7 layerwise_effective_rank",
        "input_gradient_l2_distance",
        "encoder_gradient_l2_distance",
        "right_subspace_overlap_bottom_k \u00d7 layerwise_effective_rank",
        "interaction_matrix_overlap_top_k \u00d7 spectral_gap",
        "interaction_matrix_overlap_top_k",
        "interaction_matrix_overlap_bottom_k",
        "right_subspace_overlap_top_k \u00d7 interaction_matrix_overlap_bottom_k",
        "right_subspace_overlap_bottom_k \u00d7 interaction_matrix_overlap_top_k"
      ],
      "lasso_alpha": 0.0005428675439323859
    },
    "model_config": {
      "input_dim": 30,
      "hidden_dim": 8,
      "dropout": 0.4,
      "weight_decay": 0.001
    }
  },
  "arithmetic": {
    "aggregate_metrics": {
      "train": {
        "mse": 0.009671509156627105,
        "mae": 0.07828068007165365,
        "r2": -0.12842104539145294,
        "pearson_r": 0.1226504525208136,
        "p_value": 2.835332952784652e-12
      },
      "validation": {
        "mse": 0.007141806117585464,
        "mae": 0.06867556662541123,
        "r2": 0.16673145889887253,
        "pearson_r": 0.43649229235248427,
        "p_value": 4.376085665369065e-18
      }
    },
    "per_fold_stats": {
      "train_r_mean": 0.3074594601948378,
      "train_r_std": 0.2685140369588375,
      "val_r_mean": 0.2846454006074091,
      "val_r_std": 0.19677225646031504
    },
    "feature_selection": {
      "n_selected_features": 15,
      "selected_features": [
        "right_subspace_overlap_top_k",
        "interaction_matrix_overlap_bottom_k",
        "stable_rank",
        "task_vector_l2_distance",
        "task_vector_magnitude_ratio",
        "singular_value_overlap",
        "right_subspace_overlap",
        "activation_cosine_similarity",
        "activation_magnitude_ratio",
        "activation_dot_product",
        "encoder_gradient_l2_distance",
        "input_gradient_l2_distance",
        "input_gradient_dot_product",
        "right_subspace_overlap_top_k \u00d7 interaction_matrix_overlap_bottom_k",
        "right_subspace_overlap_bottom_k \u00d7 layerwise_effective_rank"
      ],
      "lasso_alpha": 0.0062505519252739694
    },
    "model_config": {
      "input_dim": 15,
      "hidden_dim": 8,
      "dropout": 0.4,
      "weight_decay": 0.001
    }
  },
  "tsv": {
    "aggregate_metrics": {
      "train": {
        "mse": 0.003349619496953961,
        "mae": 0.04539368526920834,
        "r2": 0.05145167202129364,
        "pearson_r": 0.385031376877594,
        "p_value": 2.3171219190077353e-114
      },
      "validation": {
        "mse": 0.0022261731634025087,
        "mae": 0.0381378355040149,
        "r2": 0.36959023738165775,
        "pearson_r": 0.6279922375987863,
        "p_value": 1.144151115376042e-40
      }
    },
    "per_fold_stats": {
      "train_r_mean": 0.5466768936300997,
      "train_r_std": 0.28314396525786256,
      "val_r_mean": 0.515652226329794,
      "val_r_std": 0.28873454295176976
    },
    "feature_selection": {
      "n_selected_features": 30,
      "selected_features": [
        "right_subspace_overlap_top_k",
        "activation_dot_product",
        "singular_value_overlap",
        "activation_l2_distance",
        "encoder_gradient_dot_product",
        "input_gradient_dot_product",
        "task_vector_l2_distance",
        "right_subspace_overlap_top_k \u00d7 interaction_matrix_overlap_top_k",
        "right_subspace_overlap",
        "task_vector_cosine_similarity",
        "interaction_matrix_overlap_top_k",
        "task_vector_dot_product",
        "interaction_matrix_overlap_bottom_k \u00d7 effective_rank",
        "interaction_matrix_overlap_top_k \u00d7 spectral_gap",
        "effective_rank \u00d7 effective_rank_mergeability_score",
        "input_gradient_l2_distance",
        "layerwise_effective_rank",
        "encoder_gradient_l2_distance",
        "interaction_matrix_overlap_bottom_k \u00d7 stable_rank",
        "right_subspace_overlap_bottom_k \u00d7 interaction_matrix_overlap_bottom_k",
        "activation_cosine_similarity",
        "right_subspace_overlap_top_k \u00d7 effective_rank",
        "interaction_matrix_overlap_top_k \u00d7 effective_rank",
        "interaction_matrix_overlap_top_k \u00d7 stable_rank",
        "right_subspace_overlap_bottom_k \u00d7 layerwise_effective_rank",
        "right_subspace_overlap_top_k \u00d7 layerwise_effective_rank",
        "right_subspace_overlap_bottom_k",
        "interaction_matrix_overlap_bottom_k",
        "right_subspace_overlap_top_k \u00d7 interaction_matrix_overlap_bottom_k",
        "right_subspace_overlap_bottom_k \u00d7 interaction_matrix_overlap_top_k"
      ],
      "lasso_alpha": 0.0002559547922699536
    },
    "model_config": {
      "input_dim": 30,
      "hidden_dim": 8,
      "dropout": 0.4,
      "weight_decay": 0.001
    }
  },
  "isotropic": {
    "aggregate_metrics": {
      "train": {
        "mse": 0.01405105661603318,
        "mae": 0.09241066571234875,
        "r2": -0.02457223614006554,
        "pearson_r": 0.1929612360027588,
        "p_value": 2.1255014013973193e-28
      },
      "validation": {
        "mse": 0.0148208560322768,
        "mae": 0.09349135340606474,
        "r2": -0.08070432149370821,
        "pearson_r": 0.11173149870624398,
        "p_value": 0.0345762071018506
      }
    },
    "per_fold_stats": {
      "train_r_mean": 0.28012861898835856,
      "train_r_std": 0.19045298646388595,
      "val_r_mean": 0.20021801820950436,
      "val_r_std": 0.2215491168457287
    },
    "feature_selection": {
      "n_selected_features": 12,
      "selected_features": [
        "interaction_matrix_overlap_bottom_k",
        "stable_rank",
        "task_vector_l2_distance",
        "task_vector_magnitude_ratio",
        "singular_value_overlap",
        "activation_magnitude_ratio",
        "activation_dot_product",
        "encoder_gradient_l2_distance",
        "input_gradient_l2_distance",
        "input_gradient_dot_product",
        "right_subspace_overlap_top_k \u00d7 interaction_matrix_overlap_bottom_k",
        "right_subspace_overlap_bottom_k \u00d7 spectral_gap"
      ],
      "lasso_alpha": 0.005179474679231213
    },
    "model_config": {
      "input_dim": 12,
      "hidden_dim": 8,
      "dropout": 0.4,
      "weight_decay": 0.001
    }
  }
}