# ============================================================
# MULTI-ROUND ENTROPY SWEEP CONFIGURATION
# ------------------------------------------------------------

# Identifying metadata for this experiment.
experiment:
  name: 'proxy_emulation_entropy_sweep'
  # Free-text summary; folded scalar, parsed as one single-line string.
  description: >-
    Evaluating model recovery of aggregate preferences
    using entropy-ranked proxy modes.
  # Same value as `runner.seed` in this file.
  # NOTE(review): which of the two seeds the code actually reads is not
  # visible from this file — confirm before changing only one of them.
  seed: 101

# --- INPUT FILES ---
# All paths are written as relative paths (presumably resolved against the
# working directory the runner is launched from — confirm).
paths:
  # Survey inputs.
  survey_csv: 'data/w42/info.csv'
  survey_yaml: 'config/surveys/american_trend_panel.yaml'
  # The three artifacts below all live in the same run directory
  # (outputs/ATP_w42_20250726_181405); when switching to another run,
  # update all three together.
  responses_csv: 'outputs/ATP_w42_20250726_181405/responses.csv'
  endowments_csv: 'outputs/ATP_w42_20250726_181405/endowments.csv'
  attribute_bank: 'outputs/ATP_w42_20250726_181405/attribute_bank.yaml'

# --- LASSO CONFIGURATION ---
lasso:
  # Stored as a string, not a list. As a NumPy expression it yields 30
  # log-spaced values from 1e-5 to 1e5.
  # NOTE(review): presumably evaluated by the config loader — confirm how,
  # since evaluating text from a config file deserves care.
  alpha_expr: 'np.logspace(-5, 5, 30)'
  # Iteration cap (presumably passed to the solver — confirm).
  max_iter: 10000
  # Model-selection scheme: strategy "cv" with 5 folds
  # (presumably k-fold cross-validation — confirm).
  validation:
    strategy: 'cv'
    cv_folds: 5
  # Post-selection refit is switched off.
  post_selection_refit: false

# --- ELASTICNET CONFIGURATION (optional) ---
# NOTE(review): `runner.models` in this file lists only "lasso", so this
# section is presumably not used by the current run — confirm.
elasticnet:
  # Both *_expr values are strings, not lists. As NumPy expressions:
  #   alpha_expr    -> 30 log-spaced values from 1e-5 to 1e5
  #   l1_ratio_expr -> 10 evenly spaced values from 0.1 to 1.0
  # NOTE(review): presumably evaluated by the config loader — confirm how.
  alpha_expr: 'np.logspace(-5, 5, 30)'
  l1_ratio_expr: 'np.linspace(0.1, 1.0, 10)'
  # Iteration cap (presumably passed to the solver — confirm).
  max_iter: 10000
  # Model-selection scheme: strategy "cv" with 5 folds
  # (presumably k-fold cross-validation — confirm).
  validation:
    strategy: 'cv'
    cv_folds: 5
  # Plot layout selector; only the value "2D" appears in this file.
  plot_style: '2D'
  # Post-selection refit is switched off.
  post_selection_refit: false

# --- SPLIT SETTINGS ---
split_settings:
  # Proxy-only mode is enabled.
  use_proxy_only: true
  # Split labels combined for training/validation.
  train_val_split:
    - 'train'
    - 'valid'
  # Split label held out for testing.
  test_split: 'test'

# --- ENTROPY SWEEP RUNNER SETTINGS ---
runner:
  # Regression models to run.
  models:
    - 'lasso'
  # How many times the run is repeated.
  n_repeats: 10
  # Proxy agents used in each run.
  n_proxies: 30
  # Ground-truth (GT) agents to assign.
  n_ground_truth: 30
  # GT modes are selected when above this entropy threshold.
  ground_truth_entropy_threshold: 0.4
  # Base seed; incremented across repeats.
  seed: 101
  # Switch to true to produce prediction/diagnostic plots.
  plot: false
  verbose: false
  # Directory that receives the outputs.
  output_dir: 'outputs/entropy_sweep'