# ============================================================
# PANEL EMPIRICAL STUDY SWEEP CONFIGURATION
# This YAML governs a multi-round panel study with multiple waves and repeats.
# Each sweep runs a full endowment generation and regression experiment.
# ============================================================

# --- Sweep Settings (used only in the panel sweeper) ---
sweep: # 
  output_dir: "outputs/panel_study"      # Base directory for sweep outputs
  waves: ["W26", "W27", "W29", "W32", "W34", "W36", "W41", "W42", "W45", "W49", "W50", "W54", "W82", "W92"]  # Wave IDs to sweep over
  repeats: 3                              # Number of repeats per wave

# --- Metadata for Experiment Settings (copied and modified per sweep) ---
experiment:
  name: "ATP_panel_study"
  description: "Panel sweep across 17 waves using active endowment generation and regression."
  version: "v1"
  random_seed: 101        # Base seed; incremented per repeat

# --- Paths (relative to wave ID, which is injected per sweep step) ---
paths:
  survey_csv: "data/{wave}/info.csv"
  survey_yaml: "config/surveys/american_trend_panel.yaml"
  attribute_bank: "config/attribute_banks/attribute_bank.yaml"
  aggregate_json: "data/{wave}/{wave}_aggregate_results.json"

# --- Report Styling ---
report:
  endowment: styles/generation_report.css
  regression: styles/lasso_report.css

# ============================================================
#           [STAGE 1] ACTIVE ENDOWMENT GENERATION
# ============================================================

agent:
  type: openai
  model_name: gpt-4o
  formality: >
    You are completing a survey. Your answer should reflect the person described in the profile above, using their preferences, beliefs and experiences.
    Respond with only the final answer string, not the code or label in brackets.
    Do not include any reasoning, explanation, or commentary.
    Do not preface your answer with phrases like 'I would choose'.
    Just return the answer text exactly as it appears in the options.
  delay: 0.1
  kwargs:
    temperature: 0
    max_tokens: 128


endowment_model:
  model: gpt-4o-mini
  temperature: 0.9
  batch_size: 5
  delay: 0.5
  retry_failed: true
  max_attributes: 10
  randomize_attributes: true

attribute_learner:
  model: gpt-4o
  max_tokens: 1024

generation:
  target_n: 300
  initial_n: 10
  num_update_steps: 5
  parallel: true
  max_workers: 110
  question_patch:
    fraction: 0.75
    top_k: 3
    min_repeats: 2
  verbose: true

# ============================================================
#           [STAGE 2] LASSO / ELASTIC NET REGRESSION
# ============================================================

lasso:
  alpha_expr: "np.logspace(-5, 5, 30)"
  max_iter: 10000
  validation:
    strategy: "cv"
    cv_folds: 5
  post_selection_refit: false

elasticnet:
  alpha_expr: "np.logspace(-5, 5, 30)"
  l1_ratio_expr: "np.linspace(0.1, 1, 10)"
  max_iter: 10000
  validation:
    strategy: "cv"
    cv_folds: 5
  plot_style: "2D"
  post_selection_refit: false

split_settings:
  use_proxy_only: true
  train_val_split: ["train", "valid"]
  test_split: "test"

weight_assignment_model: "lasso"
