# ============================================================
# PANEL EMPIRICAL STUDY SWEEP CONFIGURATION
# This YAML governs a multi-round panel study with multiple waves and repeats.
# Each sweep runs a full endowment generation and regression experiment.
# ============================================================

# --- Sweep Settings (used only in the panel sweeper) ---
sweep: # 
  output_dir: "outputs/panel_study_gemini"      # Base directory for sweep outputs
  waves: ["W26", "W27", "W29", "W32", "W34", "W36", "W41", "W42", "W45", "W49", "W50", "W54", "W82", "W92"]  # Wave IDs to sweep over
  repeats: 3                              # Number of repeats per wave

# --- Metadata for Experiment Settings (copied and modified per sweep) ---
experiment:
  name: "ATP_panel_study_gemini"
  description: "Panel sweep across 14 waves using active endowment generation and regression."
  version: "v1"
  random_seed: 101        # Base seed; incremented per repeat

# --- Paths (relative to wave ID, which is injected per sweep step) ---
paths:
  survey_csv: "data/{wave}/info.csv"
  survey_yaml: "config/surveys/american_trend_panel.yaml"
  attribute_bank: "config/attribute_banks/attribute_bank.yaml"
  aggregate_json: "data/{wave}/{wave}_aggregate_results.json"

# --- Report Styling ---
report:
  endowment: styles/generation_report.css
  regression: styles/lasso_report.css

# ============================================================
#           [STAGE 1] ACTIVE ENDOWMENT GENERATION
# ============================================================

agent:
  type: gemini
  model_name: gemini-2.0-flash 
  formality: >
    You are completing a survey. Your answer should reflect the person described in the profile above, using their preferences, beliefs and experiences.
    Respond with only the final answer string, not the code or label in brackets.
    Do not include any reasoning, explanation, or commentary.
    Do not preface your answer with phrases like 'I would choose'.
    Just return the answer text exactly as it appears in the options.
  delay: 0.1
  kwargs:
    temperature: 0
    max_tokens: 128


endowment_model:
  backend_type: gemini         # LLM backend for endowment generation 
  model_name: gemini-2.0-flash      # LLM model for endowment generation 
  temperature: 0.9
  batch_size: 5
  delay: 0.5
  retry_failed: true
  max_attributes: 10
  randomize_attributes: true

attribute_learner:
  backend_type: gemini         # LLM backend for attribute generation 
  model_name: gemini-2.0-flash      # LLM model for attribute generation 
  max_tokens: 1024

generation:
  target_n: 300
  initial_n: 10
  num_update_steps: 5
  parallel: true
  max_workers: 20
  question_patch:
    fraction: 0.75
    top_k: 3
    min_repeats: 2
  verbose: true

# ============================================================
#           [STAGE 2] LASSO / ELASTIC NET REGRESSION
# ============================================================

lasso:
  alpha_expr: "np.logspace(-5, 3, 20)"
  max_iter: 10000
  validation:
    strategy: "cv"
    cv_folds: 5
  post_selection_refit: false

elasticnet:
  alpha_expr: "np.logspace(-5, 3, 20)"
  l1_ratio_expr: "np.linspace(0.1, 1, 10)"
  max_iter: 10000
  validation:
    strategy: "cv"
    cv_folds: 5
  plot_style: "2D"
  post_selection_refit: false

split_settings:
  use_proxy_only: true
  train_val_split: ["train", "valid"]
  test_split: "test"

weight_assignment_model: "lasso"
