# ============================================================
# PLUGIN PIPELINE CONFIGURATION FOR SURVEY ELICITATION & LASSO
# ------------------------------------------------------------
# This YAML file runs both stages of the alignment:
#
# Stage 1: Parallel elicitation of responses for pre-generated endowments
# Stage 2: Run Lasso/ElasticNet regression to select relevant endowments
#
# Each module (survey, agent, runner, lasso/elasticnet) has its own settings.
# ============================================================

# --- FILE MANAGEMENT & METADATA ---

# >>> Alignment Metadata <<<
metadata:
  name: "ATP_w36_plugin"        # Short name used in output folder naming
  description: "Elicit responses for pre-generated ATP Wave 36 endowments and run regression."
  version: "v1"
  seed: 101

# >>> Input & Reference File Paths <<<
paths:
  survey_csv: "data/w36/info.csv"                           # CSV with question text and codes
  survey_yaml: "config/surveys/american_trend_panel.yaml"   # Schema for interpreting survey CSV
  endowments_csv: "outputs/ATP_w36_20250918_153000/endowments.csv"   # Pre-generated endowments
  aggregate_json: "data/w36/W36_aggregate_results.json"     # Optional: human target distributions

# >>> Report Styling <<<
report:
  plugin: styles/generation_report.css
  regression: styles/lasso_report.css       # Style for regression experiment report

# ============================================================
#           [STAGE 1] PARALLEL ELICITATION
# ============================================================

# --- RESPONSE AGENT CONFIGURATION ---
# Settings for the LLM agent that simulates survey responses.
agent: 
  type: openai
  model_name: gpt-4o-mini
  formality: >                 # System prompt detailing formality requirements for the response
    You are completing a survey. Your answer should reflect the person described in the profile above, using their preferences, beliefs and experiences.
    Respond with only the final answer string, not the code or label in brackets.
    Do not include any reasoning, explanation, or commentary.
    Do not preface your answer with phrases like 'I would choose'.
    Just return the answer text exactly as it appears in the options.
  kwargs:
    temperature: 0             # Deterministic responses
    max_tokens: 128            # Upper limit for response length

# --- RUNNER SETTINGS ---
runner:
  parallel: true              # Whether to use parallel workers
  max_workers: 30             # Number of worker threads
  verbose: true               # Verbose logging
  target_n: 300               # (NEW) cap number of endowments sampled for elicitation
# ============================================================
#           [STAGE 2] LASSO REGRESSION APPROXIMATION
# ============================================================

lasso:
  alpha_expr: "np.logspace(-5, 1, 20)"       # Lasso tuning grid
  max_iter: 10000
  validation:
    strategy: "cv"
    cv_folds: 5
  post_selection_refit: true

elasticnet:
  alpha_expr: "np.logspace(-5, 1, 20)"       
  l1_ratio_expr: "np.linspace(0.1, 1, 10)"  
  max_iter: 10000
  validation:
    strategy: "cv"
    cv_folds: 5
  plot_style: "2D"
  post_selection_refit: true

# --- SPLIT SETTINGS ---
split_settings:
  use_proxy_only: true
  train_val_split: ["train", "valid"]
  test_split: "test"

# --- MODEL WEIGHT USAGE ---
weight_assignment_model: "lasso"

# ============================================================
# NOTES:
# - Endowments must already exist in endowments.csv.
# - This pipeline does not generate new endowments, only elicits responses.
# - Weights for endowments will be assigned using `weight_assignment_model`.
# ============================================================