# ============================================================
# PLUGIN PIPELINE CONFIGURATION FOR SURVEY ELICITATION & LASSO
# ------------------------------------------------------------
# This YAML file runs both stages of the alignment:
#
# Stage 1: Parallel elicitation of responses for pre-generated endowments
# Stage 2: Run Lasso/ElasticNet regression to select relevant endowments
#
# Each module (survey, agent, runner, lasso/elasticnet) has its own settings.
# ============================================================

# --- FILE MANAGEMENT & METADATA ---

# >>> Alignment Metadata <<<
metadata:
  name: "backend_performance"        # Short name used in output folder naming
  description: "Elicit responses for backend gemini-2.0-flash on ATP W42. (300 repeats)."
  version: "v1"
  seed: 101

# >>> Input & Reference File Paths <<<
paths:
  survey_csv: "data/w42/info.csv"
  survey_yaml: "config/surveys/american_trend_panel.yaml"
  endowments_csv: "data/raw_backend/base_endowments.csv"   # Pre-generated endowments
  aggregate_json: "data/w42/W42_aggregate_results.json"

# >>> Report Styling <<<
report:
  plugin: styles/generation_report.css
  regression: styles/lasso_report.css       # Style for regression experiment report

# ============================================================
#           [STAGE 1] PARALLEL ELICITATION
# ============================================================

# --- RESPONSE AGENT CONFIGURATION ---
# Settings for the LLM agent that simulates survey responses.
agent: 
  type: gemini
  model_name: gemini-2.0-flash 
  formality: >                 # System prompt detailing formality requirements for the response
    You are completing a public opinion survey. Answer each question as an average adult respondent in the US population, based only on the question text and options.
    Respond with only the final answer string, not the code or label in brackets.
    Do not include any reasoning, explanation, or commentary.
    Do not preface your answer with phrases like 'I would choose'.
    Just return the answer text exactly as it appears in the options.
  kwargs:
    temperature: 0.7             # Non-deterministic responses
    max_tokens: 128            # Upper limit for response length

# --- RUNNER SETTINGS ---
runner:
  parallel: true              # Whether to use parallel workers
  max_workers: 20             # Number of worker threads
  verbose: true               # Verbose logging
  target_n: 300               # (NEW) cap number of endowments sampled for elicitation