# Judgment Operators - Base Configuration
# Paper: "Judgment Operators for Multi-Agent Action Spaces"

# Root location for run outputs (value is passed through as a plain string)
output_dir: "runs"

# Reproducibility: one entry per seed, five seeds in total
seeds:
  - 0
  - 1
  - 2
  - 3
  - 4
# NOTE(review): a non-zero temperature usually means sampling is stochastic;
# confirm the backend honours the seeds above if exact reruns are expected.
temperature: 0.7

# =============================================================================
# Experiment Suites
# =============================================================================

suites:
  # Suite 1: Wikipedia tasks with output-format constraints (Table 1, 6, 7).
  # `constraints` holds boolean switches; `policy_text` is a literal block
  # whose line breaks are preserved.
  - name: "wikipedia_format"
    type: "webarena_wiki"
    path: "data/webarena/wiki_format_tasks.jsonl"
    n_instances: 100
    max_steps: 10
    task_type: "format_constrained"
    constraints:
      enumeration_format: true
      require_citations: true
      verbatim_quotes: true
    policy_text: |
      Format: "Entity: Value | Entity: Value | ..."
      All claims require CITATION with URL
      Quoted text must appear verbatim in source

  # Suite 2: Wikipedia tasks in the multi-agent setting (Protocol domain).
  # The policy text lists one rule per role: RESEARCHER, WRITER, VERIFIER.
  - name: "wikipedia_multiagent"
    type: "webarena_wiki"
    path: "data/webarena/wiki_multiagent_tasks.jsonl"
    n_instances: 30
    max_steps: 10
    task_type: "multi_agent"
    constraints:
      enforce_role_separation: true
      require_citations: true
      schema_validation: true
    policy_text: |
      RESEARCHER: Navigate and gather information only
      WRITER: Synthesize answers from gathered info only
      VERIFIER: Check citations and format only

# =============================================================================
# Methods
# =============================================================================

methods:
  # No Operator baseline.
  # The name is quoted on purpose: YAML 1.1 loaders (e.g. PyYAML) resolve a
  # bare NO to the boolean false, which would silently replace the method
  # name with a non-string value.
  - name: "NO"
    kind: no_operator

  # JO with fixed rules (no learning): dynamic precedents are switched off.
  - name: JO_static
    kind: judgment_operator
    dynamic_precedents: false
    retrieve_threshold: 0.70

  # Full JO with precedent learning: dynamic precedents are switched on and
  # a precedent capacity limit is set.
  - name: JO_dynamic
    kind: judgment_operator
    dynamic_precedents: true
    retrieve_threshold: 0.70
    max_precedent_capacity: 200

# =============================================================================
# Ablations
# =============================================================================

ablations:
  # Retrieval-threshold sensitivity: two variants, one below and one above
  # the 0.70 used by the JO methods.
  # NOTE(review): `base` presumably names the method entry whose settings are
  # inherited before the override is applied - confirm against the loader.
  - name: "JO_dynamic_t50"
    base: "JO_dynamic"
    retrieve_threshold: 0.5

  - name: "JO_dynamic_t85"
    base: "JO_dynamic"
    retrieve_threshold: 0.85

# =============================================================================
# Multi-Agent Configuration
# =============================================================================

# Agent counts to run: 1 and 2
agent_counts:
  - 1
  - 2
# Model backend list (single entry) and the model identifier
model_backends:
  - openai
model_name: gpt-4o-mini
