#!/bin/bash

# ==============================
# Agent / Task / Model lists
# ==============================
# Agents to run (example values; one entry per line).
AGENT_IDS=(
  "openhands"
)

# Tasks every agent is run against (example values).
TASK_IDS=(
  "lost_in_the_middle"
  "medical_bias"
  "self_correction"
  "known_evaluation"
)

# Model names passed to each run (example values).
LLM_MODELS=(
  "o4-mini"
)

# ==============================
# API keys for different providers
# ==============================
# Take each key from the environment when it is already set there, so an
# exported key is no longer overwritten with an empty string and secrets do
# not have to be written into this file. The default (after `:-`) is empty;
# avoid committing a real key here.
OPENAI_API_KEY="${OPENAI_API_KEY:-}"
ANTHROPIC_API_KEY="${ANTHROPIC_API_KEY:-}"

# ==============================
# Run all combinations
# ==============================
#######################################
# Runs run_agent.py once for every agent x task x model combination.
# A failing run is reported on stderr and counted, but does not stop the
# remaining combinations.
# Globals:   AGENT_IDS, TASK_IDS, LLM_MODELS (read)
#            OPENAI_API_KEY, ANTHROPIC_API_KEY (read)
# Arguments: none
# Outputs:   a banner per run on stdout; warnings and failures on stderr
# Returns:   0 if every run succeeded, 1 if at least one run failed
#######################################
run_all_combinations() {
  local agent task model api_key rc
  local failed=0

  for agent in "${AGENT_IDS[@]}"; do
    for task in "${TASK_IDS[@]}"; do
      for model in "${LLM_MODELS[@]}"; do

        # Determine which key to use: model names starting with "claude"
        # get the Anthropic key, everything else gets the OpenAI key.
        if [[ "$model" == claude* ]]; then
          api_key="$ANTHROPIC_API_KEY"
        else
          api_key="$OPENAI_API_KEY"
        fi

        # Still attempt the run with an empty key, but say so, since an
        # empty key is the likely cause of a later authentication error.
        if [[ -z "$api_key" ]]; then
          echo "Warning: empty API key for model '$model'" \
            "(set OPENAI_API_KEY / ANTHROPIC_API_KEY)" >&2
        fi

        echo "===================================================="
        echo "Running Agent: $agent | Task: $task | Model: $model"
        echo "===================================================="

        # Execute the run.
        # NOTE(review): the key is passed on the command line and may be
        # visible in process listings; confirm whether run_agent.py can
        # read it from the environment instead.
        rc=0
        python run_agent.py \
          --AGENT_ID "$agent" \
          --TASK_ID "$task" \
          --LLM_MODEL "$model" \
          --RUN_TIMES 1 \
          --LLM_API_KEY "$api_key" || rc=$?

        if (( rc != 0 )); then
          echo "Run failed (exit $rc): Agent: $agent | Task: $task | Model: $model" >&2
          failed=$((failed + 1))
        fi

      done
    done
  done

  if (( failed > 0 )); then
    echo "$failed run(s) failed" >&2
    return 1
  fi
  return 0
}

run_all_combinations
