#!/bin/bash
set -xeuo pipefail

# Get the configuration name and engine name from arguments
CONFIG_NAME="$1"
ENGINE="${2:-vllm}"

# Download model if needed
huggingface-cli download Qwen/Qwen2.5-0.5B --local-dir "$HOME/models/Qwen/Qwen2.5-0.5B"

# Run the training with the specified configuration
python3 -m verl.trainer.main_ppo \
    --config-name "$CONFIG_NAME" "$@" 