
usage() {
    echo "Usage: $0 [OPTIONS]"
    echo ""
    echo "Options:"
    echo "  -m, --model MODEL              Model name (default: fireworks_ai/llama4-maverick-instruct-basic)"
    echo "  -d, --dataset DATASET          Dataset path (default: data/single_turn_data.json)"
    echo "  -o, --output OUTPUT_DIR        Output directory (default: eval_results_single_turn)"
    echo "  -t, --tool-use / --no-tool-use Enable/disable tool use (default: enabled)"
    echo "  -s, --system-prompt LEVEL      System prompt level: low, medium, high (default: high)"
    echo "  -c, --max-calls MAX_CALLS      Maximum tool calls (default: 20)"
    echo "  -r, --trial TRIAL              Trial number (default: 1)"
    echo "  -w, --workers NUM_WORKERS      Number of parallel workers (default: 16)"
    echo "  -h, --help                     Show this help message"
    echo ""
    echo "Environment variables (used as defaults if not overridden by arguments):"
    echo "  MODEL_NAME, OUTPUT_DIR, TOOL_USE, SYSTEM_PROMPT_LEVEL"
    exit 1
}

# Default values (can be overridden by environment variables or command-line args)
MODEL_NAME="${MODEL_NAME:-fireworks_ai/llama4-maverick-instruct-basic}"
DATASET_PATH="data/single_turn_data.json"
OUTPUT_DIR="${OUTPUT_DIR:-eval_results_single_turn}"
TOOL_USE="${TOOL_USE:-true}"
SYSTEM_PROMPT_LEVEL="${SYSTEM_PROMPT_LEVEL:-high}"
MAX_TOOL_CALLS=20
TRIAL=1
NUM_WORKERS=64

# Parse command-line arguments
while [[ $# -gt 0 ]]; do
    case $1 in
        -m|--model)
            MODEL_NAME="$2"
            shift 2
            ;;
        -d|--dataset)
            DATASET_PATH="$2"
            shift 2
            ;;
        -o|--output)
            OUTPUT_DIR="$2"
            shift 2
            ;;
        -t|--tool-use)
            TOOL_USE="true"
            shift
            ;;
        --no-tool-use)
            TOOL_USE="false"
            shift
            ;;
        -s|--system-prompt)
            SYSTEM_PROMPT_LEVEL="$2"
            shift 2
            ;;
        -c|--max-calls)
            MAX_TOOL_CALLS="$2"
            shift 2
            ;;
        -r|--trial)
            TRIAL="$2"
            shift 2
            ;;
        -w|--workers)
            NUM_WORKERS="$2"
            shift 2
            ;;
        -h|--help)
            usage
            ;;
        *)
            echo "Unknown option: $1"
            usage
            ;;
    esac
done

echo "Starting model response generation..."
echo "=================================="

echo "Configuration:"
echo "  Model: $MODEL_NAME"
echo "  Dataset: $DATASET_PATH"
echo "  Output directory: $OUTPUT_DIR"
echo "  Tool use: $TOOL_USE"
echo "  System prompt level: $SYSTEM_PROMPT_LEVEL"
echo "  Max tool calls: $MAX_TOOL_CALLS"
echo "  Trial: $TRIAL"
echo "  Number of workers: $NUM_WORKERS"
echo "=================================="

# Build the command
CMD="python run_model_response_single_turn.py"
CMD="$CMD --model $MODEL_NAME"
CMD="$CMD --dataset $DATASET_PATH"
CMD="$CMD --output_dir $OUTPUT_DIR"

if [ "$TOOL_USE" = true ]; then
    CMD="$CMD --tool_use"
else
    CMD="$CMD --no_tool_use"
fi

CMD="$CMD --system_prompt_level $SYSTEM_PROMPT_LEVEL"
CMD="$CMD --max_tool_calls $MAX_TOOL_CALLS"
CMD="$CMD --trial $TRIAL"
CMD="$CMD --num_workers $NUM_WORKERS"

echo "Running command:"
echo "$CMD"
echo "=================================="

# Execute the command
eval $CMD

# Check if the command executed successfully
if [ $? -eq 0 ]; then
    echo "=================================="
    echo "Model response generation completed successfully!"
else
    echo "=================================="
    echo "Model response generation failed with exit code $?"
    exit 1
fi 