#!/bin/bash

# ---------------------------------------------------------------------
# Env setup
# ---------------------------------------------------------------------
# Print an error message to stderr and abort the script with status 1.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

# Load conda's shell integration and activate the environment used for the
# evaluation. Both steps are hard prerequisites: abort instead of silently
# continuing with whatever python happens to be on PATH.
[[ -r /data/user/miniconda3/etc/profile.d/conda.sh ]] \
  || die "conda.sh not found or unreadable: /data/user/miniconda3/etc/profile.d/conda.sh"
source /data/user/miniconda3/etc/profile.d/conda.sh
conda activate rllm2 || die "failed to activate conda environment 'rllm2'"

# The evaluation command uses paths relative to this directory
# (examples/..., ./eval_outputs/...), so a failed cd must be fatal.
cd /data/user/rllm || die "cannot cd to /data/user/rllm"

# Source the .env file with auto-export enabled (set -a) so every variable it
# assigns is exported to child processes, then switch auto-export off again.
[[ -r /data/user/LiveCodeBench/.env ]] \
  || die ".env not found or unreadable: /data/user/LiveCodeBench/.env"
set -a
. /data/user/LiveCodeBench/.env
set +a

# From here on, echo every command to stderr before it runs.
set -o xtrace

# Record which machine the job landed on.
printf 'Node: %s\n' "$(hostname -s)"
# Best-effort GPU listing: a missing or failing nvidia-smi must not matter.
nvidia-smi -L || :

# --- vLLM / torch env
# Clear the ROCR/ROCM/HIP *_VISIBLE_DEVICES variables so values inherited
# from the parent environment are not passed on to the evaluation process.
unset ROCR_VISIBLE_DEVICES
unset ROCM_VISIBLE_DEVICES
unset HIP_VISIBLE_DEVICES

# Settings exported to the python process launched below.
export \
  VLLM_ATTENTION_BACKEND=FLASH_ATTN \
  PYTORCH_CUDA_ALLOC_CONF="expandable_segments:False" \
  VLLM_USE_V1=1 \
  VLLM_ALLOW_LONG_MAX_MODEL_LEN=1 \
  VLLM_ENGINE_ITERATION_TIMEOUT_S=1000000000 \
  CUDA_DEVICE_ORDER=PCI_BUS_ID \
  HYDRA_FULL_ERROR=1

# Arguments for eval_ckpts.py, kept in an array so related flags can be
# grouped and annotated. Order and values match the original command line.
eval_args=(
  # Checkpoint source and local cache.
  --hf_repo anonymous/selfplay_large_ckpts
  --base_model Qwen/Qwen2.5-Coder-7B-Instruct
  --ckpt_cache_dir /data/user/selfplay_large_ckpts

  # Output directory and the flow script handed to the evaluator.
  --outdir ./eval_outputs/selfplay_large
  --run_generator_fixer_flow_py examples/bugs_refactor/run_generator_fixer_flow.py

  # Dataset selection and task parallelism.
  --val_datasets "bugbench_gpt-oss-20b_sampled:test_small"
  --n_tasks 2000
  --n_parallel 32

  # Serving and sampling settings.
  --tp 1
  --max_model_len 16384
  --gpu_mem_util 0.90
  --fixer_attempts_val 1
  --temperature 0.6
  --top_p 0.95

  # Passed as one string; the quoting keeps both inner flags in a single argument.
  --extra_flow_args "--include_failed_test_output --eval_pregenerated_only"

  --port 31000
  --kill_existing
)

python examples/bugs_refactor/eval_ckpts.py "${eval_args[@]}"

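# Alternative invocation (disabled): same arguments as the command above,
# plus --single_ckpt pointing at the global_step_20 actor_merged checkpoint.
# python examples/bugs_refactor/eval_ckpts.py \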
#   --hf_repo anonymous/selfplay_large_ckpts \
#   --single_ckpt /data/user/selfplay_large_ckpts/repo_raw/global_step_20/actor_merged \
#   --base_model Qwen/Qwen2.5-Coder-7B-Instruct \
#   --ckpt_cache_dir /data/user/selfplay_large_ckpts \
#   --outdir ./eval_outputs/selfplay_large \
#   --run_generator_fixer_flow_py examples/bugs_refactor/run_generator_fixer_flow.py \
#   --val_datasets "bugbench_gpt-oss-20b_sampled:test_small" \
#   --n_tasks 2000 --n_parallel 32 \
#   --tp 1 --max_model_len 16384 --gpu_mem_util 0.90 --fixer_attempts_val 1 --temperature 0.6 --top_p 0.95 \
#   --extra_flow_args "--include_failed_test_output --eval_pregenerated_only" \
#   --port 31000 --kill_existing