#!/bin/bash

# ---------------------------------------------------------------------
# Env setup
# ---------------------------------------------------------------------
# Load conda's shell integration, activate the rllm2 environment and move
# into the repo checkout. The python commands in this script use relative
# paths (examples/..., ./eval_outputs/...), so continuing after a failure
# here would run the wrong interpreter or touch the wrong directory; abort
# instead.
source /data/user/miniconda3/etc/profile.d/conda.sh || {
  echo "error: cannot source /data/user/miniconda3/etc/profile.d/conda.sh" >&2
  exit 1
}
conda activate rllm2 || {
  echo "error: cannot activate conda env rllm2" >&2
  exit 1
}
cd /data/user/rllm || {
  echo "error: cannot cd to /data/user/rllm" >&2
  exit 1
}

# `set -a` marks every variable assigned while it is active for export, so
# everything defined in .env reaches child processes. A missing or broken
# .env is left non-fatal, as before: bash reports it and the script goes on.
set -a
. /data/user/LiveCodeBench/.env
set +a

# Command tracing starts only after .env has been sourced, so the
# assignments made inside it are not written to the trace.
set -x

# Record which node and GPUs this run sees; a failing nvidia-smi is
# deliberately ignored.
echo "Node: $(hostname -s)"
nvidia-smi -L || true

# --- vLLM / torch env
# Clear the ROCR/ROCM/HIP *_VISIBLE_DEVICES variables so values inherited
# from the calling environment do not carry over into this run.
unset ROCR_VISIBLE_DEVICES
unset ROCM_VISIBLE_DEVICES
unset HIP_VISIBLE_DEVICES

# Export the runtime settings for the child processes in one statement.
export \
  VLLM_ATTENTION_BACKEND='FLASH_ATTN' \
  PYTORCH_CUDA_ALLOC_CONF='expandable_segments:False' \
  VLLM_USE_V1='1' \
  VLLM_ALLOW_LONG_MAX_MODEL_LEN='1' \
  VLLM_ENGINE_ITERATION_TIMEOUT_S='1000000000' \
  CUDA_DEVICE_ORDER='PCI_BUS_ID' \
  HYDRA_FULL_ERROR='1'

# Name of the checkpoint repo to evaluate; it also names the local cache
# and output directories.
HF_REPO="selfplay_ours_embed_nomix_large_ckpts"

#######################################
# Run examples/bugs_refactor/eval_ckpts.py for one checkpoint repo.
# Arguments: $1 - repo name; passed as anonymous/<name> to --hf_repo,
#                 /data/user/<name> to --ckpt_cache_dir and
#                 ./eval_outputs/<name> to --outdir
# Returns:   exit status of the python process
#######################################
run_eval() {
  local repo=$1
  # Built as an array so every value, including the multi-word
  # --extra_flow_args string, reaches python as exactly one argument.
  local -a eval_args=(
    --hf_repo "anonymous/${repo}"
    --base_model Qwen/Qwen2.5-Coder-7B-Instruct
    --ckpt_cache_dir "/data/user/${repo}"
    --outdir "./eval_outputs/${repo}"
    --run_generator_fixer_flow_py examples/bugs_refactor/run_generator_fixer_flow.py
    --val_datasets "bugbench:test_small"
    --n_tasks 2000 --n_parallel 32
    --tp 1 --max_model_len 16384 --gpu_mem_util 0.90
    --fixer_attempts_val 1 --temperature 0.6 --top_p 0.95
    --extra_flow_args "--include_failed_test_output --eval_pregenerated_only"
    --port 33000 --kill_existing
  )
  python examples/bugs_refactor/eval_ckpts.py "${eval_args[@]}"
}

run_eval "$HF_REPO"

# NOTE(review): the original script issued the identical command a second
# time with the repo name hard-coded. The second pass is kept to preserve
# behaviour; confirm whether it is intentional (e.g. a retry) or a leftover
# copy-paste that can be dropped.
run_eval "$HF_REPO"