dir_name=$(basename $(dirname "$0"))
time_stamp=$(date +"%m%d%H%M%S")
LOG_DIR="$PWD/log/${time_stamp}_$dir_name"
PLACE_CFG_FOLDER=$PWD/place-config/${time_stamp}_$dir_name
PART=1

mkdir -p $LOG_DIR
mkdir -p $PLACE_CFG_FOLDER


mpirun -v --allow-run-as-root \
      --bind-to none --map-by slot --hostfile /root/hostfile \
      --mca btl_tcp_if_include bond1 --mca oob_tcp_if_include bond1 --mca routed direct \
      -x PATH -x LIBRARY_PATH -x LD_LIBRARY_PATH \
      pip install polaris-cpp-py math_verify
sleep 3

mpirun -v --allow-run-as-root \
      --bind-to none --map-by slot --hostfile /root/hostfile \
      --mca btl_tcp_if_include bond1 --mca oob_tcp_if_include bond1 --mca routed direct \
      -x PATH -x LIBRARY_PATH -x LD_LIBRARY_PATH \
      python tools/auto_place.py \
      --fn gen --config-folder $PLACE_CFG_FOLDER \
      --sampler-tp-size 2 --sampler-pp-size 1 \
      --critic-tp-size 2 --critic-pp-size 2 \
      --actor-tp-size 2 --actor-pp-size 2 --actor-cp-size 2 \

mpirun -v --allow-run-as-root \
      --bind-to none --map-by slot --hostfile $PLACE_CFG_FOLDER/sampler.hostfile \
      --mca btl_tcp_if_include bond1 --mca oob_tcp_if_include bond1 --mca routed direct \
      -x PATH -x LIBRARY_PATH -x LD_LIBRARY_PATH \
      bash tasks/math_rl_v3/qwen/$dir_name/grpo.sh $PLACE_CFG_FOLDER sampler $time_stamp >$LOG_DIR/sampler$PART.log 2>&1 &

mpirun -v --allow-run-as-root \
      --bind-to none --map-by slot --hostfile $PLACE_CFG_FOLDER/critic.hostfile \
      --mca btl_tcp_if_include bond1 --mca oob_tcp_if_include bond1 --mca routed direct \
      -x PATH -x LIBRARY_PATH -x LD_LIBRARY_PATH \
      bash tasks/math_rl_v3/qwen/$dir_name/grpo.sh $PLACE_CFG_FOLDER critic $time_stamp >$LOG_DIR/critic$PART.log 2>&1 &

mpirun -v --allow-run-as-root \
      --bind-to none --map-by slot --hostfile $PLACE_CFG_FOLDER/actor.hostfile \
      --mca btl_tcp_if_include bond1 --mca oob_tcp_if_include bond1 --mca routed direct \
      -x PATH -x LIBRARY_PATH -x LD_LIBRARY_PATH \
      bash tasks/math_rl_v3/qwen/$dir_name/grpo.sh $PLACE_CFG_FOLDER actor $time_stamp >$LOG_DIR/actor$PART.log 2>&1 &

wait
