#!/bin/bash
#
# Launch a training run via `python3 -m verl.trainer.main` and mirror its
# combined stdout/stderr to a log file.
#
# All paths and GPU settings are defined in the configuration section below;
# edit them before running.
#
# Exit status: the trainer's exit status (see `pipefail` below), or non-zero
# if any preparation step fails.

# -e          stop at the first failing command (e.g. a directory that cannot
#             be created) instead of starting training anyway.
# -u          treat references to unset variables as errors.
# -o pipefail make the `python3 ... | tee` pipeline report the trainer's exit
#             status rather than tee's, so callers can detect a failed run.
set -euo pipefail
# Trace every command as it is executed.
set -x

# ---------------------------------------------------------------------------
# Configuration
# ---------------------------------------------------------------------------
MODEL_PATH=/MODEL_PATH
CONFIG_PATH=/CONFIG_PATH
TRAIN_DATASET_PATH=/TRAIN_DATASET_PATH
VAL_DATASET_PATH=/VAL_DATASET_PATH
CHECKPOINT_DIR=/CHECKPOINT_DIR
# Passed to the trainer process only (as a command-prefix assignment below).
CUDA_VISIBLE_DEVICES=/CUDA_VISIBLE_DEVICES
N_GPUS_PER_NODE=/N_GPUS_PER_NODE

# ---------------------------------------------------------------------------
# Working directories
# ---------------------------------------------------------------------------
mkdir -p -- "${CHECKPOINT_DIR}"

LOG_DIR="./logs"
mkdir -p -- "${LOG_DIR}"

# Exported so that child processes (the trainer and anything it spawns) see it.
RAY_TMPDIR="/RAY_TMPDIR"
mkdir -p -- "${RAY_TMPDIR}"
export RAY_TMPDIR

# NOTE(review): TIMESTAMP is not referenced anywhere in this script as shown,
# and LOG_FILE is a fixed path outside LOG_DIR. Confirm whether the log file
# was meant to be something like "${LOG_DIR}/<name>_${TIMESTAMP}.log".
TIMESTAMP=$(date +"%Y%m%d_%H%M%S")
LOG_FILE="/LOG_FILE"
# Make sure tee can actually open the log file.
mkdir -p -- "$(dirname -- "${LOG_FILE}")"

# ---------------------------------------------------------------------------
# Launch
# ---------------------------------------------------------------------------
# key=value arguments handed to the trainer. Built as an array so that values
# containing spaces or glob characters reach python3 as single, intact words.
trainer_args=(
    "config=${CONFIG_PATH}"
    "worker.actor.model.model_path=${MODEL_PATH}"
    "data.train_files=${TRAIN_DATASET_PATH}"
    "data.val_files=${VAL_DATASET_PATH}"
    "trainer.experiment_name=faithful"
    "trainer.save_checkpoint_path=${CHECKPOINT_DIR}"
    "trainer.n_gpus_per_node=${N_GPUS_PER_NODE}"
)

# stderr is merged into stdout so both streams end up in the log; tee keeps
# the output visible on the terminal while writing LOG_FILE.
CUDA_VISIBLE_DEVICES="${CUDA_VISIBLE_DEVICES}" python3 -m verl.trainer.main \
    "${trainer_args[@]}" \
    2>&1 | tee "${LOG_FILE}"

