#!/usr/bin/env bash
# Resolve the directory that contains this script, then switch to its parent
# directory so the relative paths used later in the script are resolved from
# there, independent of the caller's current working directory.
SCRIPT_DIR=$(dirname "$(realpath "${BASH_SOURCE[0]}")")
WORK_DIR=$(dirname "$SCRIPT_DIR")
echo "cd ${WORK_DIR}"
# Quoted so a path containing spaces or glob characters is passed intact;
# abort if the directory cannot be entered instead of continuing from the
# wrong location.
cd "${WORK_DIR}" || exit 1

# Timestamp (YYYYMMDD_HHMM) used later in the script as the log file suffix.
time_postfix=$(date +%Y%m%d_%H%M)

# Weights & Biases settings. A value already present in the caller's
# environment is kept; otherwise the variable is exported as an empty string
# (the previous unconditional behaviour). Prefer supplying the API key through
# the environment rather than writing it into this file.
export WANDB_API_KEY="${WANDB_API_KEY:-}"
export WANDB_PROJECT="${WANDB_PROJECT:-}"
export WANDB_ENTITY="${WANDB_ENTITY:-}"

# With an empty key, call `wandb login` with no argument (what the unquoted
# expansion used to produce); otherwise pass the key as one quoted word.
if [[ -n "${WANDB_API_KEY}" ]]; then
  wandb login "${WANDB_API_KEY}"
else
  wandb login
fi

# Create the output directories for logs and checkpoints, including any
# missing parents; directories that already exist are left untouched.
for out_subdir in logs ckpt; do
  mkdir -p outputs/${out_subdir}
done

# Launch main.py through the deepspeed launcher. stdout and stderr are merged
# and copied by tee both to the terminal and to a timestamped log file.
#
# pipefail makes the pipeline (and, if this is the last command, the script)
# report a non-zero status when deepspeed fails; without it only tee's exit
# status would be visible and a failed run would look successful.
set -o pipefail

# Log path; the suffix comes from the time_postfix variable set earlier.
log_file="outputs/logs/train_Qwen3_4B_Thinking2507_Eagle3_shareGPT_cpr-${time_postfix}.log"

deepspeed main.py \
    --deepspeed_config configs/ds_config.json \
    --basepath Qwen/Qwen3-4B-Thinking-2507 \
    --trainpath data/sharegpt_train.json \
    --testpath data/sharegpt_test.json \
    --savedir outputs/ckpt/Qwen3-4B-Thinking-2507 \
    --config_path configs/qwen3_4b_config.json \
    --confidence_loss_type confidence_progress_remain \
    2>&1 | tee "${log_file}"