#!/usr/bin/env bash
set -euo pipefail
MODEL_NAME_OR_PATH=""
OUTPUT_DIR=""
DEEPSPEED_CONFIG=""
RESUME_FROM_CHECKPOINT=""

while [[ $# -gt 0 ]]; do
  case "$1" in
    --model_name_or_path)
      MODEL_NAME_OR_PATH="$2"; shift 2;;
    --output_dir)
      OUTPUT_DIR="$2"; shift 2;;
    --deepspeed_config)
      DEEPSPEED_CONFIG="$2"; shift 2;;
    --resume_from_checkpoint)
      RESUME_FROM_CHECKPOINT="$2"; shift 2;;
    -h|--help)
      sed -n '1,60p' "$0"; exit 0;;
    *)
      echo "Unknown argument: $1"; exit 1;;
  esac
done

if [[ -z "${MODEL_NAME_OR_PATH}" ]]; then
  echo "Error: --model_name_or_path is required"; exit 1;
fi
if [[ -z "${OUTPUT_DIR}" ]]; then
  echo "Error: --output_dir is required"; exit 1;
fi
if [[ -z "${DEEPSPEED_CONFIG}" ]]; then
  echo "Error: --deepspeed_config is required"; exit 1;
fi

RESUME_ARG=()
if [[ -n "${RESUME_FROM_CHECKPOINT}" ]]; then
  RESUME_ARG=( --resume_from_checkpoint "${RESUME_FROM_CHECKPOINT}" )
fi

llamafactory-cli train \
  --model_name_or_path "${MODEL_NAME_OR_PATH}" \
  --trust_remote_code true \
  \
  --stage sft \
  --do_train true \
  --finetuning_type full \
  \
  --dataset rewrite \
  --template qwen3 \
  --cutoff_len 8192 \
  --max_samples 3600 \
  --overwrite_cache true \
  --preprocessing_num_workers 16 \
  --dataloader_num_workers 3 \
  \
  --output_dir "${OUTPUT_DIR}" \
  --logging_steps 10 \
  --save_steps 50 \
  --plot_loss true \
  --overwrite_output_dir true \
  --save_only_model false \
  --report_to none \
  \
  --per_device_train_batch_size 2 \
  --gradient_accumulation_steps 4 \
  --learning_rate 1e-5 \
  --num_train_epochs 3.0 \
  --lr_scheduler_type cosine \
  --warmup_ratio 0.1 \
  --bf16 true \
  --ddp_timeout 180000000 \
  --gradient_checkpointing true \
  --deepspeed "${DEEPSPEED_CONFIG}" \
  "${RESUME_ARG[@]}"
