#!/bin/bash
# ---------------------------------------------------------------------------
# Filesystem locations handed to the training script.
# ---------------------------------------------------------------------------
MODEL_PATH='/storage/Qwen2.5-VL-3B-Instruct/'   # value for --model-path
OUTPUT_DIR='/storage/'                          # value for --output-dir
DS_CONFIG='src/configs/ds_config.json'          # value for --ds-config
FONT_PATH='/storage/GoNotoCurrent.ttf'          # value for --font-path

# ---------------------------------------------------------------------------
# Rendering / data settings.
# ---------------------------------------------------------------------------
FONT_SIZE=7      # value for --font-size
N_PARTS=1        # value for --n-parts
NUM_WORKERS=4    # value for --num-workers

# ---------------------------------------------------------------------------
# Optimisation hyperparameters.
# ---------------------------------------------------------------------------
BATCH_SIZE=1         # value for --batch-size
EPOCHS=3             # value for --epochs
LEARNING_RATE=2e-5   # value for --lr
WEIGHT_DECAY=0.1     # value for --weight-decay

# Mixed-precision mode forwarded as --mixed-precision.
# "fp16" is the active choice; "bf16" is the alternative that has been used
# here before (swap the value below to switch).
MIXED_PRECISION='fp16'

# Distributed training parameters.
# All four values are forwarded to torchrun below, so editing them here is
# sufficient to change how the job is launched. MASTER_PORT is 29500, the port
# the launch command has always used; 127.0.0.1 is a loopback address and is
# therefore only meaningful while NNODES=1.
MASTER_ADDR="127.0.0.1"
MASTER_PORT=29500
NNODES=1
NPROC_PER_NODE=8

# Wandb parameters
WANDB_PROJECT="qwen_project"
WANDB_RUN_NAME="qwen_OpenHermes"

# Value passed as --grad-accum-steps.
GRAD_ACCUM_STEPS=16

# Arguments for src/train_custom_qwen.py, collected in an array so that every
# value reaches the script as exactly one word. With unquoted expansions an
# empty or whitespace-containing value would silently shift the flags that
# follow it.
train_args=(
  --ds-config "$DS_CONFIG"
  --model-path "$MODEL_PATH"
  --output-dir "$OUTPUT_DIR"
  --font-path "$FONT_PATH"
  --font-size "$FONT_SIZE"
  --n-parts "$N_PARTS"
  --batch-size "$BATCH_SIZE"
  --epochs "$EPOCHS"
  --lr "$LEARNING_RATE"
  --weight-decay "$WEIGHT_DECAY"
  --num-workers "$NUM_WORKERS"
  --wandb-project "$WANDB_PROJECT"
  --wandb-run-name "$WANDB_RUN_NAME"
  --mixed-precision "$MIXED_PRECISION"
  --grad-accum-steps "$GRAD_ACCUM_STEPS"
  --use-wandb
  --save-src
)

# Launch the training script under torchrun. The script's exit status is
# torchrun's exit status, since this is the last command.
torchrun \
  --master_addr="$MASTER_ADDR" \
  --master_port="$MASTER_PORT" \
  --nnodes="$NNODES" \
  --nproc_per_node="$NPROC_PER_NODE" \
  src/train_custom_qwen.py "${train_args[@]}"
		
