#!/bin/bash

WORKSPACE_FOLDER="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
MODEL_DIR="training/llava_finetuning_stage_2"  
VISION_TOWER_DIR="CLIP"  
DATA_PATH="DIYHealthGPT/datasets/train_all.json"
IMAGE_FOLDER="DIYHealthGPT/DIYHealth-tmp"
OUTPUT_PATH="training/stage3/"

export NCCL_P2P_DISABLE=1
export NCCL_IB_DISABLE=1

deepspeed --num_gpus=1 --master_port 29600 "${WORKSPACE_FOLDER}/llava/train/train_.py" \
    --moe_lora_enable "True" \
    --freeze_mm_mlp_adapter "True"\
    --moe_lora_r "16" \
    --moe_lora_alpha "64" \
    --moe_lora_num "4" \
    --hyper_lora_r "8" \
    --hyper_lora_alpha "32" \
    --hyper_lora_num "4" \
    --compress_dim "8" \
    --mm_projector_lr "2e-5" \
    --model_name_or_path "$MODEL_DIR" \
    --version "phi3_instruct" \
    --data_path "$DATA_PATH" \
    --image_folder "$IMAGE_FOLDER" \
    --vision_tower "$VISION_TOWER_DIR" \
    --mm_projector_type "mlp2x_gelu" \
    --mm_vision_select_layer "-2" \
    --mm_use_im_start_end "False" \
    --mm_use_im_patch_token "False" \
    --image_aspect_ratio "pad" \
    --group_by_modality_length "True" \
    --bf16 "True" \
    --output_dir "$OUTPUT_PATH" \
    --num_train_epochs "2" \
    --per_device_train_batch_size "4" \
    --per_device_eval_batch_size "2" \
    --gradient_accumulation_steps "8" \
    --save_strategy "no" \
    --learning_rate "1e-5" \
    --weight_decay "0.01" \
    --warmup_ratio "0.03" \
    --lr_scheduler_type "cosine" \
    --logging_steps "1" \
    --tf32 "True" \
    --model_max_length "2048" \
    --gradient_checkpointing "True" \
    --dataloader_num_workers "4" \
    --lazy_preprocess "True" \
    --report_to "wandb" \
    --deepspeed "scripts/zero3.json"
