#!/bin/bash

audio_model_type=large_v3_turbo-qwen2_7b_instruct

model_suffix="${audio_model_type#*-}"
if [ "$model_suffix" = "qwen2_7b_instruct" ]; then
    text_model_type="Qwen2.5-7B-Instruct"
elif [ "$model_suffix" = "qwen2_3b_instruct" ]; then
    text_model_type="Qwen2.5-3B-Instruct"
elif [ "$model_suffix" = "qwen2_05b_instruct" ]; then
    text_model_type="Qwen2.5-0.5B-Instruct"
else
    text_model_type=none
fi

echo "text_model_type: ${text_model_type}"

cur_time=$(date +%Y-%m-%d_%H-%M-%S)
output_dir="outputs/train/alignchat/finetune/${audio_model_type}/${cur_time}"
logging_dir="${output_dir}/logs"

mkdir -p ${output_dir}
mkdir -p ${logging_dir}

cp $0 ${output_dir}

CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 accelerate launch --config-file configs/deepspeed_configs/zero1_gpu8.yaml \
    train/finetune_alignchat.py \
    --audio_model_path path/to/pretrained/model \
    --audio_model_type "$audio_model_type" \
    --dataset_paths \
        datasets/response_without_instruction/"$text_model_type"/openbookqa \
        datasets/response_without_instruction/"$text_model_type"/spoken-web-questions \
        datasets/response_without_instruction/"$text_model_type"/VoiceAssistant-400K \
        datasets/response_without_instruction/"$text_model_type"/DeepDialogue-orpheus \
        datasets/response_without_instruction/"$text_model_type"/DeepDialogue-xtts \
        datasets/response_with_instruction/"$text_model_type"/libritts_r_filtered \
        datasets/response_with_instruction/"$text_model_type"/fleurs \
        datasets/response_with_instruction/"$text_model_type"/EuroSpeech \
        datasets/response_with_instruction/"$text_model_type"/DeepDialogue-orpheus \
        datasets/response_with_instruction/"$text_model_type"/DeepDialogue-xtts \
        datasets/response_with_instruction/"$text_model_type"/VoiceAssistant-400K \
        datasets/response_with_instruction/"$text_model_type"/spoken-web-questions \
        datasets/response_with_instruction/"$text_model_type"/common_voice_21_0 \
    --dataset_ratios 1.0 1.0 1.0 1.0 1.0 1.0 1.0 1.0 1.0 1.0 1.0 1.0 1.0 \
    --dataset_split train \
    --output_dir "${output_dir}" \
    --logging_dir "${logging_dir}" \
    --warmup_ratio 0.05 \
    --lr_scheduler_type cosine_with_min_lr \
    --learning_rate 1e-4 \
    --min_learning_rate 1e-6 \
    --loss_ratios 1.0 1.0 5.0 \
    --loss_types lm l1 cos_l2 \
    --freeze_encoder True --freeze_decoder False \
    --do_train \
    --per_device_train_batch_size 3 \
    --gradient_accumulation_steps 32 \
    --num_train_epochs 2 \
    --save_strategy steps \
    --save_only_model True \
    --save_steps 1500 \
    --save_total_limit 10 \
    --logging_steps 1 \
    --logging_strategy steps \
    --seed 42 \
    --bf16 \
    --weight_decay 1e-3 \
    --dataloader_num_workers 8 \
    --remove_unused_columns False \
    --ddp_find_unused_parameters False
