#!/bin/bash
#
# Launches train.py under torchrun with 4 worker processes on GPUs 0-3 for the
# experiment stored in exp/captionstew_scratch_weakly_plus_10M_fp16.
#
# train.py and the configs/ paths are given relative to the current directory,
# so run this script from the directory that contains them.

# Abort on a failed command, on use of an unset variable, and on a failure in
# any stage of a pipeline.
set -euo pipefail

# Put the Auden and lhotse checkouts in front of any existing PYTHONPATH.
# ${PYTHONPATH:+...} appends the previous value only when it is set and
# non-empty, so no dangling ':' (an empty path entry) is left behind and the
# expansion is safe under `set -u`.
export PYTHONPATH="/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden:/apdcephfs_cq12/share_302080740/user/raytseng/research/lhotse${PYTHONPATH:+:${PYTHONPATH}}"

# # ----------------train from scratch------------------
# Four devices are exposed here; keep --nproc_per_node below in sync with them.
export CUDA_VISIBLE_DEVICES=0,1,2,3

# key=value configuration overrides handed to train.py. Keeping them in an
# array avoids a chain of backslash continuations, where a stray trailing
# backslash would silently pull the following line into the command.
train_args=(
  exp_dir=exp/captionstew_scratch_weakly_plus_10M_fp16
  model.id2label_json=/apdcephfs_cq12/share_302080740/user/raytseng/data/CaptionStew/labels/weakly_plus_shards/id2label_combined.json
  model.config.is_multilabel=true
  data.train_data_config=configs/captionstew_full/train_data_config_captionstew_weakly_plus.yaml
  data.max_duration=1280
  trainer.use_fp16=true
  data.use_infinite_dataset=true
  trainer.lr_steps_per_epoch=2500
  # NOTE(review): presumably resumes the run from batch 244000 -- confirm
  # against train.py before reusing this script for a fresh experiment.
  trainer.start_batch=244000
)

torchrun \
  --nproc_per_node=4 \
  --master-port=29511 \
  train.py \
  "${train_args[@]}"

# # # ----------------asr init (disabled: every line of this run is commented out)------------------
# pretrained_checkpoint=/apdcephfs_cq10/share_1603164/user/yiwenyshao/independent/auden/egs/asr/exp/auden_zh_r3large_full_8gpu/averaged_iter1412000_avg10.pt
# model_name=zipformer-tag-large  # asr is large model
# export CUDA_VISIBLE_DEVICES=4,5,6,7
# torchrun --nproc_per_node=4 \
#         --master-port=29502 \
#         train.py \
#         exp_dir=exp/audioset_asr_init \
#         id2label_json=configs/audioset/id2label_audioset.json \
#         model.name=$model_name \
#         model.config.num_classes=527 \
#         ++model.config.is_multilabel=true \
#         data.train_data_config=configs/audioset/train_data_config_audioset.yaml \
#         data.max_duration=800 \
#         trainer.use_fp16=false \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=10000 \
