#!/bin/bash
# Launch script for a torchrun training job (train.py). Earlier experiment
# variants are kept further down as commented-out commands.

# Put the Auden checkout first on Python's module search path.
# `${PYTHONPATH:+:...}` appends the previous value only when it is set and
# non-empty, so an unset PYTHONPATH does not leave a trailing ':' (an empty
# search-path entry) behind. The value is quoted so it is never word-split.
export PYTHONPATH="/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden${PYTHONPATH:+:${PYTHONPATH}}"

# # ----------------train from scratch------------------
# torchrun --nproc_per_node=8 \
#         --master_port=29501 \
#         train.py \
#         exp_dir=exp/wavcaps_As_Tl \
#         data.train_data_config=configs/wavcaps/train_data_config_wavcaps.yaml \
#         data.max_duration=400 \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_test_data/audiocaps/audiocaps_val.jsonl.gz]' \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=10000 \
#         trainer.freeze_modules=['text_encoder']


# # ----------------audioset init, unfreeze ------------------
# pretrained_checkpoint=/apdcephfs_cq10/share_1603164/user/yiwenyshao/independent/auden/egs/audio_tag/exp/audioset_scratch/averaged_iter460000_avg10.pt
# torchrun --nproc_per_node=8 \
#         --master_port=29501 \
#         train.py \
#         exp_dir=exp/wavcaps_Au_Tl \
#         data.train_data_config=configs/wavcaps/train_data_config_wavcaps.yaml \
#         data.max_duration=400 \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_test_data/audiocaps/audiocaps_val.jsonl.gz]' \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=10000 \
#         trainer.freeze_modules=['text_encoder'] \
#         trainer.initialization.checkpoint=$pretrained_checkpoint \
#         trainer.base_lr=0.0045


# # ----------------audioset init, freeze ------------------
# pretrained_checkpoint=/apdcephfs_cq10/share_1603164/user/yiwenyshao/independent/auden/egs/audio_tag/exp/audioset_scratch/averaged_iter460000_avg10.pt
# torchrun --nproc_per_node=8 \
#         --master_port=29501 \
#         train.py \
#         exp_dir=exp/wavcaps_Al_Tl \
#         data.train_data_config=configs/wavcaps/train_data_config_wavcaps.yaml \
#         data.max_duration=400 \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_test_data/audiocaps/audiocaps_val.jsonl.gz]' \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=10000 \
#         trainer.freeze_modules=['text_encoder','encoder_emb','encoder'] \
#         trainer.initialization.checkpoint=$pretrained_checkpoint

# ----------------audioset init unfreeze, text unfreeze ------------------
# Active run: starts train.py under torchrun with --nproc_per_node=8 and
# --master_port=29501, with GPUs 0-7 exposed through CUDA_VISIBLE_DEVICES.
# Everything after train.py is a key=value argument handed to train.py;
# presumably Hydra-style overrides, with `++key=value` being the
# add-or-override form -- confirm against train.py.
#
# The exp_dir suffix mirrors the settings below: 1e-2 <-> trainer.base_lr=0.01,
# fp16 <-> trainer.use_fp16=true; bsz6400 presumably means
# 8 processes x data.max_duration=800 -- TODO confirm.
#
# NOTE(review): the section title says "audioset init", but the checkpoint
# assignment below is commented out and none of the visible arguments passes
# trainer.initialization.checkpoint (the earlier commented-out variants do).
# Confirm whether the audio encoder is really meant to start from a checkpoint.
#
# NOTE(review): the last visible argument line ends with a continuation
# backslash. If nothing follows it, drop the backslash so a line appended later
# is not silently absorbed into this command.
#
# Do not place comment lines between the continued lines of the command: a
# comment there ends the command early.
# pretrained_checkpoint=/apdcephfs_cq12/share_302080740/user/xuanruzhou/Auden/egs/audio_classification/exp/audioset_baseline_new/epoch-50.pt
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 torchrun --nproc_per_node=8 \
        --master_port=29501 \
        train.py \
        exp_dir=exp/wavcaps_CLAP_Au_Tu_1e-2_fp16_bsz6400 \
        ++model.config.text_encoder_type="roberta-base" \
        data.train_data_config=configs/wavcaps/train_data_config_wavcaps.yaml \
        data.max_duration=800 \
        data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_test_data/audiocaps/audiocaps_val.jsonl.gz]' \
        data.use_infinite_dataset=true \
        data.num_workers=12 \
        trainer.use_fp16=true \
        trainer.lr_steps_per_epoch=5000 \
        trainer.base_lr=0.01 \
        ++model.config.init_text_encoder_from_scratch=true \