#!/bin/bash
#
# Launches a single-process torchrun job (GPU index 3) that runs train.py with
# the VGGSound configs, initializing from a pretrained checkpoint and passing
# every setting as a key=value override on the command line.
#
# Run this from the directory that contains train.py and configs/: both are
# referenced by relative path below.

# Abort on command failure, on use of an unset variable, and on pipeline errors,
# so a mistyped variable name cannot silently launch a run with an empty value.
set -euo pipefail

# Make the Auden checkout importable. The ${VAR:+...} form appends the previous
# PYTHONPATH only when it is non-empty, which avoids leaving a trailing ':'
# (an empty path entry) when PYTHONPATH was unset.
auden_root=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden
export PYTHONPATH="${auden_root}${PYTHONPATH:+:${PYTHONPATH}}"

# Checkpoint handed to trainer.initialization.checkpoint below.
pretrained_model_checkpoint=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_clap/exp/CaptionStew_400k_CLAP_Au_Tu_1e-2_fp16_bsz5120_shuffled/checkpoint-252k.pt

# Other checkpoint paths kept for reference; nothing below refers to them.
# audioset_pretrained=exp/audioset_bucket_2M_init/averaged_epoch9_avg3.pt
# asr_pretrained=/apdcephfs_cq10/share_1603164/user/yiwenyshao/independent/auden/egs/asr/exp/auden_zh_r3large_full_8gpu/averaged_iter1412000_avg10.pt

# Overrides passed to train.py. They live in an array so that each entry can be
# commented and no trailing backslash continuation is needed.
train_args=(
  # Output directory. Its name appears to encode the run settings
  # (e.g. "bsz1280" vs data.max_duration, "4_5e-3" vs trainer.base_lr);
  # keep them in sync when changing either.
  exp_dir=/apdcephfs_cq10_1603164/share_1603164/user/raytseng/research/exp/audio_tagging/vggsound_CaptionStew_400k_CLAP_252k_4_5e-3_bsz1280_MHAP

  # Hydra-style '++' prefix, presumably "add the key or override it if present".
  # NOTE(review): confirm train.py parses overrides with Hydra.
  ++model.config.pooling=mhap
  model.id2label_json=configs/vggsound/id2label_vggsound.json

  data.train_data_config=configs/vggsound/train_data_config_vggsound.yaml
  # Single-quoted so the shell passes the [...] list through literally.
  data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_test_data/audiotag/vggsound_test.jsonl.gz]'
  data.max_duration=1280
  data.use_infinite_dataset=true

  trainer.lr_steps_per_epoch=720
  trainer.base_lr=0.0045
  "trainer.initialization.checkpoint=${pretrained_model_checkpoint}"
  # Quoted because the list contains a space.
  trainer.freeze_modules='[encoder_embed, encoder]'
  trainer.valid_interval=250
)

# CUDA_VISIBLE_DEVICES is set for this command only; one process is started and
# the rendezvous port is pinned to 29503.
CUDA_VISIBLE_DEVICES=3 torchrun --nproc_per_node=1 \
  --master_port=29503 \
  train.py "${train_args[@]}"


# export CUDA_VISIBLE_DEVICES=4,5,6,7
# torchrun --nproc_per_node=4 \
#         --master_port=29501 \
#         train.py \
#         exp_dir=exp/vggsound_scratch_test \
#         model.config_preset=base \
#         model.id2label_json=configs/vggsound/id2label_vggsound.json \
#         data.train_data_config=configs/vggsound/train_data_config_vggsound.yaml \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_test_data/audiotag/vggsound_test.jsonl.gz]' \
#         data.max_duration=800 \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=1000 \
#         trainer.base_lr=0.045