#!/bin/bash
#
# Launches train.py under torchrun (4 processes, GPUs 4-7) for sound event
# detection on AudioSet-SL. This is a linear-probing run: the modules listed
# in trainer.freeze_modules are frozen and the model is initialized from a
# pretrained audio-captioning checkpoint.
#
# train.py and the configs/ paths below are relative, so run this script from
# the directory that contains them.

# Fail fast: abort on command errors, on use of unset variables (catches
# mistyped variable names), and on failures inside pipelines.
set -euo pipefail

# Prepend the Auden checkout to Python's module search path. ${PYTHONPATH:-}
# yields the same value as the plain expansion but does not trip `set -u`
# when PYTHONPATH is unset.
export PYTHONPATH="/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden:${PYTHONPATH:-}"

# Validation manifests, written as a bracketed, comma-separated list.
# The commented-out assignment is the full five-subset variant; the active one
# validates on subset 0 only.
# valid_sets='[/apdcephfs_cq12/share_302080740/user/raytseng/data/AudioSet-SL/manifests/audioset_eval_subset_0.jsonl.gz,/apdcephfs_cq12/share_302080740/user/raytseng/data/AudioSet-SL/manifests/audioset_eval_subset_1.jsonl.gz,/apdcephfs_cq12/share_302080740/user/raytseng/data/AudioSet-SL/manifests/audioset_eval_subset_2.jsonl.gz,/apdcephfs_cq12/share_302080740/user/raytseng/data/AudioSet-SL/manifests/audioset_eval_subset_3.jsonl.gz,/apdcephfs_cq12/share_302080740/user/raytseng/data/AudioSet-SL/manifests/audioset_eval_subset_4.jsonl.gz]'
valid_sets='[/apdcephfs_cq12/share_302080740/user/raytseng/data/AudioSet-SL/manifests/audioset_eval_subset_0.jsonl.gz]'

# Checkpoint passed as trainer.initialization.checkpoint.
pretrained_model_checkpoint=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/exp/CaptionStew_1M_masked_captioning_AU_TU_5e-3_fp16_bsz5120_shuffled/checkpoint-50000.pt

# key=value overrides handed to train.py. They live in an array so that each
# override is passed as exactly one argument: values containing '[', ']', ','
# or spaces are never word-split or glob-expanded, and no line-continuation
# backslashes are needed (the original ended with a dangling one).
train_args=(
  exp_dir=/apdcephfs_cq12/share_302080740/user/raytseng/research/exp/sound_event_detection/audioset-sl_CaptionStew_1M_captioningPa_TUAU_50k_4_5e-1_bsz2560_warmup
  model.id2label_json=configs/audioset-sl/id2label_audioset-sl.json
  data.train_data_config=configs/audioset-sl/train_data_config_audioset-sl.yaml
  "data.valid_sets=${valid_sets}"
  data.max_duration=640
  trainer.use_fp16=false
  trainer.base_lr=0.45
  trainer.warmup_batches=1600
  "trainer.initialization.checkpoint=${pretrained_model_checkpoint}"
  # Modules kept frozen during training (the "linear probing" part).
  'trainer.freeze_modules=[encoder_embed, encoder]'
  # NOTE(review): the '++' prefix looks like Hydra's "add or override" syntax,
  # i.e. this key may be absent from the base config - confirm against train.py.
  '++trainer.psds_types=[psds1_no_penalty]'
  trainer.valid_interval=2000
)

# One process per visible GPU; the explicit master port is passed through
# unchanged from the original launcher.
CUDA_VISIBLE_DEVICES=4,5,6,7 torchrun \
  --nproc_per_node=4 \
  --master_port=29504 \
  train.py "${train_args[@]}"