#!/bin/bash
#
# Linear probing of a frozen audio encoder on DESED for sound event detection.
#
# Launches train_desed.py through torchrun as a single process with only CUDA
# device 1 visible, initializing the model from the pretrained checkpoint
# configured below. train_desed.py and the configs/ files are referenced by
# relative path, so run this script from the directory that contains them.
set -euo pipefail

# Root of the Auden checkout; it is put on PYTHONPATH and also holds the
# pretrained checkpoint.
readonly auden_root=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden

# Prepend the checkout. The ${VAR:+...} form only adds the ':' separator when
# PYTHONPATH is already set and non-empty, so no empty trailing entry is left
# behind (and the expansion is safe under `set -u`).
export PYTHONPATH="${auden_root}${PYTHONPATH:+:${PYTHONPATH}}"

readonly pretrained_model_checkpoint="${auden_root}/egs/audio_clap/exp/wavcaps_CLAP_Au_Tu_1e-2_fp16_bsz6400/checkpoint-200000.pt"
readonly valid_manifest=/apdcephfs_cq12/share_302080740/user/raytseng/data/dcase_2022_task4/manifest/desed_development_real_mono.jsonl.gz

# Arguments are collected in an array so that each override is exactly one
# word, with no line-continuation backslashes to keep in sync.
# NOTE(review): the key=value / ++key=value arguments look like Hydra-style
# config overrides consumed by train_desed.py -- confirm against that script.
torchrun_args=(
  # torchrun launcher options
  --nproc_per_node=1
  --master_port=29501

  # Training entry point followed by its configuration overrides
  train_desed.py
  exp_dir=exp/testing
  model.id2label_json=configs/desed/id2label_desed.json
  model.name=zipformer-desed
  trainer.valid_interval=100
  data.train_data_config=configs/desed/train_data_config_desed.yaml
  # List values are passed without inner quotes around the items: this is the
  # exact text the training script has always received for these options.
  "data.valid_sets=[${valid_manifest}]"
  data.max_duration=1280
  trainer.use_fp16=false
  data.use_infinite_dataset=true
  data.mix_dataset=false
  trainer.base_lr=0.05
  "trainer.initialization.checkpoint=${pretrained_model_checkpoint}"
  # The modules listed here are the ones kept frozen for linear probing.
  'trainer.freeze_modules=[encoder_embed, encoder]'
  '++trainer.psds_types=[psds1, psds2]'
)

CUDA_VISIBLE_DEVICES=1 torchrun "${torchrun_args[@]}"