#!/bin/bash
# Launch script for train.py runs started with torchrun.
# Makes the Auden checkout importable before any run below is launched.

# Stop on failed commands, unset variables and failed pipeline stages.
set -euo pipefail

# Prepend the Auden checkout to PYTHONPATH. The ${VAR:+...} form appends the
# previous value only when it is non-empty, so an unset PYTHONPATH does not
# leave a trailing ':' (an empty search-path entry) and does not trip `set -u`.
export PYTHONPATH="/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden${PYTHONPATH:+:${PYTHONPATH}}"

# # ----------------(disabled) fine-tune on AudioCaps from a pretrained checkpoint------------------
# pretrained_checkpoint=/apdcephfs_cq12/share_302080740/user/xuanruzhou/Auden/egs/audio_classification/exp/audioset_baseline_new/epoch-50.pt
# CUDA_VISIBLE_DEVICES=3,4 torchrun --nproc_per_node=2 --master_port=29501 \
#         train.py \
#         exp_dir=exp/audio_captioning_testing \
#         data.train_data_config=configs/audiocaps/train_data_config_audiocaps.yaml \
#         data.max_duration=800 \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/manifests/audiocaps_val.jsonl.gz]' \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=10000 \
#         trainer.freeze_modules=['encoder_embed','encoder'] \
#         trainer.initialization.checkpoint=$pretrained_checkpoint \
#         trainer.valid_interval=100 \

# # ----------------(disabled) fine-tune on AudioCaps from a pretrained checkpoint with masked captioning------------------
# pretrained_checkpoint=/apdcephfs_cq12/share_302080740/user/xuanruzhou/Auden/egs/audio_classification/exp/audioset_baseline_new/epoch-50.pt
# CUDA_VISIBLE_DEVICES=3,4 torchrun --nproc_per_node=2 --master_port=29501 \
#         train.py \
#         exp_dir=exp/audio_masked_captioning_testing \
#         model.name="zipformer-masked-captioning" \
#         data.train_data_config=configs/audiocaps/train_data_config_audiocaps.yaml \
#         data.max_duration=800 \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/manifests/audiocaps_val.jsonl.gz]' \
#         data.use_infinite_dataset=true \
#         trainer.lr_steps_per_epoch=10000 \
#         trainer.freeze_modules=['encoder_embed','encoder'] \
#         trainer.initialization.checkpoint=$pretrained_checkpoint \
#         trainer.valid_interval=100 \

# ----------------train with the audiosetcaps data config from a pretrained checkpoint------------------
# Starts train.py through torchrun with two worker processes and GPUs 0 and 1
# visible. Training data comes from the audiosetcaps config; validation uses
# the audiocaps_val manifest. The exit status of this script is torchrun's.
pretrained_checkpoint=/apdcephfs_cq12/share_302080740/user/xuanruzhou/Auden/egs/audio_classification/exp/audioset_baseline_new/epoch-50.pt

# key=value overrides handed to train.py, one per array element. Entries that
# contain [ ] are single-quoted so the shell passes them through verbatim
# instead of treating the brackets as a glob pattern.
train_overrides=(
        exp_dir=exp/audiosetcaps_captioning_testing
        data.train_data_config=configs/audiosetcaps/train_data_config_audiosetcaps.yaml
        data.max_duration=800
        data.valid_sets='[/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/manifests/audiocaps_val.jsonl.gz]'
        data.use_infinite_dataset=true
        trainer.lr_steps_per_epoch=10000
        # Same argv value the previous unquoted form produced once the shell
        # had removed the inner single quotes.
        'trainer.freeze_modules=[encoder_embed,encoder]'
        "trainer.initialization.checkpoint=${pretrained_checkpoint}"
        trainer.valid_interval=100
)

# No trailing line continuation after the last argument, so a line appended
# below cannot be swallowed into this command.
CUDA_VISIBLE_DEVICES=0,1 torchrun --nproc_per_node=2 --master_port=29501 \
        train.py "${train_overrides[@]}"