#!/bin/bash
export PYTHONPATH=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden:$PYTHONPATH

# # ---------------CLAP pretrained step 100k, freeze------------------
# pretrained_model_checkpoint=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_clap/exp/wavcaps_CLAP_Au_Tu_1e-2_fp16_bsz6400/checkpoint-100000.pt
# torchrun --nproc_per_node=1 \
#          --master_port=29503 \
#         train.py \
#         ++exp_dir=urbansound8k_clap_100k_4.5e-3_bsz80 \
#         trainer.valid_interval=100 \
#         data.train_data_config=configs/urbansound8k/train_data_config_urbansound8k.yaml \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_train_data/manifests/urbansound/urbansound_9.jsonl.gz]' \
#         data.max_duration=80 \
#         trainer.use_fp16=false \
#         data.use_infinite_dataset=true \
#         trainer.base_lr=0.0045 \
#         trainer.initial_batch_count=100000 \
#         ++trainer.checkpoint.pretrained_model=$pretrained_model_checkpoint \
#         ++trainer.checkpoint.init_modules='[encoder_embed, encoder]' \

# ---------------Cap pretrained step 100k, freeze------------------
pretrained_model_checkpoint=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/exp/wavcaps_captioning_Au_Tu_5e-3_fp16_bsz6400/checkpoint-100000.pt
CUDA_VISIBLE_DEVICES=1 torchrun --nproc_per_node=1 \
         --master_port=29501 \
        train.py \
        exp_dir=exps/urbansound8k_captioning_100k_lr4_5e-3_bsz80 \
        model.id2label_json=configs/urbansound8k/id2label_urbansound8k.json \
        trainer.valid_interval=100 \
        data.train_data_config=configs/urbansound8k/train_data_config_urbansound8k.yaml \
        data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_train_data/manifests/audiotag/urbansound_9.jsonl.gz]' \
        data.max_duration=80 \
        trainer.use_fp16=false \
        data.use_infinite_dataset=true \
        trainer.base_lr=0.0045 \
        trainer.initialization.checkpoint=$pretrained_model_checkpoint \
        trainer.freeze_modules='[encoder_embed, encoder]' \

# # ---------------CapPa pretrained step 100k, freeze------------------
# pretrained_model_checkpoint=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/exp/wavcaps_masked_captioning_Au_Tu_5e-3_fp16_bsz6400/checkpoint-100000.pt
# torchrun --nproc_per_node=1 \
#          --master_port=29503 \
#         train.py \
#         ++exp_dir=urbansound8k_captioningPa_100k_4.5e-3_bsz80 \
#         trainer.valid_interval=100 \
#         data.train_data_config=configs/urbansound8k/train_data_config_urbansound8k.yaml \
#         data.valid_sets='[/apdcephfs_cq12/share_302080740/data/audio_train_data/manifests/urbansound/urbansound_9.jsonl.gz]' \
#         data.max_duration=80 \
#         trainer.use_fp16=false \
#         data.use_infinite_dataset=true \
#         trainer.base_lr=0.0045 \
#         trainer.initial_batch_count=100000 \
#         ++trainer.checkpoint.pretrained_model=$pretrained_model_checkpoint \
#         ++trainer.checkpoint.init_modules='[encoder_embed, encoder]' \