#!/bin/bash
# export PYTHONPATH=/apdcephfs_cq10/share_1603164/user/yiwenyshao/independent/auden:/apdcephfs_cq10/share_1603164/user/yiwenyshao/lhotse:/apdcephfs_cq7/share_1297902/common/allenycwang/Auden:$PYTHONPATH
# Put the local lhotse and Auden checkouts at the front of PYTHONPATH.
# ${PYTHONPATH:+:...} appends the previous value (with its ':' separator) only
# when PYTHONPATH is already set and non-empty; a plain ":$PYTHONPATH" would
# leave a trailing ':' (an empty path entry) when it is unset.
export PYTHONPATH="/apdcephfs_cq10/share_1603164/user/yiwenyshao/lhotse:/apdcephfs_cq7/share_1297902/common/allenycwang/Auden${PYTHONPATH:+:${PYTHONPATH}}"

# Restrict the CUDA devices visible to the commands below to device index 4.
export CUDA_VISIBLE_DEVICES=4
# ----------------train from scratch------------------
# The command line is assembled from arrays instead of one long
# backslash-continued command: each argument stays a single word, arguments
# can carry comments, and there is no trailing '\' after the last argument
# that would absorb whatever line follows it.

# Options consumed by torchrun itself (everything before the script name).
launcher_opts=(
  --nproc_per_node=1
  --master_port=25751
)

# key=value overrides passed to train.py.
# Presumably Hydra-style overrides, where a leading '++' means "add the key or
# override it if it already exists" -- TODO confirm against train.py.
train_overrides=(
  exp_dir=exp/auden_gs_key_from_scratch
  model.id2label_json=configs/gs_key/id2label_gs_key.json
  trainer.valid_interval=100
  trainer.base_lr=0.015
  trainer.use_fp16=False
  trainer.num_epochs=100
  data.max_duration=480
  ++data.train_data_config='configs/gs_key/train_data_config_gs_key.yaml'
  # Single-quoted so the inner double quotes and brackets reach train.py verbatim.
  ++data.valid_sets='["/apdcephfs_cq7/share_1297902/common/allenycwang/data/music_test_data/manifests/gs_key_valid.jsonl.gz"]'
  # NOTE(review): these three encoder-shape keys are set directly under
  # 'model.', while the commented-out fine-tune recipe in this file sets the
  # same keys under 'model.config.'. With '++' a misplaced key would be
  # accepted silently -- confirm which location the model actually reads.
  ++model.num_encoder_layers='[2,2,3,4,3,2]'
  ++model.feedforward_dim='[512,768,1024,1536,1024,768]'
  ++model.encoder_dim='[192,256,384,512,384,256]'
  ++model.config.fuse_encoder=true
  ++model.config.evaluate_key=true
  ++data.label_field=key
)

torchrun "${launcher_opts[@]}" train.py "${train_overrides[@]}"

# # ----------------finetune from audioset------------------
# pretrained_model_checkpoint=/apdcephfs_cq10/share_1603164/user/yiwenyshao/independent/auden/egs/audio_tag/exp/audioset_bucket_2M_orig/averaged_epoch30_avg10.pt
# torchrun --nproc_per_node=1 \
#          train.py \
#          exp_dir=exp/auden_gs_key_audiosetinit \
#          model.id2label_json=configs/gs_key/id2label_gs_key.json \
#          trainer.valid_interval=100 \
#          trainer.base_lr=0.0045 \
#          trainer.initialization.checkpoint=$pretrained_model_checkpoint \
#          trainer.lr_batches=100000 \
#          trainer.lr_epochs=100 \
#          trainer.use_fp16=False \
#          trainer.num_epochs=100 \
#          data.max_duration=480 \
#          data.use_infinite_dataset=True \
#          ++data.train_data_config='configs/gs_key/train_data_config_gs_key.yaml' \
#          ++data.valid_sets='["/apdcephfs_cq7/share_1297902/common/allenycwang/data/music_test_data/manifests/gs_key_valid.jsonl.gz"]' \
#          ++trainer.freeze_modules='[encoder_embed, encoder]' \
#          ++model.config.num_encoder_layers='[2,2,3,4,3,2]' \
#          ++model.config.feedforward_dim='[512,768,1024,1536,1024,768]' \
#          ++model.config.encoder_dim='[192,256,384,512,384,256]' \
#          ++model.config.fuse_encoder=true \
#          ++model.config.evaluate_key=true \
#          ++data.label_field=key \