#!/bin/bash
# Put the Auden checkout at the front of the Python module search path.
# The ":<old value>" suffix is appended only when PYTHONPATH is already set and
# non-empty, so an unset variable does not leave a trailing ":" (an empty
# search-path entry) behind.
export PYTHONPATH="/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden${PYTHONPATH:+:${PYTHONPATH}}"

# Validation manifests, written as a bracketed list; the value is handed to
# train.py as data.valid_sets further down.
manifest_dir=/apdcephfs_cq12/share_302080740/user/raytseng/research/Auden-refactor-online/Auden/egs/audio_captioning/manifests
valid_sets="[${manifest_dir}/audiocaps_val.jsonl.gz]"

# Launch train.py through torchrun on GPU 0.
#
# Reads: valid_sets (bracketed list of validation manifests).
# The arguments are kept in arrays so that each one stays a single word and
# no trailing line continuation can swallow whatever follows the command.

# Options for torchrun itself.
torchrun_opts=(
  # One worker process, matching the single device exposed through
  # CUDA_VISIBLE_DEVICES below; a worker count of 0 cannot start any
  # training process.
  --nproc_per_node=1
  --master_port=29500
)

# key=value arguments passed to train.py, in their original order.
train_overrides=(
  exp_dir=exp/testing
  ++model.config.text_encoder_type="roberta-base"
  data.train_data_config=configs/captionstew_full/train_data_config_captionstew_full.yaml
  data.max_duration=640
  # Quoted so the brackets in the list are never treated as a glob pattern
  # and the value is never word-split.
  data.valid_sets="${valid_sets-}"
  data.use_infinite_dataset=true
  data.num_workers=12
  trainer.use_fp16=true
  trainer.lr_steps_per_epoch=25000
  trainer.base_lr=0.01
  ++model.config.init_text_encoder_from_scratch=true
  trainer.valid_interval=100
)

CUDA_VISIBLE_DEVICES=0 torchrun "${torchrun_opts[@]}" \
  train.py "${train_overrides[@]}"