#!/usr/bin/env bash
# Runs two training steps back to back, each restricted to CUDA device 0:
#   1. llava_alignment_model_trainer.py (invoked with no arguments)
#   2. trainsae_for_llava_mean.py (invoked with the hyperparameters below)
#
# Both Python files are referenced by relative path, so run this script from
# the directory that contains them.

# Stop at the first failing command or unset variable, so that step 2 is never
# launched after step 1 has exited with an error and the script's exit status
# reflects the failure.
# NOTE(review): presumably step 2 relies on artifacts produced by step 1 —
# confirm against the Python sources.
set -eu

# Hyperparameters forwarded to trainsae_for_llava_mean.py via the
# command-line flags of the same name.
sae_type=vlsae
topk=512
hidden_ratio=8
warmup_epochs=2
num_epochs=10

# Step 1: alignment model trainer.
CUDA_VISIBLE_DEVICES=0 python llava_alignment_model_trainer.py

# Step 2: SAE trainer. Expansions are quoted so each value is always passed
# as exactly one argument, even if it is later edited to contain spaces or
# glob characters.
CUDA_VISIBLE_DEVICES=0 python trainsae_for_llava_mean.py \
    --sae_type "${sae_type}" \
    --topk "${topk}" \
    --hidden_ratio "${hidden_ratio}" \
    --num_epochs "${num_epochs}" \
    --warmup_epochs "${warmup_epochs}" \
    --initial_lr 0.0001 \
    --batch_size 512 \
    --alpha 0