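# Launch command:
#   torchrun --nproc_per_node=4 --master_port 18340 v2/train.py
# NOTE(review): the command starts 4 processes per node, while `gpus` below
# lists two device indices - confirm the two are meant to agree.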
# GPU device indices, given as one comma-separated string.
# Single-device alternative (disabled):
# gpus: '0'
gpus: '2, 3'

# Training arguments for the run.
# NOTE(review): presumably handed to the training script's argument parser -
# confirm against v2/train.py.
transformers_args:
  # ---- model / data ----
  # Disabled option:
  # train_from_scratch: true
  remove_unused_columns: false
  data_dir:
    - 'slake_vqa'
  vlm_model_path: 'llava-hf/llava-v1.6-mistral-7b-hf'
  exp_name: 'llava-mistral-lora'
  lora_rank: 16
  # Disabled: path to a checkpoint directory saved by an earlier run.
  # peft_model_path: "/vsphhome/xwx/med-MLLM/v2/output/llava-mistral-lora-20250306-17:26:58/checkpoint-459"
  my_lora: false

  # ---- batch sizing ----
  # Profile "zero2 a100" (disabled):
  # per_device_eval_batch_size: 1
  # per_device_train_batch_size: 1
  # gradient_accumulation_steps: 8
  # eval_accumulation_steps: 1

  # Profile "zero3 a100" (active). It differs from the zero2 profile above
  # only in eval_accumulation_steps (8 instead of 1).
  per_device_eval_batch_size: 1
  per_device_train_batch_size: 1
  gradient_accumulation_steps: 8
  eval_accumulation_steps: 8

  

