# Example launch command (4 worker processes):
#   torchrun --nproc_per_node=4 --master_port 18341 v2/train.py
#
# GPU ids to use, written as one comma-separated string. Keep exactly one
# `gpus` line active; the commented lines are alternative selections.
# NOTE(review): the active entry lists 4 ids, which matches
# --nproc_per_node=4 above; presumably the two must agree. Confirm in
# v2/train.py.
# gpus: '0'
# gpus: '4, 5, 6, 7'
gpus: '0, 1, 2, 3'
# gpus: '0, 1, 2, 3, 4, 5, 6, 7'

# Arguments for the training run, grouped under one mapping.
# NOTE(review): presumably split by v2/train.py into Hugging Face
# TrainingArguments fields and project-specific model args; confirm
# against the loader before renaming or removing keys.
transformers_args:
  # --- Model / adapter settings ---
  # train_from_scratch: true
  # NOTE(review): if forwarded to HF TrainingArguments, `false` keeps dataset
  # columns that are not in the model's forward() signature; confirm.
  remove_unused_columns: false
  vlm_model_path: 'llava-hf/llava-v1.6-mistral-7b-hf'
  exp_name: 'llava-mistral-core_div_A_neighbor_lora'
  lora_rank: 16
  # Optional path to a previously saved adapter checkpoint (disabled).
  # peft_model_path: 'v2/output/llava-mistral-my_lora-20250308-11:09:11/checkpoint-459'
  my_lora: true

  # --- Batch sizing presets (keep exactly one preset active) ---
  # Preset labelled "zero2 a100" (presumably DeepSpeed ZeRO stage 2 on A100
  # GPUs; confirm), currently disabled:
  # per_device_eval_batch_size: 1
  # per_device_train_batch_size: 1
  # gradient_accumulation_steps: 8
  # eval_accumulation_steps: 1
  # Preset labelled "zero3 a100" (presumably DeepSpeed ZeRO stage 3 on A100
  # GPUs; confirm), currently active:
  per_device_eval_batch_size: 1
  per_device_train_batch_size: 1
  gradient_accumulation_steps: 4
  eval_accumulation_steps: 1

