# Example launch command (8 processes, one per GPU id listed in `gpus`):
#   torchrun --nproc_per_node=8 --master_port 18343 v2/train.py
#
# Comma-separated GPU ids for the run (presumably device indices; verify
# against the loader). Alternative selections are kept commented out for
# quick switching.
# gpus: "0"
gpus: "0,1,2,3,4,5,6,7"
# NOTE(review): the variant below has spaces after the commas; confirm the
# consumer strips whitespace before re-enabling it.
# gpus: "0, 1, 2, 3"

# Arguments for an evaluation-only run: do_train is false and do_eval is true.
# The section name suggests these are forwarded to the argument parser used by
# v2/train.py -- TODO confirm against the loader.
transformers_args:
  # --- model ---
  # train_from_scratch: true
  remove_unused_columns: false
  vlm_model_path: "llava-hf/llava-v1.6-mistral-7b-hf"
  # Adapter checkpoint to evaluate. Keep the quotes: the directory name
  # contains single quotes, square brackets and colons.
  peft_model_path: "v2/output/llava-mistral-core_no_div_neighbor_lora-rank16-['multi_modal_projector']-['down_proj']-['slake_vqa']-20250405-13:28:40/checkpoint-924"

  # --- experiment / PEFT ---
  exp_name: "eval"
  use_peft: true
  # Options listed by the original author: lora, ada-lora, vb-lora, vera,
  # dora, prefix-tuning, prompt-tuning, ia3.
  # NOTE(review): the checkpoint directory above is named "...lora-rank16...";
  # confirm that "vb-lora" is the adapter type that checkpoint was saved with.
  peft_type: "vb-lora"
  lora_rank: 16  # same number as the "rank16" in the checkpoint directory name
  p_tuning_token: 256  # presumably only read by the prompt/prefix types; verify
  my_lora: true

  # --- run mode ---
  # deepspeed: null
  do_train: false
  do_eval: true
  requires_grad_list: []

  # --- batch sizes ---
  # zero2 a100 preset (disabled; currently the same values as the active one)
  # per_device_eval_batch_size: 1
  # per_device_train_batch_size: 1
  # gradient_accumulation_steps: 8
  # eval_accumulation_steps: 1
  # zero3 a100 preset (active)
  per_device_eval_batch_size: 1
  per_device_train_batch_size: 1
  gradient_accumulation_steps: 8
  eval_accumulation_steps: 1
