# Training run configuration.
# NOTE(review): the key meanings noted below are inferred from the key names
# only; confirm them against the script that loads this file.

# Model and objective.
model: 'Qwen/Qwen2-VL-2B-Instruct'  # looks like a model hub ID; confirm
loss: 'sft'  # presumably supervised fine-tuning; confirm
tag: 'refcoco'

# Input and output locations. All three are relative paths; presumably they
# are resolved against the launching process's working directory (verify).
data_path: '../data/data/refcoco_mix_base/annotations.json'
image_dir: '../data/data/refcoco_mix_base/images'
output_dir: '../data/ckpt'

# Numeric settings, kept as plain integers.
max_length: 2048
grad_acc: 4  # presumably gradient-accumulation steps; confirm
batch_size: 4
