# Run configuration: a flat mapping of seven scalar settings.
# NOTE(review): the script that loads this file is not visible here, so the
# per-key notes below are inferred from key names and values only -- confirm
# each against the loader before relying on it.

# Model identifier in "<namespace>/<name>" form; presumably a Hugging Face Hub
# repo id -- verify how the loader resolves it.
model: llava-hf/llava-onevision-qwen2-0.5b-ov-hf
# Loss/objective selector; "sft" presumably means supervised fine-tuning --
# TODO confirm the set of accepted values.
loss: sft
# Free-form label for this run; matches the "refcoco" dataset name used in the
# paths below. How it is used (naming, logging, ...) is not shown here.
tag: refcoco
# Annotation file (JSON) and image directory. Both are relative paths; the
# base directory they resolve against is decided by the loader (likely the
# process working directory -- verify).
data_path: ../data/data/refcoco_mix/annotations.json
image_dir: ../data/data/refcoco_mix/images
# Relative output location; presumably where checkpoints are written, given
# the "ckpt" directory name -- confirm.
output_dir: ../data/ckpt
# Plain integer (unquoted, so YAML parses it as an int). Presumably the
# maximum sequence length in tokens -- TODO confirm units and truncation
# behavior.
max_length: 2048
