#!/bin/bash

base=liuhaotian/llava-v1.5-7b
epoch=2
# ROOT=$(dirname $(dirname "$(realpath "$0")"))
# DATA_ROOT="$(dirname $(dirname $(dirname $(dirname $ROOT))))/data"
# Run from LLaRA/train-llava, as in bash scripts/script.sh
ROOT=./
DATA_ROOT=../../../../data

export WANDB_PROJECT=digit_llara

deepspeed --master_port 29641 $ROOT/llava/train/train_mem.py     --deepspeed $ROOT/scripts/zero3_offload.json     --model_name_or_path $base     --version v1     --data_path $DATA_ROOT/vima/D-inBC-text-multi_aux-obj_det_aux-obj_loc_aux-act_pred_aux-fut_pred1_1_1_1-train-80k-front.json     --image_folder  $DATA_ROOT/vima/images     --vision_tower openai/clip-vit-large-patch14-336     --mm_projector_type mlp2x_gelu     --mm_vision_select_layer -2     --mm_use_im_start_end False     --mm_use_im_patch_token False     --image_aspect_ratio pad     --group_by_modality_length True     --bf16 True     --num_train_epochs $epoch     --per_device_train_batch_size 8     --per_device_eval_batch_size 4     --gradient_accumulation_steps 1     --evaluation_strategy "no"     --save_strategy "steps"     --save_steps 50000     --save_total_limit 1     --learning_rate 2e-5     --weight_decay 0.     --warmup_ratio 0.03     --lr_scheduler_type "cosine"     --logging_steps 1     --tf32 True     --model_max_length 2048     --gradient_checkpointing True     --dataloader_num_workers 4     --lazy_preprocess True     --output_dir $DATA_ROOT/vima/checkpoints/$base-80k-ep$epoch-digit_base     --run_name 80k-digit_base     --loss_type digit_base
