#!/bin/bash
echo "conda location: $(which conda)"
echo "Python location: $(which python)"
echo "Python version: $(python --version)"


export EXP_NAME=your_EXP_NAME
export HF_DATASETS_CACHE=your_cache_path
export HF_HOME=your_cache_path
export WANDB_DISABLED=false
export WANDB_PROJECT=wandb_temp
export WANDB_API_KEY=your_key
export HUGGING_FACE_HUB_TOKEN=your_token

export WANDB_RUN_GROUP=vlm2vector
export EXP_NAME=Your_task_name
export WANDB_NAME=$EXP_NAME
export EXP_DIR=.../$EXP_NAME
export WANDB_DIR=$EXP_DIR
echo $EXP_DIR

cmd="
CUDA_VISIBLE_DEVICES=0,1,2,3,4,5,6,7 \
torchrun \
  --nproc_per_node=8 \
  --master_port=2208 \
  --max_restarts=0 \
    train.py \
  --lora \
  --lora_r 16 \
  --model_name /your/path/to/Qwen2-VL-2B-Instruct \
  --bf16 \
  --pooling eos \
  --normalize True \
  --temperature 0.02 \
  --dataloader_num_workers 1 \
  --dataset_config /your/path/to/train_alltasks.yaml \
  --run_name $EXP_NAME \
  --output_dir $EXP_DIR \
  --grad_cache True \
  --per_device_train_batch_size 128 \
  --gc_q_chunk_size 8 \
  --gc_p_chunk_size 8 \
  --interleave_batch_size 64 \
  --image_resolution high \
  --lr_scheduler_type linear \
  --learning_rate 5e-5 \
  --max_steps 2000 \
  --warmup_steps 100 \
  --save_steps 50 \
  --logging_steps 1 \
  --save_safetensors True \
  --remove_unused_columns False \
  --resume_from auto \
  --report_to tensorboard \
  2>&1 | tee $EXP_DIR/train.log
"

echo $cmd
eval $cmd
