#!/bin/bash

# Run configuration: LoRA hyperparameters, GPU selection and learning rate.
rank=16
# Bash performs no arithmetic in a plain assignment: `alpha=2*rank` would store
# the literal string "2*rank". Arithmetic expansion yields the number 2 * rank.
alpha=$((2 * rank))
gpuid=0
learning_rate=3e-5
# Start time formatted as YYYYMMDD-HHMMSS.
# NOTE(review): not referenced by any command visible in this script.
timestamp=$(date +%Y%m%d-%H%M%S)

# Filesystem locations. The values look like placeholders to be replaced
# before running — TODO confirm.
# Passed as --base_model to both the training and evaluation scripts.
model_p_or_n=/yourbasemodelpath
# Training --output_dir; read back as --lora_weights during evaluation.
model_path=/youradapterpath
# Passed as --save_dir to the evaluation script.
results_path=/resultspath

# Create both output directories up front (-p: no error if they already
# exist). Expansions are quoted so a path containing spaces or glob
# characters is passed to mkdir as a single, literal argument.
mkdir -p -- "$model_path" "$results_path"


# Exported so every child process sees WANDB_MODE=disabled
# (presumably to switch off Weights & Biases logging — confirm against wandb docs).
export WANDB_MODE=disabled

# Command-line arguments for finetune.py, kept in an array so every value is
# passed verbatim as exactly one argument: no word splitting, no glob
# expansion, and the empty --wandb_project value is preserved.
# Flag semantics are defined by finetune.py, which is not shown here.
finetune_args=(
  --base_model "$model_p_or_n"
  --data_path 'ft-training_set/commonsense_170k.json'
  --output_dir "$model_path"
  --batch_size 16
  --micro_batch_size 4
  --num_epochs 3
  --learning_rate "$learning_rate"
  --cutoff_len 256
  --val_set_size 120
  --adapter_name lora
  --load_8bit False
  --lora_r "$rank"
  --lora_alpha "$alpha"
  --lora_dropout 0.05
  --lora_act_fn tanh
  --target_modules '["q_proj", "k_proj", "v_proj", "up_proj", "down_proj"]'
  --use_gradient_checkpointing True
  --wandb_project ""
)

# Train on the GPU selected by $gpuid (python -u: unbuffered output).
# If training fails, stop here with its exit status: the evaluation step that
# follows reads the adapter from $model_path, which would be missing or stale.
CUDA_VISIBLE_DEVICES="$gpuid" python -u finetune.py "${finetune_args[@]}" || {
  status=$?
  echo "finetune.py failed with exit status ${status}; skipping evaluation." >&2
  exit "$status"
}

# Evaluate the adapter stored in $model_path on each dataset in turn, one
# commonsense_evaluate.py run per dataset on the GPU selected by $gpuid.
# The exit status of each run is not checked, so a failure on one dataset
# does not prevent the remaining datasets from being evaluated.
datasets=(
  ARC-Easy
  openbookqa
  social_i_qa
  ARC-Challenge
  winogrande
  piqa
  boolq
  hellaswag
)

for ds in "${datasets[@]}"; do
  # All expansions are quoted so each value reaches the script as a single,
  # literal argument.
  CUDA_VISIBLE_DEVICES="$gpuid" python -u commonsense_evaluate.py \
    --model LLaMA3 \
    --adapter LoRA \
    --dataset "$ds" \
    --batch_size 1 \
    --base_model "$model_p_or_n" \
    --lora_weights "$model_path" \
    --save_dir "$results_path" \
    --lora_r "$rank" \
    --lora_act_fn tanh
done