TODAY=`date +%y%m%d%H%M`

## GPU Args
CUDA_VISIBLE_DEVICES=${1}
N_PROC=1
PORT_NUM=$(( ( RANDOM % 10000 )  + 10000 ))

## Model Args
MODEL_PATH=meta-llama
MODEL_NAME=Llama-2-7b-hf
CONFIG=amq/configs/llama.json
QUANTIZATION_PROXY_PATHS=("/SSD/hqq/Llama-2-7b-hf_2bit_128gs_1axis" "/SSD/hqq/Llama-2-7b-hf_3bit_128gs_1axis" "/SSD/hqq/Llama-2-7b-hf_4bit_128gs_1axis")

## Search Args
SENSITIVITY_THRESHOLD=2.0
SENSITIVITY_DATASETS=wikitext2
SENSITIVITY_N_SAMPLE=128
SENSITIVITY_SEQLEN=2048

PREDICTOR=rbf
ITERATIONS=200
N_DOE=250
N_ITER=50
MAX_VALUE=1.0

SUBSET_POP_SIZE=100
GA_POP_SIZE=200
CROSSOVER_PROB=0.9
MUT_PROB=0.1

SAVE_ITER=1
RESULT_FILE=results.txt

## Data Args
DATASET=wikitext2
N_SAMPLE=128
SEQLEN=2048
SEED=0

## Base Args
SAVE_PATH=amq/results/search/${TODAY}_${MODEL_NAME}_dataset_${DATASET}
GPU_ID=${CUDA_VISIBLE_DEVICES}

args=(
    --model_path ${MODEL_PATH} \
    --model_name ${MODEL_NAME} \
    --config ${CONFIG} \
    --quantization_proxy_paths ${QUANTIZATION_PROXY_PATHS[@]}
    --gpu_id ${GPU_ID} \
    --sensitivity_threshold ${SENSITIVITY_THRESHOLD} \
    --sensitivity_datasets ${SENSITIVITY_DATASETS} \
    --sensitivity_n_sample ${SENSITIVITY_N_SAMPLE} \
    --sensitivity_seqlen ${SENSITIVITY_SEQLEN} \
    --predictor ${PREDICTOR} \
    --iterations ${ITERATIONS} \
    --n_doe ${N_DOE} \
    --n_iter ${N_ITER} \
    --max_value ${MAX_VALUE} \
    --subset_pop_size ${SUBSET_POP_SIZE} \
    --ga_pop_size ${GA_POP_SIZE} \
    --crossover_prob ${CROSSOVER_PROB} \
    --mut_prob ${MUT_PROB} \
    --save_iter ${SAVE_ITER} \
    --save_path ${SAVE_PATH} \
    --result_file ${RESULT_FILE} \
    --dataset ${DATASET} \
    --n_sample ${N_SAMPLE}
    --seqlen ${SEQLEN} \
    --seed ${SEED} \
)

echo ${args[@]}

CUDA_VISIBLE_DEVICES=${CUDA_VISIBLE_DEVICES} accelerate launch --num_processes=${N_PROC} --num_machines=1 --main_process_port=${PORT_NUM} amq/amq_search.py ${args[@]}
