# Hugging Face opt-in switches. They are exported so that every child process
# started later in this script (the `accelerate launch` runs) inherits them.
#   HF_ALLOW_CODE_EVAL            - opt in to code-execution based evaluation
#   HF_DATASETS_TRUST_REMOTE_CODE - opt in to dataset loaders shipping code
HF_ALLOW_CODE_EVAL=1
HF_DATASETS_TRUST_REMOTE_CODE=true
export HF_ALLOW_CODE_EVAL HF_DATASETS_TRUST_REMOTE_CODE

# ---------------------------------------------------------------------------
# GSM8K: run eval_llada.py twice with identical generation settings, once
# for the baseline LLaDA checkpoint and once for the dParallel checkpoint.
# ---------------------------------------------------------------------------
task=gsm8k
length=256        # forwarded to the model as gen_length
block_length=32
num_fewshot=0
# steps = how many blocks of block_length fit in length (256 / 32 = 8).
steps=$((length / block_length))

# Checkpoint used by the dParallel run. The path used to be a hard-coded empty
# string; it is now taken from the environment so the script does not have to
# be edited, e.g.  DPARALLEL_MODEL_PATH=/path/to/checkpoint sh <this script>
# Leaving the variable unset keeps the previous behaviour (empty model_path).
dparallel_model_path=${DPARALLEL_MODEL_PATH:-}
if [ -z "${dparallel_model_path}" ]; then
  printf '%s\n' "warning: DPARALLEL_MODEL_PATH is empty; the dParallel ${task} run will be launched with an empty model_path" >&2
fi

# baseline
CUDA_VISIBLE_DEVICES=0,1,2,3 accelerate launch --main_process_port 29600 eval_llada.py \
  --tasks "${task}" --num_fewshot "${num_fewshot}" \
  --confirm_run_unsafe_code --model llada_dist \
  --model_args "model_path=GSAI-ML/LLaDA-8B-Instruct,gen_length=${length},steps=${steps},block_length=${block_length},show_speed=True,task=${task}"

# dParallel: same settings plus threshold=0.5.
# NOTE(review): the baseline uses GPUs 0-3 while this run uses GPUs 1-4; kept
# exactly as in the original - confirm the offset is intentional.
CUDA_VISIBLE_DEVICES=1,2,3,4 accelerate launch --main_process_port 29600 eval_llada.py \
  --tasks "${task}" --num_fewshot "${num_fewshot}" \
  --confirm_run_unsafe_code --model llada_dist \
  --model_args "model_path=${dparallel_model_path},gen_length=${length},steps=${steps},block_length=${block_length},show_speed=True,threshold=0.5,task=${task}"



# ---------------------------------------------------------------------------
# Minerva MATH (4-shot): run eval_llada.py twice with identical generation
# settings, once for the baseline LLaDA checkpoint and once for the dParallel
# checkpoint.
# ---------------------------------------------------------------------------
task=minerva_math
length=256        # forwarded to the model as gen_length
block_length=32
num_fewshot=4
# steps = how many blocks of block_length fit in length (256 / 32 = 8).
steps=$((length / block_length))

# Checkpoint used by the dParallel run. The path used to be a hard-coded empty
# string; it is now taken from the environment so the script does not have to
# be edited, e.g.  DPARALLEL_MODEL_PATH=/path/to/checkpoint sh <this script>
# Leaving the variable unset keeps the previous behaviour (empty model_path).
dparallel_model_path=${DPARALLEL_MODEL_PATH:-}
if [ -z "${dparallel_model_path}" ]; then
  printf '%s\n' "warning: DPARALLEL_MODEL_PATH is empty; the dParallel ${task} run will be launched with an empty model_path" >&2
fi

# baseline
CUDA_VISIBLE_DEVICES=0,1,2,3 accelerate launch --main_process_port 29600 eval_llada.py \
  --tasks "${task}" --num_fewshot "${num_fewshot}" \
  --confirm_run_unsafe_code --model llada_dist \
  --model_args "model_path=GSAI-ML/LLaDA-8B-Instruct,gen_length=${length},steps=${steps},block_length=${block_length},show_speed=True,task=${task}"

# dParallel: same settings plus threshold=0.5.
# NOTE(review): the baseline uses GPUs 0-3 while this run uses GPUs 1-4; kept
# exactly as in the original - confirm the offset is intentional.
CUDA_VISIBLE_DEVICES=1,2,3,4 accelerate launch --main_process_port 29600 eval_llada.py \
  --tasks "${task}" --num_fewshot "${num_fewshot}" \
  --confirm_run_unsafe_code --model llada_dist \
  --model_args "model_path=${dparallel_model_path},gen_length=${length},steps=${steps},block_length=${block_length},show_speed=True,threshold=0.5,task=${task}"







