#!/bin/bash

# ====== CONFIGURATION ======
model_path="path/to/folder/pretrained_model/"
task="humaneval_instruct"
max_tokens="768"
diffusion_steps="192" # Have no effects on the CoDiLA model evaluation
limit=5
model_arch="codila"
experiment_name="test"
block_size="4"

# ====== HELPERS ======

timestamp=$(date +%Y%m%d_%H%M%S_%3N)
safe_model_name=$(echo "$model_path" | sed 's/[^a-zA-Z0-9_]/_/g')

log_dir="./data/logs-average/$task/$experiment_name/steps=$diffusion_steps-max_tokens=$max_tokens/$safe_model_name"
output_dir="./data/output_reproduce-average/$task/$experiment_name/steps=$diffusion_steps-max_tokens=$max_tokens/$safe_model_name"

mkdir -p "$log_dir" "$output_dir"

echo "Running local job | task=$task | steps=$diffusion_steps"

# Compose limit argument only if it's not "None"
if [[ "$limit" == "None" ]]; then
    limit_arg=""
else
    limit_arg="--limit $limit"
fi

model_args="pretrained=$model_path,trust_remote_code=True,max_new_tokens=$max_tokens,diffusion_steps=$diffusion_steps,dtype=bfloat16,alg=$alg,block_size=$block_size"


export PATH=/usr/local/cuda/bin:$PATH
export LD_LIBRARY_PATH=/usr/local/cuda/lib64:$LD_LIBRARY_PATH
export PYTHONPATH=.
export VLLM_ENABLE_V1_MULTIPROCESSING=0
export HF_ALLOW_CODE_EVAL=1
export VLLM_LOG_LEVEL=error


python3 -u -m lm_eval \
    --model "$model_arch" \
    --model_args "$model_args" \
    --tasks "$task" \
    --device cuda \
    --batch_size 1 \
    --num_fewshot 0 \
    --output_path "$output_dir/$timestamp" \
    $limit_arg \
    --confirm_run_unsafe_code \
    --apply_chat_template \
    > "${log_dir}/${timestamp}.out" 2> "${log_dir}/${timestamp}.err"
