#!/bin/bash

# Run run_ruler.py with the "restkv" method on Llama-3.1-8B-Instruct, then
# run eval_ruler.py on the results directory for input length 4096.
#
# Abort on the first failing command (or unset variable) so that
# eval_ruler.py is never run against missing or stale results when the
# preceding step fails.
set -euo pipefail

# Single source of truth for the output location; it is used by mkdir,
# --save_dir, and the evaluation path below.
save_dir="output_dirs/ruler_llama3.1"

# NOTE(review): the sub-directory name below is presumably derived by
# run_ruler.py from the model name and --max_capacity_prompts; confirm
# before changing either of those arguments.
results_root="${save_dir}/llama-3.1-8b-instruct_1024"

mkdir -p -- "${save_dir}"

# The last argument intentionally has no trailing backslash: a dangling
# continuation would swallow the next command if the blank line after it
# were ever removed.
CUDA_VISIBLE_DEVICES=0 python3 run_ruler.py \
    --method "restkv" \
    --model_path "meta-llama/Llama-3.1-8B-Instruct" \
    --max_capacity_prompts 1024 \
    --attn_implementation flash_attention_2 \
    --save_dir "${save_dir}" \
    --add_file_name "llama3.1" \
    --window_size 32 \
    --pooling "adaptive" \
    --kernel_sizes 21 \
    --use_wo \
    --use_ema

python3 eval_ruler.py \
    --results_dir "${results_root}/4096"

# uncomment the following lines to evaluate other input lengths
# python3 eval_ruler.py \
#     --results_dir output_dirs/ruler_llama3.1/llama-3.1-8b-instruct_1024/8192

# python3 eval_ruler.py \
#     --results_dir output_dirs/ruler_llama3.1/llama-3.1-8b-instruct_1024/16384