#!/bin/bash


# Dataset option presets for eval/perplexity.py, one per tokenizer family.
# Each preset is a single space-separated string of command-line options.
# The Llama-3.1 and Qwen-2.5 presets additionally pass `--split train`.
# Only PROOFPILE_LONG_SMALL_LLAMA3_1 is used by the runs below; the other
# presets and CUSTOM are kept so they can be swapped in.
PROOFPILE_LONG_SMALL="--tokenized testset/pp-tokenized-llama2 --dataset-min-tokens 131072 --samples 10 --truncate"

PROOFPILE_LONG_SMALL_LLAMA3_1="--tokenized testset/pp-tokenized-llama3 --dataset-min-tokens 131072 --samples 10 --truncate --split train"

PROOFPILE_LONG_SMALL_QWEN2_5="--tokenized testset/pp-tokenized-qwen2.5 --dataset-min-tokens 131072 --samples 10 --truncate --split train"

CUSTOM="--custom-model-together"

#######################################
# Run eval/perplexity.py on models/llama3.1-8b-ins with the Llama-3.1
# dataset preset, sweeping 8192..131072 tokens in steps of 8192.
# Globals:
#   PROOFPILE_LONG_SMALL_LLAMA3_1 (read)
# Arguments:
#   $1 - path of the CSV file passed to --output-file
#   $2 - scaling option to enable (e.g. --radix or --yarn); it is passed
#        with the value 16
# Returns:
#   Exit status of mkdir if the output directory cannot be created,
#   otherwise the exit status of the python process.
#######################################
run_perplexity() {
    local output_file=$1
    local scaling_flag=$2
    local -a dataset_args=()

    # Split the preset into words explicitly. Unlike an unquoted expansion,
    # this never glob-expands a word and does not depend on the caller's IFS.
    IFS=$' \t\n' read -r -a dataset_args <<< "${PROOFPILE_LONG_SMALL_LLAMA3_1}"

    # Ensure the destination directory exists before starting the evaluation.
    # NOTE(review): perplexity.py may already create it - confirm; mkdir -p is
    # harmless either way.
    mkdir -p -- "$(dirname -- "${output_file}")" || return

    # 16 is presumably the context-extension factor (131072 / 8192 = 16) -
    # confirm against eval/perplexity.py.
    python eval/perplexity.py \
        "${dataset_args[@]}" \
        --output-file "${output_file}" \
        --original-max-position-embeddings 8192 \
        --min-tokens 8192 --max-tokens 131072 --tokens-step 8192 --aggressive-memory \
        --flash-attention \
        "${scaling_flag}" 16 \
        -m models/llama3.1-8b-ins
}

# Both runs are always attempted, even if the first one fails.
run_perplexity output/mrrope-llama3.csv --radix

run_perplexity output/yarn-llama3.csv --yarn




