#!/bin/bash
#
# Launches perplexity_yarn.py (looked up relative to the current working
# directory) with a fixed set of flags for the
# "int_quant_hardmard_no_interpolation_qkv" run.
#
# Usage:
#   bash <this-script>
#   LLAMA_MODEL_DIR=/path/to/llama-2-7b-chat_hf bash <this-script>
#
# Environment:
#   LLAMA_MODEL_DIR  Optional. Value handed to -m. When unset or empty, the
#                    path that used to be hard-coded in this script is used,
#                    so existing invocations behave exactly as before.
#
# Exit status: that of the python command, which is the last command run.
#
# The meaning of every flag is defined by perplexity_yarn.py, which is not
# part of this file; the values below are passed through unchanged.

# Abort on a misspelled variable name instead of silently passing an empty
# argument to the Python script.
set -u

# A single tag feeds both --output-file and --comment so the two cannot drift.
# NOTE(review): "hardmard" is kept exactly as spelled; the same spelling occurs
# in --apply_hardmard and presumably has to match what perplexity_yarn.py
# accepts -- confirm before renaming.
readonly run_tag='int_quant_hardmard_no_interpolation_qkv'

# Model location for -m; overridable so the script is not tied to one user's
# home directory.
readonly model_dir="${LLAMA_MODEL_DIR:-/home/yeq6/Research_project/llama/llama-2-7b-chat_hf}"

# Arguments are kept in an array so each one reaches python as exactly one
# word, regardless of spaces in an overridden model path.
ppl_args=(
  --tokenized output/govreport-test-tokenized-awq
  --dataset-min-tokens 20384
  --samples 10
  --output-file "ppl_results/${run_tag}"
  --min-tokens 256
  --max-tokens 6016
  -m "${model_dir}"
  --sliding-window 2048
  --tokens-step 384
  --aggressive-memory
  --original
  --awq
  --comment "${run_tag}"
  --apply_hardmard
  --no_pi
)

python perplexity_yarn.py "${ppl_args[@]}"