#!/bin/bash

# Launches perplexity_yarn.py with a fixed experiment configuration.
# The argument vector is assembled in an array so each group of options can be
# annotated; the order and values handed to the Python script are unchanged.
# Flag meanings are defined by perplexity_yarn.py (not visible here), so the
# grouping below is by flag name only.

# Comma-separated index list passed to --individual_channel_up.
# NOTE(review): the list holds 40 entries while the --comment tag below ends in
# "top31" — confirm which of the two is intended.
channel_list="124,90,62,52,86,108,118,75,114,120,50,93,115,73,58,81,80,94,89,69,63,51,46,106,107,84,44,42,123,68,88,15,6,28,12,17,1,20,8,35"

run_args=(
  # Input data and sample selection.
  --tokenized output/govreport-test-tokenized-awq
  --dataset-min-tokens 20384
  --samples 10

  # Where results are written (path is relative to the current directory).
  --output-file ppl_results/new_embedding_only/per_head_individual_channel_all_attention_negtive

  # Token range and model location.
  --min-tokens 256
  --max-tokens 19456
  -m /home/yeq6/Research_project/llama/llama-2-7b-chat_hf

  # AWQ cache file.
  --awq_cache llm-awq/awq_cache/llama2-7b-w4-g128_mine.pt

  # Evaluation window / stepping / YaRN options.
  --beta_point 1287
  --sliding-window 2048
  --tokens-step 384
  --aggressive-memory
  --yarn 8

  # Model-variant switches.
  --original
  --custom-model
  --original-max-position-embeddings 2048
  --awq
  --rescale_per_head

  # Per-channel settings and the free-form run label.
  --individual_channel_up "${channel_list}"
  --comment per_head_all_attention_individual_channel_negtive_top31
  --rescale_attention_all
  --individual_channel_scale 2
)

python perplexity_yarn.py "${run_args[@]}"