---
# Run configuration. Keys set to null carry no explicit value in this file;
# how the consumer treats a null is not visible from here.

# Dataset and model selection.
dataset: ruler
# Quoted on purpose: loads as the string '4096', not the integer 4096.
data_dir: '4096'
model: meta-llama/Meta-Llama-3.1-8B-Instruct
device: null

# Press selection and its numeric settings.
press_name: adakv_manifold_kv
# The same 0.25 is repeated as compression_ratio= inside press_init_command.
# NOTE(review): presumably the two must be kept in sync -- confirm.
compression_ratio: 0.25
key_channel_compression_ratio: null
fraction: 0.01

# Length and generation limits.
max_new_tokens: null
# Integer here, unlike the quoted data_dir string above.
max_context_length: 4096
query_aware: false
needle_depth: null
compression_interval: null
target_size: null
hidden_states_buffer_size: null

# Output location and logging.
output_dir: ./icml_results/validation
log_level: INFO

# Nested mapping of model options.
# NOTE(review): presumably forwarded to the model loader -- confirm.
model_kwargs:
  attn_implementation: flash_attention_2
  dtype: auto
  device_map: auto

# Folded block scalar (>-): the two lines below are joined with a single
# space into one string, and no trailing newline is kept.
press_init_command: >-
  AdaKVPress(press=ManifoldKVSnapKVScorerPress(compression_ratio=0.25,
  distance_metric='l2'), alpha_safeguard=0.2)
seed: 42
