# Model and text-generation settings.
# NOTE(review): the per-key notes below are inferred from the key names and
# values only; confirm them against the code that loads this file.

# Model identifier; presumably a Hugging Face Hub repository id.
name: 'meta-llama/Llama-2-7b-chat-hf'
# Presumably loads/runs the model in half precision (fp16) - TODO confirm.
use_fp16: true
# Presumably toggles FlashAttention-2 kernels; disabled here.
use_flashattn2: false

# Length limits for the prompt and the generated response.
# Units are presumably tokens, not characters - TODO confirm.
prompt_max_len: 800
response_max_len: 800

# Decoding settings. Presumably a beam count of 1 means no beam search, with
# sampling enabled at the given temperature - verify against the consumer.
n_beams: 1
use_sampling: true
sampling_temp: 0.7
