"""Load the Llama-2-7B tokenizer and causal-LM weights via ``transformers``.

Files fetched for ``repo_id`` are cached under ``local_dir``.  The access
token is read from the environment instead of being stored in this file.
"""

import os

import torch
from transformers import LlamaForCausalLM, LlamaTokenizer

# Hub repository to load and the directory used as the download cache.
repo_id = "meta-llama/Llama-2-7b-hf"
local_dir = "../cache/models/llama-2-7b"

# SECURITY: never commit an access token to source control.  Export it as
# HF_TOKEN (or the legacy HUGGING_FACE_HUB_TOKEN) before running this script.
# Any token that was previously hard-coded in this file should be treated as
# leaked and revoked.
# An unset or empty variable yields None, which leaves credential lookup to
# the library's default behaviour (e.g. a cached CLI login).
token = (
    os.environ.get("HF_TOKEN")
    or os.environ.get("HUGGING_FACE_HUB_TOKEN")
    or None
)

# To load from a local checkpoint instead, replace `repo_id` below with the
# path to the model directory.
tokenizer = LlamaTokenizer.from_pretrained(
    repo_id,
    cache_dir=local_dir,
    token=token,
)

# Weights are loaded in half precision (float16).
model = LlamaForCausalLM.from_pretrained(
    repo_id,
    torch_dtype=torch.float16,
    cache_dir=local_dir,
    token=token,
)