DEFAULT_GRAPH_PAD_ID = -500 

# Mistral format
MISTRAL_BOS = '<s>[INST]'
MISTRAL_EOS_USER = '[/INST]'
MISTRAL_EOS = '</s>'

# Llama3 format  
LLAMA3_BOS = '<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\n'
LLAMA3_EOS_USER = '<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n'
LLAMA3_EOS = '<|eot_id|>'

# Default (Mistral) for backward compatibility
BOS = MISTRAL_BOS
EOS_USER = MISTRAL_EOS_USER
EOS = MISTRAL_EOS

IGNORE_INDEX = -100 
DEFAULT_G_START_TOKEN = "<g_start>"
DEFAULT_G_END_TOKEN = "<g_end>"
UNKNOW = "Unkown Label"

def get_model_tokens(model_name):
    """Get appropriate tokens based on model name"""
    if "Llama" in model_name or "llama" in model_name:
        return LLAMA3_BOS, LLAMA3_EOS_USER, LLAMA3_EOS
    else:  # Default to Mistral format
        return MISTRAL_BOS, MISTRAL_EOS_USER, MISTRAL_EOS
