from transformers import AutoModelForCausalLM, AutoTokenizer

def load_model_and_tokenizer(model_name):

    model = AutoModelForCausalLM.from_pretrained(
        model_name,
        device_map="auto"
    )
    model.config.use_cache = False
    model.config.pretraining_tp = 1

    tokenizer = AutoTokenizer.from_pretrained(model_name, 
                                              trust_remote_code=True)
    
        # Add special tokens if they don't exist
    special_tokens = {}
    if tokenizer.pad_token is None:
        special_tokens['pad_token'] = '<|endoftext|>'
    if tokenizer.bos_token is None:
        special_tokens['bos_token'] = '<s>'
    if tokenizer.eos_token is None:
        special_tokens['eos_token'] = '</s>'
    
    if special_tokens:
        tokenizer.add_special_tokens(special_tokens)
        # Resize model embeddings to match new tokenizer size
        model.resize_token_embeddings(len(tokenizer))
    
    tokenizer.padding_side = 'right'

    return model, tokenizer