from transformers import AutoModelForCausalLM, AutoTokenizer, AutoConfig
import torch

def load_model_and_tokenizer(model_name, device, cache_dir="./cache", local_files_only=False):
    model = AutoModelForCausalLM.from_pretrained(
        model_name,
        torch_dtype=torch.float32,
        cache_dir=cache_dir,
        local_files_only=local_files_only,
    ).to(device)

    model.eval()

    tokenizer = AutoTokenizer.from_pretrained(
        model_name,
        cache_dir=cache_dir,
        local_files_only=local_files_only,
        max_length=model.config.max_position_embeddings, # TODO: Fallback if not set?
    )
    
    # Auto-set padding side based on model type
    config = AutoConfig.from_pretrained(model_name, cache_dir=cache_dir, local_files_only=local_files_only)
    is_decoder_only = not config.is_encoder_decoder
    tokenizer.padding_side = "left" if is_decoder_only else "right"

    if tokenizer.pad_token is None:
        tokenizer.add_special_tokens({'pad_token': '[PAD]'})
        model.resize_token_embeddings(len(tokenizer))

    return model, tokenizer