from transformers import AutoTokenizer

# Hugging Face model identifier whose tokenizer is inspected.
model_name = "liuhaotian/llava-v1.5-7b"
# Sample input made of digit groups of different lengths (including groups
# with leading zeros), used to see how numbers get split into tokens.
text = "123123213 423423 00 000 100 42 81 1 22"


def main() -> None:
    """Print how the tokenizer splits ``text``, then pause in a debugger.

    Loads the tokenizer for ``model_name`` via
    ``AutoTokenizer.from_pretrained``, prints the token list produced by
    ``tokenizer.tokenize(text)`` and finally calls the built-in
    ``breakpoint()`` so ``tokenizer`` and ``tokens`` can be inspected
    interactively.

    The debugger is selected through the ``PYTHONBREAKPOINT`` environment
    variable (PEP 553): set it to ``ipdb.set_trace`` to use ipdb, or to
    ``0`` to skip the stop entirely (e.g. for non-interactive runs).
    """
    tokenizer = AutoTokenizer.from_pretrained(
        model_name,
        padding_side="right",
        use_fast=False,
    )
    # Keep the result in a local so it is available inside the debugger.
    tokens = tokenizer.tokenize(text)
    print(tokens)
    # Built-in hook instead of a hard-coded ipdb import: works without ipdb
    # installed and can be redirected or disabled via PYTHONBREAKPOINT.
    breakpoint()


# Run only when executed as a script, so importing this module does not load
# the tokenizer or open a debugger.
if __name__ == "__main__":
    main()
