# Model constants: integer ids.

# NOTE(review): -100 matches the default ``ignore_index`` of PyTorch's
# cross-entropy loss, so this is presumably the label value used to mask
# positions out of the loss — confirm at the call site.
IGNORE_INDEX: int = -100

# NOTE(review): presumably the tokenizer vocabulary ids of the image / video
# placeholder tokens — verify against the tokenizer actually in use.
IMAGE_TOKEN_INDEX: int = 151655
VIDEO_TOKEN_INDEX: int = 151656

# Traditional placeholders marking where an image or a video sits in the
# training data.
DEFAULT_IMAGE_TOKEN: str = "<image>"
DEFAULT_VIDEO_TOKEN: str = "<video>"

# Special-token strings for vision inputs.
# NOTE(review): the start/end pair presumably brackets a run of vision
# placeholder tokens — confirm against the prompt-building code.
VISION_START_TOKEN: str = "<|vision_start|>"
VISION_END_TOKEN: str = "<|vision_end|>"
VISION_TOKEN: str = "<|vision_pad|>"

# Placeholder emitted for each image token feature.
IMAGE_TOKEN: str = "<|image_pad|>"
# Placeholder emitted for each video token feature.
VIDEO_TOKEN: str = "<|video_pad|>"
