# NaViL-2B / constants.py
# Changyao's picture
# Upload folder using huggingface_hub
# 20f5bc9 verified
# ---------------------------------------------------------------------------
# Special-token string literals.
# Start/end pairs are bound together so the two halves of each tag stay
# side by side.
# ---------------------------------------------------------------------------
IMG_START_TOKEN, IMG_END_TOKEN = '<img>', '</img>'
QUAD_START_TOKEN, QUAD_END_TOKEN = '<quad>', '</quad>'
REF_START_TOKEN, REF_END_TOKEN = '<ref>', '</ref>'
BOX_START_TOKEN, BOX_END_TOKEN = '<box>', '</box>'

# Stand-alone (unpaired) image-related tokens.
IMG_CONTEXT_TOKEN = '<IMG_CONTEXT>'
IMG_LINE_BREAK_TOKEN = '<IMG_LINE_BREAK>'
IMG_FRAME_BREAK_TOKEN = '<IMG_FRAME_BREAK>'
IMG_UNCOND_TOKEN = '<img_uncond>'

# ---------------------------------------------------------------------------
# Three-component (mean, std) tuples, one pair per name prefix.
# NOTE(review): presumably per-channel image-normalization statistics for the
# corresponding encoders -- confirm against the preprocessing code.
# ---------------------------------------------------------------------------
IMAGENET_MEAN, IMAGENET_STD = (0.485, 0.456, 0.406), (0.229, 0.224, 0.225)
CLIP_MEAN, CLIP_STD = (
    (0.4814546, 0.4578275, 0.40821073),
    (0.2686295, 0.2613025, 0.2757711),
)
SIGLIP_MEAN, SIGLIP_STD = (0.5, 0.5, 0.5), (0.5, 0.5, 0.5)
VAE_MEAN, VAE_STD = (0.5, 0.5, 0.5), (0.5, 0.5, 0.5)

# Every token constant defined above, gathered into a single list.
# NOTE(review): the ordering is kept exactly as it was, since consumers may
# depend on it (e.g. if ids are assigned positionally) -- verify before
# reordering.
SPECIAL_TOKEN_LIST = [
    BOX_END_TOKEN,
    BOX_START_TOKEN,
    IMG_CONTEXT_TOKEN,
    IMG_END_TOKEN,
    IMG_START_TOKEN,
    QUAD_END_TOKEN,
    QUAD_START_TOKEN,
    REF_END_TOKEN,
    REF_START_TOKEN,
    IMG_UNCOND_TOKEN,
    IMG_LINE_BREAK_TOKEN,
    IMG_FRAME_BREAK_TOKEN,
]