# The 23 base prompt prefixes. Every prefix stops right before the noun
# (presumably the caller appends a class name -- confirm at the use site).
_PHOTO_PREFIXES = [
    "a photo of a",
    "a rendering of a",
    "a cropped photo of the",
    "the photo of a",
    "a photo of a clean",
    "a photo of a dirty",
    "a dark photo of the",
    "a close-up photo of a",
    "a bright photo of the",
    "a cropped photo of a",
    "a photo of the",
    "a good photo of the",
    "a photo of one",
    "a close-up photo of the",
    "a rendition of the",
    "a photo of the clean",
    "a rendition of a",
    "a photo of a nice",
    "a good photo of a",
    "a photo of the nice",
    "a photo of the small",
    "a photo of the large",
    "a photo of a small",
]

# Three passes over the base prefixes, in order: unchanged, then with a leading
# "a photo of" swapped for "an illustration of", then for "a depiction of".
# Prefixes that do not start with "a photo of" (e.g. "a rendering of a") are
# carried over untouched on every pass, so each of them occurs three times in
# the resulting 69-entry list.
IMAGENET_CLIP_TEMPLATES = [
    lead + prefix[len("a photo of"):] if prefix.startswith("a photo of") else prefix
    for lead in ("a photo of", "an illustration of", "a depiction of")
    for prefix in _PHOTO_PREFIXES
]

# Imperative instruction prefixes of the form "<verb> it into a", one per verb,
# in the order listed. Each prefix stops right before the noun.
INSTRUCT_PREFIX_TEMPLATES = [
    verb + " it into a"
    for verb in ("turn", "transform", "change", "convert", "alter", "make")
]


# Class labels (18 animal names). Order is preserved from the original
# definition; note that "polar bear" is a single two-word label.
CLIP_CLASSES = [
    "elephant", "giraffe", "tiger", "kangaroo", "panda", "koala",
    "zebra", "hippopotamus", "rhinoceros", "polar bear", "penguin", "dolphin",
    "eagle", "owl", "crocodile", "gorilla", "wolf", "fox",
]
