mirror of
https://github.com/open-mmlab/mmsegmentation.git
synced 2025-06-03 22:03:48 +08:00
205 lines
7.0 KiB
Python
205 lines
7.0 KiB
Python
|
# Copyright (c) OpenMMLab. All rights reserved.
|
||
|
|
||
|
# Source: https://github.com/openai/CLIP.
|
||
|
|
||
|
# Full list of prompt templates. Every entry contains exactly one positional
# `{}` placeholder (presumably filled with a class name via `str.format` --
# confirm against callers). The strings are kept verbatim, including
# ungrammatical ones such as 'a origami {}.', because changing the text
# changes what is fed to the text encoder.
IMAGENET_TEMPLATES = [
    'a bad photo of a {}.',
    'a photo of many {}.',
    'a sculpture of a {}.',
    'a photo of the hard to see {}.',
    'a low resolution photo of the {}.',
    'a rendering of a {}.',
    'graffiti of a {}.',
    'a bad photo of the {}.',
    'a cropped photo of the {}.',
    'a tattoo of a {}.',
    'the embroidered {}.',
    'a photo of a hard to see {}.',
    'a bright photo of a {}.',
    'a photo of a clean {}.',
    'a photo of a dirty {}.',
    'a dark photo of the {}.',
    'a drawing of a {}.',
    'a photo of my {}.',
    'the plastic {}.',
    'a photo of the cool {}.',
    'a close-up photo of a {}.',
    'a black and white photo of the {}.',
    'a painting of the {}.',
    'a painting of a {}.',
    'a pixelated photo of the {}.',
    'a sculpture of the {}.',
    'a bright photo of the {}.',
    'a cropped photo of a {}.',
    'a plastic {}.',
    'a photo of the dirty {}.',
    'a jpeg corrupted photo of a {}.',
    'a blurry photo of the {}.',
    'a photo of the {}.',
    'a good photo of the {}.',
    'a rendering of the {}.',
    'a {} in a video game.',
    'a photo of one {}.',
    'a doodle of a {}.',
    'a close-up photo of the {}.',
    'a photo of a {}.',
    'the origami {}.',
    'the {} in a video game.',
    'a sketch of a {}.',
    'a doodle of the {}.',
    'a origami {}.',
    'a low resolution photo of a {}.',
    'the toy {}.',
    'a rendition of the {}.',
    'a photo of the clean {}.',
    'a photo of a large {}.',
    'a rendition of a {}.',
    'a photo of a nice {}.',
    'a photo of a weird {}.',
    'a blurry photo of a {}.',
    'a cartoon {}.',
    'art of a {}.',
    'a sketch of the {}.',
    'a embroidered {}.',
    'a pixelated photo of a {}.',
    'itap of the {}.',
    'a jpeg corrupted photo of the {}.',
    'a good photo of a {}.',
    'a plushie {}.',
    'a photo of the nice {}.',
    'a photo of the small {}.',
    'a photo of the weird {}.',
    'the cartoon {}.',
    'art of the {}.',
    'a drawing of the {}.',
    'a photo of the large {}.',
    'a black and white photo of a {}.',
    'the plushie {}.',
    'a dark photo of a {}.',
    'itap of a {}.',
    'graffiti of the {}.',
    'a toy {}.',
    'itap of my {}.',
    'a photo of a cool {}.',
    'a photo of a small {}.',
    'a tattoo of the {}.',
    # 'A photo of a {} in the scene.',
]
|
||
|
|
||
|
# v1: 59.0875
# NOTE(review): the figure above looks like a recorded score for this
# selection -- the metric and dataset are not stated here; confirm.
# Short list of prompt templates, each with one positional `{}` placeholder.
# The last entry has no trailing period, unlike the others; kept verbatim.
IMAGENET_TEMPLATES_SELECT = [
    'itap of a {}.',
    'a bad photo of the {}.',
    'a origami {}.',
    'a photo of the large {}.',
    'a {} in a video game.',
    'art of the {}.',
    'a photo of the small {}.',
    'A photo of a {} in the scene',
]
|
||
|
|
||
|
# v9
# Prompt templates, each with one positional `{}` placeholder. The list is
# grouped as: four generic photo prompts, "This is a [masked|cropped] photo
# of a [small|medium|large] {}" variants, and "... in the scene" variants.
# Strings are kept verbatim (the mixed capitalization and missing trailing
# periods are as in the original).
IMAGENET_TEMPLATES_SELECT_CLIP = [
    'a bad photo of the {}.',
    'a photo of the large {}.',
    'a photo of the small {}.',
    'a cropped photo of a {}.',
    'This is a photo of a {}',
    'This is a photo of a small {}',
    'This is a photo of a medium {}',
    'This is a photo of a large {}',
    'This is a masked photo of a {}',
    'This is a masked photo of a small {}',
    'This is a masked photo of a medium {}',
    'This is a masked photo of a large {}',
    'This is a cropped photo of a {}',
    'This is a cropped photo of a small {}',
    'This is a cropped photo of a medium {}',
    'This is a cropped photo of a large {}',
    'A photo of a {} in the scene',
    'a bad photo of the {} in the scene',
    'a photo of the large {} in the scene',
    'a photo of the small {} in the scene',
    'a cropped photo of a {} in the scene',
    'a photo of a masked {} in the scene',
    'There is a {} in the scene',
    'There is the {} in the scene',
    'This is a {} in the scene',
    'This is the {} in the scene',
    'This is one {} in the scene',
    'There is a masked {} in the scene',
    'There is the masked {} in the scene',
    'This is a masked {} in the scene',
    'This is the masked {} in the scene',
    'This is one masked {} in the scene',
]
|
||
|
|
||
|
# v10, for comparison
# IMAGENET_TEMPLATES_SELECT_CLIP = [
#     'a photo of a {}.',
#
#     'This is a photo of a {}',
#     'This is a photo of a small {}',
#     'This is a photo of a medium {}',
#     'This is a photo of a large {}',
#
#     'This is a photo of a {}',
#     'This is a photo of a small {}',
#     'This is a photo of a medium {}',
#     'This is a photo of a large {}',
#
#     'a photo of a {} in the scene',
#     'a photo of a {} in the scene',
#
#     'There is a {} in the scene',
#     'There is the {} in the scene',
#     'This is a {} in the scene',
#     'This is the {} in the scene',
#     'This is one {} in the scene',
# ]
|
||
|
|
||
|
ViLD_templates = [
|
||
|
'There is {article} {category} in the scene.',
|
||
|
'There is the {category} in the scene.',
|
||
|
'a photo of {article} {category} in the scene.',
|
||
|
'a photo of the {category} in the scene.',
|
||
|
'a photo of one {category} in the scene.', 'itap of {article} {category}.',
|
||
|
'itap of my {category}.', 'itap of the {category}.',
|
||
|
'a photo of {article} {category}.', 'a photo of my {category}.',
|
||
|
'a photo of the {category}.', 'a photo of one {category}.',
|
||
|
'a photo of many {category}.', 'a good photo of {article} {category}.',
|
||
|
'a good photo of the {category}.', 'a bad photo of {article} {category}.',
|
||
|
'a bad photo of the {category}.', 'a photo of a nice {category}.',
|
||
|
'a photo of the nice {category}.', 'a photo of a cool {category}.',
|
||
|
'a photo of the cool {category}.', 'a photo of a weird {category}.',
|
||
|
'a photo of the weird {category}.', 'a photo of a small {category}.',
|
||
|
'a photo of the small {category}.', 'a photo of a large {category}.',
|
||
|
'a photo of the large {category}.', 'a photo of a clean {category}.',
|
||
|
'a photo of the clean {category}.', 'a photo of a dirty {category}.',
|
||
|
'a photo of the dirty {category}.',
|
||
|
'a bright photo of {article} {category}.',
|
||
|
'a bright photo of the {category}.',
|
||
|
'a dark photo of {article} {category}.', 'a dark photo of the {category}.',
|
||
|
'a photo of a hard to see {category}.',
|
||
|
'a photo of the hard to see {category}.',
|
||
|
'a low resolution photo of {article} {category}.',
|
||
|
'a low resolution photo of the {category}.',
|
||
|
'a cropped photo of {article} {category}.',
|
||
|
'a cropped photo of the {category}.',
|
||
|
'a close-up photo of {article} {category}.',
|
||
|
'a close-up photo of the {category}.',
|
||
|
'a jpeg corrupted photo of {article} {category}.',
|
||
|
'a jpeg corrupted photo of the {category}.',
|
||
|
'a blurry photo of {article} {category}.',
|
||
|
'a blurry photo of the {category}.',
|
||
|
'a pixelated photo of {article} {category}.',
|
||
|
'a pixelated photo of the {category}.',
|
||
|
'a black and white photo of the {category}.',
|
||
|
'a black and white photo of {article} {category}.',
|
||
|
'a plastic {category}.', 'the plastic {category}.', 'a toy {category}.',
|
||
|
'the toy {category}.', 'a plushie {category}.', 'the plushie {category}.',
|
||
|
'a cartoon {category}.', 'the cartoon {category}.',
|
||
|
'an embroidered {category}.', 'the embroidered {category}.',
|
||
|
'a painting of the {category}.', 'a painting of a {category}.'
|
||
|
]
|