# mmpretrain/configs/chinese_clip/metafile.yml
# 80 lines, 2.9 KiB, YAML

# Collection entry referenced by the Chinese CLIP model entries through their
# `In Collection` field.
Collections:
- Name: ChineseCLIP
  Metadata:
    # Training datasets recorded for the collection.
    Training Data:
    - LAION-5B
    - WuKong
    - VisualGenome
    - MSCOCO
    Architecture:
    - Transformer
  Paper:
    # Quoted because the title contains ": ", which a plain scalar would
    # treat as a mapping separator.
    Title: 'Chinese CLIP: Contrastive Vision-Language Pretraining in Chinese'
    URL: https://arxiv.org/abs/2211.01335
  README: configs/chinese_clip/README.md
Models:
# ResNet-50 entry; the config name indicates zero-shot classification on
# CIFAR100.
- Name: cn-clip_resnet50_zeroshot-cls_cifar100
  Metadata:
    # FLOPs are not recorded for this entry.
    FLOPs: null
    Parameters: 77000000
  In Collection: ChineseCLIP
  Results:
  - Task: Image Classification
    Dataset: CIFAR100
    Metrics:
      Top 1 Accuracy: 40.7
  Weights: https://download.openmmlab.com/mmpretrain/v1.0/chinese_clip/cn-clip_resnet50_3rdparty_20230519-6a2b3eb2.pth
  Config: configs/chinese_clip/cn-clip_resnet50_zeroshot-cls_cifar100.py
  # Upstream checkpoint and code that the weights above were converted from.
  Converted From:
    Weights: https://clip-cn-beijing.oss-cn-beijing.aliyuncs.com/checkpoints/clip_cn_rn50.pt
    Code: https://github.com/OFA-Sys/Chinese-CLIP
# vit-base-p16 entry; the config name indicates zero-shot classification on
# CIFAR100.
- Name: cn-clip_vit-base-p16_zeroshot-cls_cifar100
  Metadata:
    # FLOPs are not recorded for this entry.
    FLOPs: null
    Parameters: 188000000
  In Collection: ChineseCLIP
  Results:
  - Task: Image Classification
    Dataset: CIFAR100
    Metrics:
      Top 1 Accuracy: 64.5
  Weights: https://download.openmmlab.com/mmpretrain/v1.0/chinese_clip/cn-clip_vit-base-p16_3rdparty_20230519-37fbc59e.pth
  Config: configs/chinese_clip/cn-clip_vit-base-p16_zeroshot-cls_cifar100.py
  # Upstream checkpoint and code that the weights above were converted from.
  Converted From:
    Weights: https://clip-cn-beijing.oss-cn-beijing.aliyuncs.com/checkpoints/clip_cn_vit-b-16.pt
    Code: https://github.com/OFA-Sys/Chinese-CLIP
# vit-large-p14 entry; the config name indicates zero-shot classification on
# CIFAR100.
- Name: cn-clip_vit-large-p14_zeroshot-cls_cifar100
  Metadata:
    # FLOPs are not recorded for this entry.
    FLOPs: null
    Parameters: 406000000
  In Collection: ChineseCLIP
  Results:
  - Task: Image Classification
    Dataset: CIFAR100
    Metrics:
      Top 1 Accuracy: 74.8
  Weights: https://download.openmmlab.com/mmpretrain/v1.0/chinese_clip/cn-clip_vit-large-p14_3rdparty_20230519-3f844503.pth
  Config: configs/chinese_clip/cn-clip_vit-large-p14_zeroshot-cls_cifar100.py
  # Upstream checkpoint and code that the weights above were converted from.
  Converted From:
    Weights: https://clip-cn-beijing.oss-cn-beijing.aliyuncs.com/checkpoints/clip_cn_vit-l-14.pt
    Code: https://github.com/OFA-Sys/Chinese-CLIP
# vit-huge-p14 entry; the config name indicates zero-shot classification on
# CIFAR100.
- Name: cn-clip_vit-huge-p14_zeroshot-cls_cifar100
  Metadata:
    # FLOPs are not recorded for this entry.
    FLOPs: null
    Parameters: 958000000
  In Collection: ChineseCLIP
  Results:
  - Task: Image Classification
    Dataset: CIFAR100
    Metrics:
      Top 1 Accuracy: 79.1
  Weights: https://download.openmmlab.com/mmpretrain/v1.0/chinese_clip/cn-clip_vit-huge-p14_3rdparty_20230519-e4f49b00.pth
  Config: configs/chinese_clip/cn-clip_vit-huge-p14_zeroshot-cls_cifar100.py
  # Upstream checkpoint and code that the weights above were converted from.
  Converted From:
    Weights: https://clip-cn-beijing.oss-cn-beijing.aliyuncs.com/checkpoints/clip_cn_vit-h-14.pt
    Code: https://github.com/OFA-Sys/Chinese-CLIP