# pytorch-image-models/timm/models/_pretrained.py

import copy
from collections import deque, defaultdict
from dataclasses import dataclass, field, replace, asdict
from typing import Any, Deque, Dict, Tuple, Optional, Union


# Names exported by `from <this module> import *`.
__all__ = [
    'PretrainedCfg',
    'filter_pretrained_cfg',
    'DefaultCfg',
    'split_model_name_tag',
    'generate_default_cfgs',
]


@dataclass
class PretrainedCfg:
    """Configuration record for one set of pretrained weights.

    Groups the weight location(s), the input / data settings, the
    head / classifier metadata and free-form descriptive metadata.
    Every field has a default, so an instance can be built from any subset
    of keyword arguments.
    """
    # weight locations
    url: Optional[Union[str, Tuple[str, str]]] = None
    file: Optional[str] = None
    hf_hub_id: Optional[str] = None
    hf_hub_filename: Optional[str] = None

    source: Optional[str] = None  # source of cfg / weight location used (url, file, hf-hub)
    architecture: Optional[str] = None  # architecture variant can be set when not implicit
    tag: Optional[str] = None  # pretrained tag of source
    custom_load: bool = False  # use custom model specific model.load_pretrained() (ie for npz files)

    # input / data config
    input_size: Tuple[int, int, int] = (3, 224, 224)
    test_input_size: Optional[Tuple[int, int, int]] = None
    min_input_size: Optional[Tuple[int, int, int]] = None
    fixed_input_size: bool = False
    interpolation: str = 'bicubic'
    crop_pct: float = 0.875
    test_crop_pct: Optional[float] = None
    crop_mode: str = 'center'
    mean: Tuple[float, ...] = (0.485, 0.456, 0.406)
    std: Tuple[float, ...] = (0.229, 0.224, 0.225)

    # head / classifier config and meta-data
    num_classes: int = 1000
    label_offset: Optional[int] = None
    label_names: Optional[Tuple[str, ...]] = None  # variable-length tuple of names
    label_descriptions: Optional[Dict[str, str]] = None

    # model attributes that vary with above or required for pretrained adaptation
    pool_size: Optional[Tuple[int, ...]] = None
    test_pool_size: Optional[Tuple[int, ...]] = None
    first_conv: Optional[str] = None
    classifier: Optional[str] = None

    # descriptive metadata
    license: Optional[str] = None
    description: Optional[str] = None
    origin_url: Optional[str] = None
    paper_name: Optional[str] = None
    paper_ids: Optional[Union[str, Tuple[str, ...]]] = None
    notes: Optional[Tuple[str, ...]] = None

    @property
    def has_weights(self):
        """Truthy when any of ``url``, ``file`` or ``hf_hub_id`` is set.

        The result is the first truthy value among those three fields (not a
        strict ``bool``); when none is set, the falsy ``hf_hub_id`` value is
        returned. ``hf_hub_filename`` alone does not count as a weight source.
        """
        return self.url or self.file or self.hf_hub_id

    def to_dict(self, remove_source=False, remove_null=True):
        """Return the fields as a plain dict, filtered by ``filter_pretrained_cfg``.

        Args:
            remove_source: Forwarded to ``filter_pretrained_cfg``; when true the
                weight location / source keys are left out.
            remove_null: Forwarded to ``filter_pretrained_cfg``; when true keys
                whose value is ``None`` are left out, apart from the keys that
                function always keeps.

        Returns:
            The filtered ``dict`` produced from ``asdict(self)``.
        """
        return filter_pretrained_cfg(
            asdict(self),
            remove_source=remove_source,
            remove_null=remove_null
        )


def filter_pretrained_cfg(cfg, remove_source=False, remove_null=True):
    """Return a filtered copy of a pretrained cfg dict.

    Args:
        cfg: Mapping of cfg key -> value. It is not modified.
        remove_source: When true, drop the weight location / source keys
            (``url``, ``file``, ``hf_hub_id``, ``hf_hub_filename``, ``source``).
        remove_null: When true, drop keys whose value is ``None``, except
            ``pool_size``, ``first_conv`` and ``classifier`` which are always kept.

    Returns:
        A new ``dict`` with the surviving items in their original order.
    """
    source_keys = {'url', 'file', 'hf_hub_id', 'hf_hub_filename', 'source'}
    keep_null = {'pool_size', 'first_conv', 'classifier'}  # always keep these keys, even if none
    filtered_cfg = {}
    for k, v in cfg.items():
        if remove_source and k in source_keys:
            continue
        if remove_null and v is None and k not in keep_null:
            continue
        filtered_cfg[k] = v
    return filtered_cfg


@dataclass
class DefaultCfg:
    """Pretrained configs held for one model, keyed by tag, with a tag ordering."""
    # tags in priority order; the left-most tag is the default
    tags: Deque[str] = field(default_factory=deque)
    # tag -> pretrained cfg
    cfgs: Dict[str, PretrainedCfg] = field(default_factory=dict)
    # True once at least one of the configs has a pretrained source set
    is_pretrained: bool = False

    @property
    def default(self):
        """The cfg stored under the first tag (IndexError if there are no tags)."""
        head_tag = self.tags[0]
        return self.cfgs[head_tag]

    @property
    def default_with_tag(self):
        """``(tag, cfg)`` pair for the first tag (IndexError if there are no tags)."""
        return self.tags[0], self.cfgs[self.tags[0]]


def split_model_name_tag(model_name: str, no_tag=''):
    """Split ``'model.tag'`` at the first ``'.'`` into ``(model, tag)``.

    When ``model_name`` contains no ``'.'``, ``no_tag`` is returned as the tag.
    Everything after the first ``'.'`` (including further dots) is the tag.
    """
    base, dot, suffix = model_name.partition('.')
    if not dot:
        # no separator present -> caller-supplied placeholder tag
        return base, no_tag
    return base, suffix


def generate_default_cfgs(cfgs: Dict[str, Union[Dict[str, Any], PretrainedCfg]]):
    """Group ``'model.tag'`` keyed cfgs into one ``DefaultCfg`` per model name.

    Plain ``dict`` values are converted with ``PretrainedCfg(**value)``. For each
    entry the tag is placed in the model's tag deque as follows:

    * front, and the model is marked as having its default set, when the entry
      has weights and no tag, or when the tag ends with ``*`` and the model has
      not been marked yet;
    * front, when the entry has weights and no earlier entry of the model had;
    * back otherwise.

    ``*`` characters are stripped from both ends of the tag before it is stored.

    Returns:
        ``defaultdict`` mapping model name -> ``DefaultCfg``.
    """
    registry = defaultdict(DefaultCfg)
    models_with_default = set()  # no tag and tags ending with * are prioritized as default

    for name, cfg in cfgs.items():
        if isinstance(cfg, dict):
            cfg = PretrainedCfg(**cfg)
        weights = cfg.has_weights

        arch, raw_tag = split_model_name_tag(name)
        # priority is decided on the raw tag, before the '*' marker is stripped
        starred_first = raw_tag.endswith('*') and arch not in models_with_default
        is_priority = (weights and not raw_tag) or starred_first
        clean_tag = raw_tag.strip('*')

        entry = registry[arch]

        if is_priority:
            entry.tags.appendleft(clean_tag)
            models_with_default.add(arch)
        elif weights and not entry.is_pretrained:
            # first entry with weights for this model moves ahead of weight-less ones
            entry.tags.appendleft(clean_tag)
        else:
            entry.tags.append(clean_tag)

        if weights:
            entry.is_pretrained = True

        entry.cfgs[clean_tag] = cfg

    return registry
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`import copy`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`from collections import deque, defaultdict`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`from dataclasses import dataclass, field, replace, asdict`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`from typing import Any, Deque, Dict, Tuple, Optional, Union`


Add a deprecation phase to module re-org 2022-12-10 06:39:45 +08:00			`__all__ = ['PretrainedCfg', 'filter_pretrained_cfg', 'DefaultCfg', 'split_model_name_tag', 'generate_default_cfgs']`


Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`@dataclass`
			`class PretrainedCfg:`
			`"""`
			`"""`
			`# weight locations`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`url: Optional[Union[str, Tuple[str, str]]] = None`
			`file: Optional[str] = None`
			`hf_hub_id: Optional[str] = None`
			`hf_hub_filename: Optional[str] = None`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`source: Optional[str] = None # source of cfg / weight location used (url, file, hf-hub)`
			`architecture: Optional[str] = None # architecture variant can be set when not implicit`
Update efficientnet.py and convnext.py to multi-weight, add ImageNet-12k pretrained EfficientNet-B5 and ConvNeXt-Nano. 2022-12-15 12:33:23 +08:00			`tag: Optional[str] = None # pretrained tag of source`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`custom_load: bool = False # use custom model specific model.load_pretrained() (ie for npz files)`

			`# input / data config`
			`input_size: Tuple[int, int, int] = (3, 224, 224)`
			`test_input_size: Optional[Tuple[int, int, int]] = None`
			`min_input_size: Optional[Tuple[int, int, int]] = None`
			`fixed_input_size: bool = False`
			`interpolation: str = 'bicubic'`
			`crop_pct: float = 0.875`
			`test_crop_pct: Optional[float] = None`
Add crop_mode for pretraind config / image transforms. Add support for dynamo compilation to benchmark/train/validate 2022-11-22 08:30:56 +08:00			`crop_mode: str = 'center'`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`mean: Tuple[float, ...] = (0.485, 0.456, 0.406)`
			`std: Tuple[float, ...] = (0.229, 0.224, 0.225)`

Improve support for custom dataset label name/description through HF hub export, via pretrained_cfg 2023-02-08 23:56:19 +08:00			`# head / classifier config and meta-data`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`num_classes: int = 1000`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`label_offset: Optional[int] = None`
Improve support for custom dataset label name/description through HF hub export, via pretrained_cfg 2023-02-08 23:56:19 +08:00			`label_names: Optional[Tuple[str]] = None`
			`label_descriptions: Optional[Dict[str, str]] = None`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00
			`# model attributes that vary with above or required for pretrained adaptation`
			`pool_size: Optional[Tuple[int, ...]] = None`
			`test_pool_size: Optional[Tuple[int, ...]] = None`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`first_conv: Optional[str] = None`
			`classifier: Optional[str] = None`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`license: Optional[str] = None`
Convert mobilenetv3 to multi-weight, tweak PretrainedCfg metadata 2022-12-17 01:29:13 +08:00			`description: Optional[str] = None`
			`origin_url: Optional[str] = None`
			`paper_name: Optional[str] = None`
			`paper_ids: Optional[Union[str, Tuple[str]]] = None`
			`notes: Optional[Tuple[str]] = None`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00
			`@property`
			`def has_weights(self):`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`return self.url or self.file or self.hf_hub_id`

			`def to_dict(self, remove_source=False, remove_null=True):`
			`return filter_pretrained_cfg(`
			`asdict(self),`
			`remove_source=remove_source,`
			`remove_null=remove_null`
			`)`


			`def filter_pretrained_cfg(cfg, remove_source=False, remove_null=True):`
			`filtered_cfg = {}`
Add FlexiViT models and weights, refactoring, push more weights * push all vision_transformer.py weights to HF hub finalize more pretrained tags for pushed weights * refactor pos_embed files and module locations, move some pos embed modules to layers * tweak hf hub helpers to aid bulk uploading and updating 2022-12-23 09:19:45 +08:00			`keep_null = {'pool_size', 'first_conv', 'classifier'} # always keep these keys, even if none`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`for k, v in cfg.items():`
			`if remove_source and k in {'url', 'file', 'hf_hub_id', 'hf_hub_id', 'hf_hub_filename', 'source'}:`
			`continue`
Add FlexiViT models and weights, refactoring, push more weights * push all vision_transformer.py weights to HF hub finalize more pretrained tags for pushed weights * refactor pos_embed files and module locations, move some pos embed modules to layers * tweak hf hub helpers to aid bulk uploading and updating 2022-12-23 09:19:45 +08:00			`if remove_null and v is None and k not in keep_null:`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`continue`
			`filtered_cfg[k] = v`
			`return filtered_cfg`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00

			`@dataclass`
			`class DefaultCfg:`
			`tags: Deque[str] = field(default_factory=deque) # priority queue of tags (first is default)`
			`cfgs: Dict[str, PretrainedCfg] = field(default_factory=dict) # pretrained cfgs by tag`
			`is_pretrained: bool = False # at least one of the configs has a pretrained source set`

			`@property`
			`def default(self):`
			`return self.cfgs[self.tags[0]]`

			`@property`
			`def default_with_tag(self):`
			`tag = self.tags[0]`
			`return tag, self.cfgs[tag]`


			`def split_model_name_tag(model_name: str, no_tag=''):`
			`model_name, *tag_list = model_name.split('.', 1)`
			`tag = tag_list[0] if tag_list else no_tag`
			`return model_name, tag`


Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`def generate_default_cfgs(cfgs: Dict[str, Union[Dict[str, Any], PretrainedCfg]]):`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`out = defaultdict(DefaultCfg)`
			`default_set = set() # no tag and tags ending with * are prioritized as default`

			`for k, v in cfgs.items():`
			`if isinstance(v, dict):`
			`v = PretrainedCfg(**v)`
			`has_weights = v.has_weights`

			`model, tag = split_model_name_tag(k)`
			`is_default_set = model in default_set`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`priority = (has_weights and not tag) or (tag.endswith('*') and not is_default_set)`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`tag = tag.strip('*')`

			`default_cfg = out[model]`

			`if priority:`
			`default_cfg.tags.appendleft(tag)`
			`default_set.add(model)`
Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`elif has_weights and not default_cfg.is_pretrained:`
Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`default_cfg.tags.appendleft(tag)`
			`else:`
			`default_cfg.tags.append(tag)`

Add ported Tensorflow MaxVit weights. Add a few more CLIP ViT fine-tunes. Tweak some model tag names. Improve model tag name sorting. Update HF hub push config layout. 2022-12-03 08:54:18 +08:00			`if has_weights:`
			`default_cfg.is_pretrained = True`

Initial multi-weight support, handled so old pretraing config handling co-exists with new tags. 2022-10-27 13:18:39 +08:00			`default_cfg.cfgs[tag] = v`

			`return out`