PaddleClas/ppcls/arch/__init__.py

#copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
#
#Licensed under the Apache License, Version 2.0 (the "License");
#you may not use this file except in compliance with the License.
#You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
#Unless required by applicable law or agreed to in writing, software
#distributed under the License is distributed on an "AS IS" BASIS,
#WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#See the License for the specific language governing permissions and
#limitations under the License.

import copy
import importlib

import paddle
import paddle.nn as nn
from paddle.jit import to_static
from paddle.static import InputSpec

from . import backbone, gears
from .backbone import *
from .gears import build_gear
from .utils import *
from ppcls.arch.backbone.base.theseus_layer import TheseusLayer
from ppcls.utils import logger
from ppcls.utils.save_load import load_dygraph_pretrain
from ppcls.arch.slim import prune_model, quantize_model
from ppcls.arch.distill.afd_attention import LinearTransformStudent, LinearTransformTeacher

__all__ = ["build_model", "RecModel", "DistillationModel", "AttentionModel"]


def build_model(config, mode="train"):
    """Instantiate the architecture described by ``config["Arch"]``.

    The ``Arch`` section is deep-copied before use, so the caller's config is
    not modified here. Its ``name`` entry selects a class exposed as an
    attribute of this module; ``use_sync_bn`` is consumed by this function and
    every remaining entry is passed to the class as a keyword argument.

    Args:
        config: Full configuration mapping. ``config["Arch"]`` is required;
            ``config["Global"]["image_shape"]`` is read for the FLOPs report.
        mode: Forwarded unchanged to ``quantize_model``.

    Returns:
        The constructed model (converted to sync batch norm when
        ``use_sync_bn`` is truthy).
    """
    arch_kwargs = copy.deepcopy(config["Arch"])
    arch_name = arch_kwargs.pop("name")
    sync_bn = arch_kwargs.pop("use_sync_bn", False)

    # Resolve the architecture class by name from this very module.
    this_module = importlib.import_module(__name__)
    arch_cls = getattr(this_module, arch_name)
    arch = arch_cls(**arch_kwargs)
    if sync_bn:
        arch = nn.SyncBatchNorm.convert_sync_batchnorm(arch)

    # Pruning / quantization are only attempted on TheseusLayer models.
    if isinstance(arch, TheseusLayer):
        prune_model(config, arch)
        quantize_model(config, arch, mode)

    logger.info("The FLOPs and Params of Arch:")
    try:
        # Only called for its reporting side effect; the return value is not
        # used. Any failure (including a missing image_shape) is downgraded
        # to a warning so model construction still succeeds.
        paddle.flops(arch, [1, *config["Global"]["image_shape"]])
    except Exception as e:
        logger.warning(
            f"An error occurred when calculating FLOPs and Params of Arch. Please check the Global.image_shape in config. The details of error is: {e}"
        )

    return arch


def apply_to_static(config, model):
    """Wrap ``model`` with ``to_static`` when ``Global.to_static`` is enabled.

    Args:
        config: Configuration mapping; only ``config['Global']`` is read
            (keys ``to_static`` and, optionally, ``image_shape``).
        model: The model to convert.

    Returns:
        ``model`` unchanged when ``to_static`` is absent or falsy, otherwise
        the result of ``to_static(model, input_spec=...)``.
    """
    global_cfg = config['Global']
    if not global_cfg.get('to_static', False):
        return model

    input_specs = None
    if 'image_shape' in config['Global']:
        # Leading None is prepended to the configured image shape
        # (presumably the batch dimension -- confirm against InputSpec docs).
        image_spec = InputSpec([None] + config['Global']['image_shape'])
        image_spec.stop_gradient = True
        input_specs = [image_spec]

    model = to_static(model, input_spec=input_specs)
    logger.info(
        "Successfully to apply @to_static with specs: {}".format(input_specs))
    return model


class RecModel(TheseusLayer):
    """Model composed of a backbone plus an optional neck and optional head.

    Keyword Args:
        Backbone: Mapping with a ``name`` entry selecting the backbone; all
            other entries are passed to it as keyword arguments.
        BackboneStopLayer: Optional mapping whose ``name`` is handed to
            ``backbone.stop_after``.
        Neck: Optional config passed to ``build_gear``.
        Head: Optional config passed to ``build_gear``.
    """

    def __init__(self, **config):
        super().__init__()
        # Pop "name" from a shallow copy: the nested "Backbone" mapping is
        # shared with the caller, and removing the key in place would make a
        # second construction from the same config fail with KeyError.
        backbone_config = dict(config["Backbone"])
        backbone_name = backbone_config.pop("name")
        # NOTE(review): eval() executes the configured name as an expression
        # in this module's namespace; the config must come from a trusted
        # source.
        self.backbone = eval(backbone_name)(**backbone_config)
        if "BackboneStopLayer" in config:
            backbone_stop_layer = config["BackboneStopLayer"]["name"]
            self.backbone.stop_after(backbone_stop_layer)

        self.neck = build_gear(config["Neck"]) if "Neck" in config else None
        self.head = build_gear(config["Head"]) if "Head" in config else None

    def forward(self, x, label=None):
        """Run backbone -> (neck) -> (head) and collect every stage's output.

        Args:
            x: Input passed to the backbone.
            label: Passed as the second positional argument to the head.

        Returns:
            dict with ``"backbone"`` and ``"features"`` always present,
            ``"neck"`` when a neck is configured and ``"logits"`` when a head
            is configured. ``"features"`` is the neck output if there is a
            neck, otherwise the backbone output.
        """
        out = dict()
        x = self.backbone(x)
        out["backbone"] = x
        if self.neck is not None:
            x = self.neck(x)
            out["neck"] = x
        out["features"] = x
        if self.head is not None:
            out["logits"] = self.head(x, label)
        return out


class DistillationModel(nn.Layer):
    """Container that builds several named sub-models and runs them together.

    Args:
        models: List of single-entry mappings ``{key: model_config}``. Each
            ``model_config`` has a ``name`` entry selecting the model; the
            remaining entries are passed to it as keyword arguments. ``key``
            is the name the sub-model is registered and reported under.
        pretrained_list: Optional list, same length as ``models``; a non-None
            entry is passed as ``path`` to ``load_dygraph_pretrain`` for the
            sub-model at the same index.
        freeze_params_list: Optional list, same length as ``models``; a
            truthy entry marks every parameter of that sub-model as
            non-trainable. Defaults to all ``False``.
        **kargs: Accepted and ignored.

    Raises:
        AssertionError: If ``models`` is not a list, a list length does not
            match ``len(models)``, or a ``models`` entry does not have
            exactly one key.
    """

    def __init__(self,
                 models=None,
                 pretrained_list=None,
                 freeze_params_list=None,
                 **kargs):
        super().__init__()
        assert isinstance(models, list)
        self.model_list = []
        self.model_name_list = []
        if pretrained_list is not None:
            assert len(pretrained_list) == len(models)

        if freeze_params_list is None:
            freeze_params_list = [False] * len(models)
        assert len(freeze_params_list) == len(models)
        for idx, model_entry in enumerate(models):
            assert len(model_entry) == 1
            key = next(iter(model_entry))
            # Copy before popping "name" so the caller's config is left
            # intact and can be reused to build the model again.
            model_config = dict(model_entry[key])
            model_name = model_config.pop("name")
            # NOTE(review): eval() executes the configured name as an
            # expression in this module's namespace; the config must come
            # from a trusted source.
            model = eval(model_name)(**model_config)

            if freeze_params_list[idx]:
                for param in model.parameters():
                    param.trainable = False
            self.model_list.append(self.add_sublayer(key, model))
            self.model_name_list.append(key)

        if pretrained_list is not None:
            for idx, pretrained in enumerate(pretrained_list):
                if pretrained is not None:
                    # Load into the sub-model itself; model_name_list only
                    # holds the string keys, which cannot receive weights.
                    load_dygraph_pretrain(
                        self.model_list[idx], path=pretrained)

    def forward(self, x, label=None):
        """Feed the same input to every sub-model.

        Args:
            x: Input given to each sub-model.
            label: When not None, passed to each sub-model as a second
                positional argument; otherwise sub-models are called with
                ``x`` only.

        Returns:
            dict mapping each sub-model's key to that sub-model's output.
        """
        result_dict = dict()
        for model_name, model in zip(self.model_name_list, self.model_list):
            if label is None:
                result_dict[model_name] = model(x)
            else:
                result_dict[model_name] = model(x, label)
        return result_dict


class AttentionModel(DistillationModel):
    """DistillationModel variant that chains its sub-models sequentially.

    Construction is delegated unchanged to ``DistillationModel``. In
    ``forward`` each sub-model receives the previous sub-model's output
    (the first one receives ``x``), and every output is merged into a single
    result dict via ``dict.update``.
    """

    def __init__(self,
                 models=None,
                 pretrained_list=None,
                 freeze_params_list=None,
                 **kargs):
        super().__init__(models, pretrained_list, freeze_params_list, **kargs)

    def forward(self, x, label=None):
        """Run the sub-models as a pipeline and merge their outputs.

        Args:
            x: Input to the first sub-model.
            label: When not None, passed as a second positional argument to
                every sub-model.

        Returns:
            dict holding the union of all sub-model outputs; on key clashes
            the later sub-model's value wins.
        """
        merged = {}
        current = x
        # model_list is filled in lockstep with model_name_list by the parent
        # constructor, so walking it directly visits the same sub-models in
        # the same order.
        for stage in self.model_list:
            current = stage(current) if label is None else stage(current,
                                                                 label)
            merged.update(current)
        return merged
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`#copyright (c) 2021 PaddlePaddle Authors. All Rights Reserve.`
Init PaddleClas 2020-04-09 02:16:30 +08:00			`#`
			`#Licensed under the Apache License, Version 2.0 (the "License");`
			`#you may not use this file except in compliance with the License.`
			`#You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`#Unless required by applicable law or agreed to in writing, software`
			`#distributed under the License is distributed on an "AS IS" BASIS,`
			`#WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`#See the License for the specific language governing permissions and`
			`#limitations under the License.`

[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`import copy`
			`import importlib`

feat: log the FLOPs and Params when building model 2022-05-17 08:44:30 +00:00			`import paddle`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`import paddle.nn as nn`
support to_static for benchmark 2021-06-21 06:14:06 +00:00			`from paddle.jit import to_static`
			`from paddle.static import InputSpec`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`from . import backbone, gears`
move files 2021-05-24 11:42:24 +08:00			`from .backbone import *`
add vehicle neck 2021-06-04 14:54:34 +08:00			`from .gears import build_gear`
polish download pretrain 2020-04-13 18:53:03 +08:00			`from .utils import *`
update return_res method 2021-09-15 11:03:46 +08:00			`from ppcls.arch.backbone.base.theseus_layer import TheseusLayer`
support to_static for benchmark 2021-06-21 06:14:06 +00:00			`from ppcls.utils import logger`
add distillation and fix some apis (#810) * fix save load and imagenet dataset * refine trainer 2021-06-10 16:30:05 +08:00			`from ppcls.utils.save_load import load_dygraph_pretrain`
move slim into arch 2021-12-09 20:08:57 +08:00			`from ppcls.arch.slim import prune_model, quantize_model`
add AFD (#1683) * add AFD 2022-02-28 19:11:50 +08:00			`from ppcls.arch.distill.afd_attention import LinearTransformStudent, LinearTransformTeacher`
add pruner and quanter for theseus 2021-12-09 14:51:40 +08:00
add AFD (#1683) * add AFD 2022-02-28 19:11:50 +08:00			`__all__ = ["build_model", "RecModel", "DistillationModel", "AttentionModel"]`
Update __init__.py 2021-06-01 11:30:26 +08:00
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00
fix quant logic (#1941) * fix quant logic * add support for trt+int8 inference * add support for swin quant * fix swin and quant * fix assert info * fix assert info * fix log 2022-05-23 19:04:27 +08:00			`def build_model(config, mode="train"):`
add pruner and quanter for theseus 2021-12-09 14:51:40 +08:00			`arch_config = copy.deepcopy(config["Arch"])`
			`model_type = arch_config.pop("name")`
update code 2022-05-14 10:03:55 +00:00			`use_sync_bn = arch_config.pop("use_sync_bn", False)`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`mod = importlib.import_module(__name__)`
add pruner and quanter for theseus 2021-12-09 14:51:40 +08:00			`arch = getattr(mod, model_type)(**arch_config)`
update code 2022-05-14 10:03:55 +00:00			`if use_sync_bn:`
			`arch = nn.SyncBatchNorm.convert_sync_batchnorm(arch)`
update code and docs 2022-05-23 01:11:03 +00:00
add pruner and quanter for theseus 2021-12-09 14:51:40 +08:00			`if isinstance(arch, TheseusLayer):`
			`prune_model(config, arch)`
fix quant logic (#1941) * fix quant logic * add support for trt+int8 inference * add support for swin quant * fix swin and quant * fix assert info * fix assert info * fix log 2022-05-23 19:04:27 +08:00			`quantize_model(config, arch, mode)`
feat: log the FLOPs and Params when building model 2022-05-17 08:44:30 +00:00
			`logger.info("The FLOPs and Params of Arch:")`
			`try:`
			`flops = paddle.flops(arch, [1, *config["Global"]["image_shape"]])`
			`except Exception as e:`
			`logger.warning(`
			`f"An error occurred when calculating FLOPs and Params of Arch. Please check the Global.image_shape in config. The details of error is: {e}"`
			`)`

[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`return arch`


support to_static for benchmark 2021-06-21 06:14:06 +00:00			`def apply_to_static(config, model):`
			`support_to_static = config['Global'].get('to_static', False)`

			`if support_to_static:`
			`specs = None`
			`if 'image_shape' in config['Global']:`
			`specs = [InputSpec([None] + config['Global']['image_shape'])]`
stop_gradient=True for input spec (#1943) 2022-05-23 09:48:27 +08:00			`specs[0].stop_gradient = True`
support to_static for benchmark 2021-06-21 06:14:06 +00:00			`model = to_static(model, input_spec=specs)`
			`logger.info("Successfully to apply @to_static with specs: {}".format(`
			`specs))`
			`return model`


add pruner and quanter for theseus 2021-12-09 14:51:40 +08:00			`class RecModel(TheseusLayer):`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`def __init__(self, **config):`
			`super().__init__()`
			`backbone_config = config["Backbone"]`
			`backbone_name = backbone_config.pop("name")`
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`self.backbone = eval(backbone_name)(**backbone_config)`
add vehicle neck 2021-06-04 14:54:34 +08:00			`if "BackboneStopLayer" in config:`
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`backbone_stop_layer = config["BackboneStopLayer"]["name"]`
			`self.backbone.stop_after(backbone_stop_layer)`
add CompCars train 2021-06-02 20:04:24 +08:00
add vehicle neck 2021-06-04 14:54:34 +08:00			`if "Neck" in config:`
			`self.neck = build_gear(config["Neck"])`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`else:`
			`self.neck = None`
add CompCars train 2021-06-02 20:04:24 +08:00
add vehicle neck 2021-06-04 14:54:34 +08:00			`if "Head" in config:`
			`self.head = build_gear(config["Head"])`
			`else:`
			`self.head = None`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00
dbg label 2021-06-05 17:56:40 +08:00			`def forward(self, x, label=None):`
add dist of rec model (#1574) * add distillation loss func and rec distillation 2022-01-05 19:25:36 +08:00			`out = dict()`
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`x = self.backbone(x)`
add dist of rec model (#1574) * add distillation loss func and rec distillation 2022-01-05 19:25:36 +08:00			`out["backbone"] = x`
[WIP]add arch init (#744) * polish trainer 2021-05-27 18:41:44 +08:00			`if self.neck is not None:`
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`x = self.neck(x)`
fox dist err (#1621) * fox dist err * fix init * fix init 2022-01-06 09:46:52 +08:00			`out["neck"] = x`
add dist of rec model (#1574) * add distillation loss func and rec distillation 2022-01-05 19:25:36 +08:00			`out["features"] = x`
add vehicle neck 2021-06-04 14:54:34 +08:00			`if self.head is not None:`
add vehicle neck and fix bugs 2021-06-04 16:44:24 +08:00			`y = self.head(x, label)`
fox dist err (#1621) * fox dist err * fix init * fix init 2022-01-06 09:46:52 +08:00			`out["logits"] = y`
add dist of rec model (#1574) * add distillation loss func and rec distillation 2022-01-05 19:25:36 +08:00			`return out`
add distillation and fix some apis (#810) * fix save load and imagenet dataset * refine trainer 2021-06-10 16:30:05 +08:00

			`class DistillationModel(nn.Layer):`
			`def __init__(self,`
			`models=None,`
			`pretrained_list=None,`
fix distillation model infer and export model 2021-06-13 05:01:56 +00:00			`freeze_params_list=None,`
			`**kargs):`
add distillation and fix some apis (#810) * fix save load and imagenet dataset * refine trainer 2021-06-10 16:30:05 +08:00			`super().__init__()`
			`assert isinstance(models, list)`
			`self.model_list = []`
			`self.model_name_list = []`
			`if pretrained_list is not None:`
			`assert len(pretrained_list) == len(models)`

			`if freeze_params_list is None:`
			`freeze_params_list = [False] * len(models)`
			`assert len(freeze_params_list) == len(models)`
			`for idx, model_config in enumerate(models):`
			`assert len(model_config) == 1`
			`key = list(model_config.keys())[0]`
			`model_config = model_config[key]`
			`model_name = model_config.pop("name")`
			`model = eval(model_name)(**model_config)`

			`if freeze_params_list[idx]:`
			`for param in model.parameters():`
			`param.trainable = False`
			`self.model_list.append(self.add_sublayer(key, model))`
			`self.model_name_list.append(key)`

			`if pretrained_list is not None:`
			`for idx, pretrained in enumerate(pretrained_list):`
			`if pretrained is not None:`
			`load_dygraph_pretrain(`
			`self.model_name_list[idx], path=pretrained)`

			`def forward(self, x, label=None):`
			`result_dict = dict()`
			`for idx, model_name in enumerate(self.model_name_list):`
			`if label is None:`
			`result_dict[model_name] = self.model_list[idx](x)`
			`else:`
fix distillation model infer and export model 2021-06-13 05:01:56 +00:00			`result_dict[model_name] = self.model_list[idx](x, label)`
add distillation and fix some apis (#810) * fix save load and imagenet dataset * refine trainer 2021-06-10 16:30:05 +08:00			`return result_dict`
add AFD (#1683) * add AFD 2022-02-28 19:11:50 +08:00

			`class AttentionModel(DistillationModel):`
			`def __init__(self,`
			`models=None,`
			`pretrained_list=None,`
			`freeze_params_list=None,`
			`**kargs):`
			`super().__init__(models, pretrained_list, freeze_params_list, **kargs)`

			`def forward(self, x, label=None):`
			`result_dict = dict()`
			`out = x`
			`for idx, model_name in enumerate(self.model_name_list):`
			`if label is None:`
			`out = self.model_list[idx](out)`
			`result_dict.update(out)`
			`else:`
			`out = self.model_list[idx](out, label)`
			`result_dict.update(out)`
			`return result_dict`