fast-reid/fastreid/modeling/meta_arch/baseline.py

# encoding: utf-8
"""
@author:  liaoxingyu
@contact: sherlockliao01@gmail.com
"""

import torch
from torch import nn

from fastreid.layers import GeneralizedMeanPoolingP, AdaptiveAvgMaxPool2d, FastGlobalAvgPool2d
from fastreid.modeling.backbones import build_backbone
from fastreid.modeling.heads import build_reid_heads
from fastreid.modeling.losses import *
from .build import META_ARCH_REGISTRY


@META_ARCH_REGISTRY.register()
class Baseline(nn.Module):
    """
    Baseline meta architecture: input normalization, a backbone and a ReID head.

    The pixel mean/std from the config are stored as buffers so that image
    normalization runs on the same device as the model.
    """

    def __init__(self, cfg):
        """
        Build the normalization buffers, the backbone and the head from ``cfg``.

        The following config entries are read here: ``MODEL.PIXEL_MEAN``,
        ``MODEL.PIXEL_STD``, ``MODEL.HEADS.POOL_LAYER``, ``MODEL.HEADS.IN_FEAT``
        and ``MODEL.HEADS.NUM_CLASSES``. ``cfg`` is also kept on the instance
        because ``losses`` reads ``MODEL.LOSSES.NAME`` from it.

        Raises:
            KeyError: if ``MODEL.HEADS.POOL_LAYER`` is not one of 'avgpool',
                'maxpool', 'gempool', 'avgmaxpool' or 'identity'.
        """
        super().__init__()
        self._cfg = cfg
        assert len(cfg.MODEL.PIXEL_MEAN) == len(cfg.MODEL.PIXEL_STD)
        # Shaped (1, C, 1, 1) so they broadcast against batched image tensors.
        self.register_buffer("pixel_mean", torch.tensor(cfg.MODEL.PIXEL_MEAN).view(1, -1, 1, 1))
        self.register_buffer("pixel_std", torch.tensor(cfg.MODEL.PIXEL_STD).view(1, -1, 1, 1))

        # backbone
        self.backbone = build_backbone(cfg)

        # head
        pool_type = cfg.MODEL.HEADS.POOL_LAYER
        if pool_type == 'avgpool':
            pool_layer = FastGlobalAvgPool2d()
        elif pool_type == 'maxpool':
            pool_layer = nn.AdaptiveMaxPool2d(1)
        elif pool_type == 'gempool':
            pool_layer = GeneralizedMeanPoolingP()
        elif pool_type == "avgmaxpool":
            pool_layer = AdaptiveAvgMaxPool2d()
        elif pool_type == "identity":
            pool_layer = nn.Identity()
        else:
            raise KeyError(f"{pool_type} is invalid, please choose from "
                           f"'avgpool', 'maxpool', 'gempool', 'avgmaxpool' and 'identity'.")

        in_feat = cfg.MODEL.HEADS.IN_FEAT
        num_classes = cfg.MODEL.HEADS.NUM_CLASSES
        self.heads = build_reid_heads(cfg, in_feat, num_classes, pool_layer)

    @property
    def device(self):
        """Device the model lives on, taken from the ``pixel_mean`` buffer."""
        return self.pixel_mean.device

    def forward(self, batched_inputs):
        """
        Run the backbone and the head on a batch.

        Args:
            batched_inputs: mapping with an ``"images"`` tensor and, in
                training mode, a ``"targets"`` tensor.

        Returns:
            In training mode, a tuple ``(head_outputs, targets)`` where
            ``targets`` is the long tensor moved to the model device.
            Otherwise, the output of the head called on the features alone.
        """
        images = self.preprocess_image(batched_inputs)
        features = self.backbone(images)

        if self.training:
            assert "targets" in batched_inputs, "Person ID annotation are missing in training!"
            targets = batched_inputs["targets"].long().to(self.device)

            # PreciseBN flag: when PreciseBN is run on a different dataset, the
            # number of classes in the new dataset may be larger than in the
            # original one, which makes circle/arcface throw an error. A negative
            # target sum is treated as that flag and all targets are set to 0 to
            # avoid the problem.
            if targets.sum() < 0:
                targets.zero_()

            return self.heads(features, targets), targets
        else:
            return self.heads(features)

    def preprocess_image(self, batched_inputs):
        """
        Normalize and batch the input images.

        The images are copied to the model device before normalization, so the
        tensor stored in ``batched_inputs["images"]`` is never modified, even
        when it already lives on the model device. Without the copy, running
        the model twice on the same batch would normalize the images twice.

        Args:
            batched_inputs: mapping holding the image tensor under ``"images"``.

        Returns:
            A new tensor on the model device with ``pixel_mean`` subtracted and
            divided by ``pixel_std``.
        """
        # copy=True forces a fresh tensor even when .to() would otherwise return
        # the caller's tensor unchanged; the in-place ops below then only touch
        # that private copy.
        images = batched_inputs["images"].to(self.device, copy=True)
        images.sub_(self.pixel_mean).div_(self.pixel_std)
        return images

    def losses(self, outputs, gt_labels):
        r"""
        Compute loss from modeling's outputs, the loss function input arguments
        must be the same as the outputs of the model forwarding.

        Args:
            outputs: a 3-item sequence unpacked as
                ``(cls_outputs, pred_class_logits, pred_features)``.
            gt_labels: ground-truth labels passed to every loss.

        Returns:
            dict with ``'loss_cls'`` and/or ``'loss_triplet'``, depending on
            which names are listed in ``MODEL.LOSSES.NAME``.
        """
        cls_outputs, pred_class_logits, pred_features = outputs
        loss_dict = {}
        loss_names = self._cfg.MODEL.LOSSES.NAME

        # Log prediction accuracy (detached so logging does not affect gradients)
        CrossEntropyLoss.log_accuracy(pred_class_logits.detach(), gt_labels)

        if "CrossEntropyLoss" in loss_names:
            loss_dict['loss_cls'] = CrossEntropyLoss(self._cfg)(cls_outputs, gt_labels)

        if "TripletLoss" in loss_names:
            loss_dict['loss_triplet'] = TripletLoss(self._cfg)(pred_features, gt_labels)

        return loss_dict
Update sampler code 2020-02-10 07:38:56 +08:00			`# encoding: utf-8`
			`"""`
			`@author: liaoxingyu`
			`@contact: sherlockliao01@gmail.com`
			`"""`

fix: remove prefetcher, put normalizer in model 1. remove messy data prefetcher which will cause confusion 2. put normliazer in model to accelerate training via GPU computing 2020-05-25 23:39:11 +08:00			`import torch`
chagne arch 1. change dataset show to trainset show and testset show seperately 2. add cls layer to easily plug in circle loss and arcface 2020-04-19 12:54:01 +08:00			`from torch import nn`
Update sampler code 2020-02-10 07:38:56 +08:00
update fast global avgpool Summary: update fast pool according to https://arxiv.org/pdf/2003.13630.pdf 2020-06-12 16:34:03 +08:00			`from fastreid.layers import GeneralizedMeanPoolingP, AdaptiveAvgMaxPool2d, FastGlobalAvgPool2d`
feat(layers/norm): add ghost batchnorm add a get_norm fucntion to easily change normalization between batchnorm, ghost bn and group bn 2020-05-01 09:02:46 +08:00			`from fastreid.modeling.backbones import build_backbone`
			`from fastreid.modeling.heads import build_reid_heads`
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`from fastreid.modeling.losses import *`
Update sampler code 2020-02-10 07:38:56 +08:00			`from .build import META_ARCH_REGISTRY`


			`@META_ARCH_REGISTRY.register()`
			`class Baseline(nn.Module):`
			`def __init__(self, cfg):`
			`super().__init__()`
update version0.2 code 2020-03-25 10:58:26 +08:00			`self._cfg = cfg`
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`assert len(cfg.MODEL.PIXEL_MEAN) == len(cfg.MODEL.PIXEL_STD)`
			`self.register_buffer("pixel_mean", torch.tensor(cfg.MODEL.PIXEL_MEAN).view(1, -1, 1, 1))`
			`self.register_buffer("pixel_std", torch.tensor(cfg.MODEL.PIXEL_STD).view(1, -1, 1, 1))`

update version0.2 code 2020-03-25 10:58:26 +08:00			`# backbone`
Update sampler code 2020-02-10 07:38:56 +08:00			`self.backbone = build_backbone(cfg)`

update version0.2 code 2020-03-25 10:58:26 +08:00			`# head`
refactor code Summary: change code style and refactor code, add avgmax pooling layer in gem_pool 2020-05-28 13:49:39 +08:00			`pool_type = cfg.MODEL.HEADS.POOL_LAYER`
update fast global avgpool Summary: update fast pool according to https://arxiv.org/pdf/2003.13630.pdf 2020-06-12 16:34:03 +08:00			`if pool_type == 'avgpool': pool_layer = FastGlobalAvgPool2d()`
refactor code Summary: change code style and refactor code, add avgmax pooling layer in gem_pool 2020-05-28 13:49:39 +08:00			`elif pool_type == 'maxpool': pool_layer = nn.AdaptiveMaxPool2d(1)`
			`elif pool_type == 'gempool': pool_layer = GeneralizedMeanPoolingP()`
update fast global avgpool Summary: update fast pool according to https://arxiv.org/pdf/2003.13630.pdf 2020-06-12 16:34:03 +08:00			`elif pool_type == "avgmaxpool": pool_layer = AdaptiveAvgMaxPool2d()`
refactor code Summary: change code style and refactor code, add avgmax pooling layer in gem_pool 2020-05-28 13:49:39 +08:00			`elif pool_type == "identity": pool_layer = nn.Identity()`
update version0.2 code 2020-03-25 10:58:26 +08:00			`else:`
refactor code Summary: change code style and refactor code, add avgmax pooling layer in gem_pool 2020-05-28 13:49:39 +08:00			`raise KeyError(f"{pool_type} is invalid, please choose from "`
			`f"'avgpool', 'maxpool', 'gempool', 'avgmaxpool' and 'identity'.")`
refactor($modeling/meta): refactor heads output without intermediate variables generated by reid heads, make it more flexible 2020-04-24 12:16:18 +08:00
			`in_feat = cfg.MODEL.HEADS.IN_FEAT`
refactor(heads): move num_classes out from heads set parameter num_classes in meta_arch to easily modify different heads fc layer 2020-04-29 21:29:48 +08:00			`num_classes = cfg.MODEL.HEADS.NUM_CLASSES`
			`self.heads = build_reid_heads(cfg, in_feat, num_classes, pool_layer)`
Change architecture: 1. delete redundant preprocess 2. add data prefetcher to accelerate data loading 3. fix minor bug of triplet sampler when only one image for one id 2020-02-18 21:01:23 +08:00
fix: remove prefetcher, put normalizer in model 1. remove messy data prefetcher which will cause confusion 2. put normliazer in model to accelerate training via GPU computing 2020-05-25 23:39:11 +08:00			`@property`
			`def device(self):`
			`return self.pixel_mean.device`
Update sampler code 2020-02-10 07:38:56 +08:00
fix: remove prefetcher, put normalizer in model 1. remove messy data prefetcher which will cause confusion 2. put normliazer in model to accelerate training via GPU computing 2020-05-25 23:39:11 +08:00			`def forward(self, batched_inputs):`
			`images = self.preprocess_image(batched_inputs)`
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`features = self.backbone(images)`
fix: remove prefetcher, put normalizer in model 1. remove messy data prefetcher which will cause confusion 2. put normliazer in model to accelerate training via GPU computing 2020-05-25 23:39:11 +08:00
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`if self.training:`
			`assert "targets" in batched_inputs, "Person ID annotation are missing in training!"`
			`targets = batched_inputs["targets"].long().to(self.device)`
update version0.2 code 2020-03-25 10:58:26 +08:00
fix typro 2020-07-10 16:26:35 +08:00			`# PreciseBN flag, When do preciseBN on different dataset, the number of classes in new dataset`
			`# may be larger than that in the original dataset, so the circle/arcface will`
			`# throw an error. We just set all the targets to 0 to avoid this problem.`
			`if targets.sum() < 0: targets.zero_()`

minor update 2020-07-14 11:58:06 +08:00			`return self.heads(features, targets), targets`
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`else:`
minor update 2020-07-14 11:58:06 +08:00			`return self.heads(features)`
update version0.2 code 2020-03-25 10:58:26 +08:00
fix: remove prefetcher, put normalizer in model 1. remove messy data prefetcher which will cause confusion 2. put normliazer in model to accelerate training via GPU computing 2020-05-25 23:39:11 +08:00			`def preprocess_image(self, batched_inputs):`
			`"""`
			`Normalize and batch the input images.`
			`"""`
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`images = batched_inputs["images"].to(self.device)`
change style in baseline 2020-06-05 11:23:11 +08:00			`# images = batched_inputs`
fix: remove prefetcher, put normalizer in model 1. remove messy data prefetcher which will cause confusion 2. put normliazer in model to accelerate training via GPU computing 2020-05-25 23:39:11 +08:00			`images.sub_(self.pixel_mean).div_(self.pixel_std)`
			`return images`

minor update 2020-07-14 11:58:06 +08:00			`def losses(self, outputs, gt_labels):`
fix typro 2020-07-10 16:26:35 +08:00			`r"""`
			`Compute loss from modeling's outputs, the loss function input arguments`
			`must be the same as the outputs of the model forwarding.`
			`"""`
minor update 2020-07-14 11:58:06 +08:00			`cls_outputs, pred_class_logits, pred_features = outputs`
finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`loss_dict = {}`
			`loss_names = self._cfg.MODEL.LOSSES.NAME`

minor update 2020-07-14 11:58:06 +08:00			`# Log prediction accuracy`
			`CrossEntropyLoss.log_accuracy(pred_class_logits.detach(), gt_labels)`

finish v0.2 ddp training 2020-07-06 16:57:43 +08:00			`if "CrossEntropyLoss" in loss_names:`
			`loss_dict['loss_cls'] = CrossEntropyLoss(self._cfg)(cls_outputs, gt_labels)`

			`if "TripletLoss" in loss_names:`
			`loss_dict['loss_triplet'] = TripletLoss(self._cfg)(pred_features, gt_labels)`

			`return loss_dict`