mmclassification/mmpretrain/models/heads/multi_label_cls_head.py

# Copyright (c) OpenMMLab. All rights reserved.
from typing import Dict, List, Optional, Tuple

import torch
import torch.nn as nn
from mmengine.model import BaseModule

from mmpretrain.registry import MODELS
from mmpretrain.structures import DataSample, label_to_onehot


@MODELS.register_module()
class MultiLabelClsHead(BaseModule):
    """Classification head for multilabel task.

    The head adds no layer of its own: the last item of the input feature
    tuple is used directly as the classification score. The loss is
    computed on that score, and predictions are derived from its sigmoid.

    Args:
        loss (dict | nn.Module): Config of classification loss, or an
            already built loss module. Defaults to
            ``dict(type='CrossEntropyLoss', use_sigmoid=True)``.
        thr (float, optional): Predictions with scores under the threshold
            are considered as negative. Defaults to None.
        topk (int, optional): The ``topk`` labels with the highest scores
            are considered as positive. Defaults to None.
        init_cfg (dict, optional): The extra init config of layers.
            Defaults to None.

    Notes:
        If both ``thr`` and ``topk`` are set, use ``thr`` to determine
        positive predictions. If neither is set, use ``thr=0.5`` as
        default.
    """

    # NOTE(review): the default ``loss`` is a dict literal shared across
    # calls; this presumes ``MODELS.build`` does not mutate its argument
    # -- confirm against the registry implementation.
    def __init__(self,
                 loss: Dict = dict(type='CrossEntropyLoss', use_sigmoid=True),
                 thr: Optional[float] = None,
                 topk: Optional[int] = None,
                 init_cfg: Optional[dict] = None):
        super().__init__(init_cfg=init_cfg)

        # Accept either a ready-made loss module or a config to build one.
        if not isinstance(loss, nn.Module):
            loss = MODELS.build(loss)
        self.loss_module = loss

        # Fall back to thresholding when no decision rule is configured.
        if thr is None and topk is None:
            thr = 0.5

        self.thr = thr
        self.topk = topk

    def pre_logits(self, feats: Tuple[torch.Tensor]) -> torch.Tensor:
        """The process before the final classification head.

        The input ``feats`` is a tuple of tensor, and each tensor is the
        feature of a backbone stage. In ``MultiLabelClsHead``, we just obtain
        the feature of the last stage.

        Args:
            feats (tuple[Tensor]): The features of the backbone stages.

        Returns:
            Tensor: The last item of ``feats``, unchanged.
        """
        # The MultiLabelClsHead doesn't have other module, just return after
        # unpacking.
        return feats[-1]

    def forward(self, feats: Tuple[torch.Tensor]) -> torch.Tensor:
        """The forward process.

        Args:
            feats (tuple[Tensor]): The features of the backbone stages.

        Returns:
            Tensor: The output of :meth:`pre_logits`, used as the
            classification score.
        """
        # The MultiLabelClsHead doesn't have the final classification head,
        # just return the unpacked inputs.
        return self.pre_logits(feats)

    def loss(self, feats: Tuple[torch.Tensor], data_samples: List[DataSample],
             **kwargs) -> dict:
        """Calculate losses from the classification score.

        Args:
            feats (tuple[Tensor]): The features extracted from the backbone.
                Multiple stage inputs are acceptable but only the last stage
                will be used to classify. The shape of every item should be
                ``(num_samples, num_classes)``.
            data_samples (List[DataSample]): The annotation data of
                every samples.
            **kwargs: Other keyword arguments to forward the loss module.

        Returns:
            dict[str, Tensor]: a dictionary of loss components
        """
        # The part can be traced by torch.fx
        cls_score = self(feats)

        # The part can not be traced by torch.fx
        return self._get_loss(cls_score, data_samples, **kwargs)

    def _get_loss(self, cls_score: torch.Tensor,
                  data_samples: List[DataSample], **kwargs) -> dict:
        """Unpack data samples and compute loss.

        Args:
            cls_score (Tensor): The classification score; its last
                dimension is taken as the number of classes.
            data_samples (List[DataSample]): The annotation data of
                every samples. The first sample decides which field is
                used as target for the whole batch.
            **kwargs: Other keyword arguments to forward the loss module.

        Returns:
            dict[str, Tensor]: A dictionary with the single key ``'loss'``.
        """
        num_classes = cls_score.size(-1)

        # Unpack data samples and pack targets. ``gt_score`` is used as the
        # target when the first sample carries it; otherwise every
        # ``gt_label`` is converted with ``label_to_onehot``.
        if 'gt_score' in data_samples[0]:
            target = torch.stack([i.gt_score.float() for i in data_samples])
        else:
            target = torch.stack([
                label_to_onehot(i.gt_label, num_classes) for i in data_samples
            ]).float()

        # compute loss, passing the number of samples as ``avg_factor``
        losses = dict()
        losses['loss'] = self.loss_module(
            cls_score, target, avg_factor=cls_score.size(0), **kwargs)

        return losses

    def predict(
            self,
            feats: Tuple[torch.Tensor],
            data_samples: Optional[List[DataSample]] = None
    ) -> List[DataSample]:
        """Inference without augmentation.

        Args:
            feats (tuple[Tensor]): The features extracted from the backbone.
                Multiple stage inputs are acceptable but only the last stage
                will be used to classify. The shape of every item should be
                ``(num_samples, num_classes)``.
            data_samples (List[DataSample], optional): The annotation
                data of every samples. If not None, the predictions are
                set on the input data samples. Defaults to None.

        Returns:
            List[DataSample]: A list of data samples which contains the
            predicted results.
        """
        # The part can be traced by torch.fx
        cls_score = self(feats)

        # The part can not be traced by torch.fx
        return self._get_predictions(cls_score, data_samples)

    def _get_predictions(
            self, cls_score: torch.Tensor,
            data_samples: Optional[List[DataSample]]) -> List[DataSample]:
        """Post-process the output of head.

        Applies sigmoid to ``cls_score`` and, for every sample, passes the
        resulting scores to ``set_pred_score`` and the positive label
        indices to ``set_pred_label``.

        Args:
            cls_score (Tensor): The classification score, one row per
                sample.
            data_samples (List[DataSample], optional): The data samples to
                update. If None, a new ``DataSample`` is created for every
                row of ``cls_score``.

        Returns:
            List[DataSample]: The data samples holding the predictions.
        """
        pred_scores = torch.sigmoid(cls_score)

        if data_samples is None:
            data_samples = [DataSample() for _ in range(cls_score.size(0))]

        for data_sample, score in zip(data_samples, pred_scores):
            if self.thr is not None:
                # a label is predicted positive if its score is not lower
                # than thr; thr takes precedence over topk
                label = torch.where(score >= self.thr)[0]
            else:
                # top-k labels will be predicted positive for any example
                _, label = score.topk(self.topk)
            data_sample.set_pred_score(score).set_pred_label(label)

        return data_samples
Add multi_label heads 2022-07-08 06:51:09 +00:00			`# Copyright (c) OpenMMLab. All rights reserved.`
			`from typing import Dict, List, Optional, Tuple`

			`import torch`
[Feature] Support getting model from the name defined in the model-index file. (#1236) * [Feature] Support getting model from the name defined in the model-index file. * Add unit tests. * Prevent import `timm` if the `TIMMBackbone` is not used. * Fix Windows CI. * Move `init_model` to `mmcls.apis.hub`, and support pass nn.Module to all model components. * Fix requirements * Rename `hub.py` to `model.py` and add unit tests. 2022-12-06 17:00:22 +08:00			`import torch.nn as nn`
[Refactor] Add selfsup algorithms. (#1389) * remove basehead * add moco series * add byol simclr simsiam * add ut * update configs * add simsiam hook * add and refactor beit * update ut * add cae * update extract_feat * refactor cae * add mae * refactor data preprocessor * update heads * add maskfeat * add milan * add simmim * add mixmim * fix lint * fix ut * fix lint * add eva * add densecl * add barlowtwins * add swav * fix lint * update readtherdocs rst * update docs * update * Decrease UT memory usage * Fix docstring * update DALLEEncoder * Update model docs * refactor dalle encoder * update docstring * fix ut * fix config error * add val_cfg and test_cfg * refactor clip generator * fix lint * pass check * fix ut * add lars * update type of BEiT in configs * Use MMEngine style momentum in EMA. * apply mmpretrain solarize --------- Co-authored-by: mzr1996 <mzr1996@163.com> 2023-03-06 16:53:15 +08:00			`from mmengine.model import BaseModule`
Add multi_label heads 2022-07-08 06:51:09 +00:00
Rename the package name to `mmpretrain`. 2023-02-17 11:31:08 +08:00			`from mmpretrain.registry import MODELS`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`from mmpretrain.structures import DataSample, label_to_onehot`
Add multi_label heads 2022-07-08 06:51:09 +00:00

			`@MODELS.register_module()`
[Refactor] Add selfsup algorithms. (#1389) * remove basehead * add moco series * add byol simclr simsiam * add ut * update configs * add simsiam hook * add and refactor beit * update ut * add cae * update extract_feat * refactor cae * add mae * refactor data preprocessor * update heads * add maskfeat * add milan * add simmim * add mixmim * fix lint * fix ut * fix lint * add eva * add densecl * add barlowtwins * add swav * fix lint * update readtherdocs rst * update docs * update * Decrease UT memory usage * Fix docstring * update DALLEEncoder * Update model docs * refactor dalle encoder * update docstring * fix ut * fix config error * add val_cfg and test_cfg * refactor clip generator * fix lint * pass check * fix ut * add lars * update type of BEiT in configs * Use MMEngine style momentum in EMA. * apply mmpretrain solarize --------- Co-authored-by: mzr1996 <mzr1996@163.com> 2023-03-06 16:53:15 +08:00			`class MultiLabelClsHead(BaseModule):`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`"""Classification head for multilabel task.`

			`Args:`
			`loss (dict): Config of classification loss. Defaults to`
			`dict(type='CrossEntropyLoss', use_sigmoid=True).`
			`thr (float, optional): Predictions with scores under the thresholds`
			`are considered as negative. Defaults to None.`
			`topk (int, optional): Predictions with the k-th highest scores are`
			`considered as positive. Defaults to None.`
			`init_cfg (dict, optional): The extra init config of layers.`
			`Defaults to None.`

			`Notes:`
			If both ``thr`` and ``topk`` are set, use ``thr`` to determine
			positive predictions. If neither is set, use ``thr=0.5`` as
			`default.`
			`"""`

			`def __init__(self,`
			`loss: Dict = dict(type='CrossEntropyLoss', use_sigmoid=True),`
			`thr: Optional[float] = None,`
			`topk: Optional[int] = None,`
			`init_cfg: Optional[dict] = None):`
			`super(MultiLabelClsHead, self).__init__(init_cfg=init_cfg)`

[Feature] Support getting model from the name defined in the model-index file. (#1236) * [Feature] Support getting model from the name defined in the model-index file. * Add unit tests. * Prevent import `timm` if the `TIMMBackbone` is not used. * Fix Windows CI. * Move `init_model` to `mmcls.apis.hub`, and support pass nn.Module to all model components. * Fix requirements * Rename `hub.py` to `model.py` and add unit tests. 2022-12-06 17:00:22 +08:00			`if not isinstance(loss, nn.Module):`
			`loss = MODELS.build(loss)`
			`self.loss_module = loss`
Add multi_label heads 2022-07-08 06:51:09 +00:00
			`if thr is None and topk is None:`
			`thr = 0.5`

			`self.thr = thr`
			`self.topk = topk`

			`def pre_logits(self, feats: Tuple[torch.Tensor]) -> torch.Tensor:`
			`"""The process before the final classification head.`

			The input ``feats`` is a tuple of tensor, and each tensor is the
			feature of a backbone stage. In ``MultiLabelClsHead``, we just obtain
			`the feature of the last stage.`
			`"""`
			`# The MultiLabelClsHead doesn't have other module, just return after`
			`# unpacking.`
			`return feats[-1]`

			`def forward(self, feats: Tuple[torch.Tensor]) -> torch.Tensor:`
			`"""The forward process."""`
			`pre_logits = self.pre_logits(feats)`
			`# The MultiLabelClsHead doesn't have the final classification head,`
			`# just return the unpacked inputs.`
			`return pre_logits`

[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`def loss(self, feats: Tuple[torch.Tensor], data_samples: List[DataSample],`
			`**kwargs) -> dict:`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`"""Calculate losses from the classification score.`

			`Args:`
			`feats (tuple[Tensor]): The features extracted from the backbone.`
			`Multiple stage inputs are acceptable but only the last stage`
			`will be used to classify. The shape of every item should be`
			``(num_samples, num_classes)``.
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`data_samples (List[DataSample]): The annotation data of`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`every samples.`
			`**kwargs: Other keyword arguments to forward the loss module.`

			`Returns:`
			`dict[str, Tensor]: a dictionary of loss components`
			`"""`
			`# The part can be traced by torch.fx`
			`cls_score = self(feats)`

			`# The part can not be traced by torch.fx`
			`losses = self._get_loss(cls_score, data_samples, **kwargs)`
			`return losses`

			`def _get_loss(self, cls_score: torch.Tensor,`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`data_samples: List[DataSample], **kwargs):`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`"""Unpack data samples and compute loss."""`
			`num_classes = cls_score.size()[-1]`
			`# Unpack data samples and pack targets`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`if 'gt_score' in data_samples[0]:`
[Fix] Fix the bug in binary cross entropy loss (#1499) * [Fix] Fix the bug in binary cross entropy loss Fix the bug in binary cross entropy loss when using multi-label datasets e.g.VOC2007 * update ci --------- Co-authored-by: Ezra-Yu <18586273+Ezra-Yu@users.noreply.github.com> 2023-04-19 13:53:31 +08:00			`target = torch.stack([i.gt_score.float() for i in data_samples])`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`else:`
			`target = torch.stack([`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`label_to_onehot(i.gt_label, num_classes) for i in data_samples`
			`]).float()`
Add multi_label heads 2022-07-08 06:51:09 +00:00
			`# compute loss`
			`losses = dict()`
			`loss = self.loss_module(`
			`cls_score, target, avg_factor=cls_score.size(0), **kwargs)`
			`losses['loss'] = loss`

			`return losses`

[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`def predict(self,`
			`feats: Tuple[torch.Tensor],`
			`data_samples: List[DataSample] = None) -> List[DataSample]:`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`"""Inference without augmentation.`

			`Args:`
			`feats (tuple[Tensor]): The features extracted from the backbone.`
			`Multiple stage inputs are acceptable but only the last stage`
			`will be used to classify. The shape of every item should be`
			``(num_samples, num_classes)``.
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`data_samples (List[DataSample], optional): The annotation`
Add multi_label heads 2022-07-08 06:51:09 +00:00			data of every samples. If not None, set ``pred_label`` of
			`the input data samples. Defaults to None.`

			`Returns:`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`List[DataSample]: A list of data samples which contains the`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`predicted results.`
			`"""`
			`# The part can be traced by torch.fx`
			`cls_score = self(feats)`

			`# The part can not be traced by torch.fx`
			`predictions = self._get_predictions(cls_score, data_samples)`
			`return predictions`

			`def _get_predictions(self, cls_score: torch.Tensor,`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`data_samples: List[DataSample]):`
Add multi_label heads 2022-07-08 06:51:09 +00:00			`"""Post-process the output of head.`

			Including sigmoid and set ``pred_label`` of data samples.
			`"""`
			`pred_scores = torch.sigmoid(cls_score)`

			`if data_samples is None:`
[Refactor] Refactor ClsDatasample to a union DataSample. (#1371) * [Refactor] Refactor ClsDatasample to a union DataSample. * Add method * Fix docstring * Update docstring. 2023-02-23 10:07:53 +08:00			`data_samples = [DataSample() for _ in range(cls_score.size(0))]`
Add multi_label heads 2022-07-08 06:51:09 +00:00
			`for data_sample, score in zip(data_samples, pred_scores):`
			`if self.thr is not None:`
			`# a label is predicted positive if larger than thr`
			`label = torch.where(score >= self.thr)[0]`
			`else:`
			`# top-k labels will be predicted positive for any example`
			`_, label = score.topk(self.topk)`
			`data_sample.set_pred_score(score).set_pred_label(label)`

			`return data_samples`