[Enhance] Support Mixup&Cutmix for multi-label task.

2025-06-03 21:53:55 +08:00 · 2022-01-21 12:30:58 +09:00 · 2022-01-21 12:30:58 +09:00 · d29037e8d1
commit d29037e8d1
parent b39885d953
5 changed files with 64 additions and 7 deletions
--- a/mmcls/models/utils/augment/cutmix.py
+++ b/mmcls/models/utils/augment/cutmix.py
@ -3,9 +3,9 @@ from abc import ABCMeta, abstractmethod
 import numpy as np
 import torch
 import torch.nn.functional as F
 from .builder import AUGMENT
 from .utils import one_hot_encoding
 class BaseCutMixLayer(object, metaclass=ABCMeta):
@ -123,7 +123,7 @@ class BatchCutMixLayer(BaseCutMixLayer):
        super(BatchCutMixLayer, self).__init__(*args, **kwargs)
    def cutmix(self, img, gt_label):
-        one_hot_gt_label = F.one_hot(gt_label, num_classes=self.num_classes)
+        one_hot_gt_label = one_hot_encoding(gt_label, self.num_classes)
        lam = np.random.beta(self.alpha, self.alpha)
        batch_size = img.size(0)
        index = torch.randperm(batch_size)
--- a/mmcls/models/utils/augment/identity.py
+++ b/mmcls/models/utils/augment/identity.py
@ -1,7 +1,6 @@
 # Copyright (c) OpenMMLab. All rights reserved.
 import torch.nn.functional as F
 from .builder import AUGMENT
 from .utils import one_hot_encoding
@AUGMENT.register_module(name='Identity')
@ -24,7 +23,7 @@ class Identity(object):
        self.prob = prob
    def one_hot(self, gt_label):
-        return F.one_hot(gt_label, num_classes=self.num_classes)
+        return one_hot_encoding(gt_label, self.num_classes)
    def __call__(self, img, gt_label):
        """Return ``img`` untouched together with ``self.one_hot(gt_label)``."""
        encoded_label = self.one_hot(gt_label)
        return img, encoded_label
--- a/mmcls/models/utils/augment/mixup.py
+++ b/mmcls/models/utils/augment/mixup.py
@ -3,9 +3,9 @@ from abc import ABCMeta, abstractmethod
 import numpy as np
 import torch
 import torch.nn.functional as F
 from .builder import AUGMENT
 from .utils import one_hot_encoding
 class BaseMixupLayer(object, metaclass=ABCMeta):
@ -42,7 +42,7 @@ class BatchMixupLayer(BaseMixupLayer):
        super(BatchMixupLayer, self).__init__(*args, **kwargs)
    def mixup(self, img, gt_label):
-        one_hot_gt_label = F.one_hot(gt_label, num_classes=self.num_classes)
+        one_hot_gt_label = one_hot_encoding(gt_label, self.num_classes)
        lam = np.random.beta(self.alpha, self.alpha)
        batch_size = img.size(0)
        index = torch.randperm(batch_size)
--- a/mmcls/models/utils/augment/utils.py
+++ b/mmcls/models/utils/augment/utils.py
@ -0,0 +1,23 @@
 import torch.nn.functional as F
 def one_hot_encoding(gt, num_classes):
    """Convert class-index labels to one-hot encoding.
    Labels whose number of dimensions is not exactly 1 are handed back
    unchanged, without encoding.
    Args:
        gt (Tensor): The gt label with shape (N,) or shape (N, *).
        num_classes (int): The number of classes.
    Return:
        Tensor: The one-hot gt label, or ``gt`` itself when it is not 1-D.
    """
    already_encoded = gt.ndim != 1
    if already_encoded:
        # Binary labels, e.g. [[0], [1], [1]], and multi-label targets,
        # e.g. [[0, 1, 1], [1, 0, 0], [1, 1, 1]], pass through as-is.
        return gt
    # Multi-class classification: a 1-D label tensor is expanded to one-hot.
    return F.one_hot(gt, num_classes=num_classes)
--- a/tests/test_models/test_utils/test_augment.py
+++ b/tests/test_models/test_utils/test_augment.py
@ -1,8 +1,15 @@
 # Copyright (c) OpenMMLab. All rights reserved.
 import pytest
 import torch
 from mmcls.models.utils import Augments
 # Augment configs shared by the parametrized tests; each test adds its own
 # ``num_classes`` entry before building ``Augments``.
 augment_cfgs = [
    dict(type='BatchCutMix', alpha=1., prob=1.),
    dict(type='BatchMixup', alpha=1., prob=1.),
    dict(type='Identity', prob=1.),
 ]
 def test_augments():
    imgs = torch.randn(4, 3, 32, 32)
@ -50,3 +57,31 @@ def test_augments():
    mixed_imgs, mixed_labels = augs(imgs, labels)
    assert mixed_imgs.shape == torch.Size((4, 3, 32, 32))
    assert mixed_labels.shape == torch.Size((4, 10))
@pytest.mark.parametrize('cfg', augment_cfgs)
 def test_binary_augment(cfg):
    """Check the output shapes of an augment fed (4, 1) binary labels."""
    image_shape = (4, 3, 32, 32)
    label_shape = (4, 1)
    augment = Augments(dict(num_classes=1, **cfg))
    images = torch.randn(*image_shape)
    targets = torch.randint(0, 2, label_shape).float()
    out_images, out_targets = augment(images, targets)
    # The augment must keep both the image and the label shapes intact.
    assert out_images.shape == torch.Size(image_shape)
    assert out_targets.shape == torch.Size(label_shape)
@pytest.mark.parametrize('cfg', augment_cfgs)
 def test_multilabel_augment(cfg):
    """Check the output shapes of an augment fed (4, 10) multi-label targets."""
    image_shape = (4, 3, 32, 32)
    label_shape = (4, 10)
    augment = Augments(dict(num_classes=10, **cfg))
    images = torch.randn(*image_shape)
    targets = torch.randint(0, 2, label_shape).float()
    out_images, out_targets = augment(images, targets)
    # The augment must keep both the image and the label shapes intact.
    assert out_images.shape == torch.Size(image_shape)
    assert out_targets.shape == torch.Size(label_shape)