fast-reid/fastreid/modeling/layers/adacos.py

# encoding: utf-8
"""
@author: liaoxingyu
@contact: sherlockliao01@gmail.com
"""
import math

import torch
import torch.nn.functional as F
from torch import nn
from torch.nn import Parameter

from ..layers import *
from ..model_utils import weights_init_kaiming

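# Note on the method (added commentary, not from the original file):
# AdaCos (Zhang et al., CVPR 2019) removes the hand-tuned scale/margin of
# cosine-softmax losses. The scale s starts at sqrt(2) * log(C - 1) for C
# classes and is re-estimated every iteration inside torch.no_grad() as
#     s = log(B_avg) / cos(min(pi/4, theta_med)),
# where B_avg averages exp(s * cos(theta)) over the non-target logits and
# theta_med is the median angle between features and their target class
# weights. The forward pass below implements exactly this update.
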
class AdaCos(nn.Module):
    def __init__(self, cfg, in_feat, pool_layer=nn.AdaptiveAvgPool2d(1)):
        super().__init__()
        self._num_classes = cfg.MODEL.HEADS.NUM_CLASSES
        self.pool_layer = nn.Sequential(
            pool_layer,
            Flatten()
        )
        # bnneck
        self.bnneck = NoBiasBatchNorm1d(in_feat)
        self.bnneck.apply(weights_init_kaiming)

        # classifier
        # fixed initial scale s = sqrt(2) * log(C - 1); updated adaptively in forward()
        self._s = math.sqrt(2) * math.log(self._num_classes - 1)
        self._m = 0.50  # margin kept for API parity; not used below
        self.weight = Parameter(torch.Tensor(self._num_classes, in_feat))
        self.reset_parameters()

    def reset_parameters(self):
        nn.init.xavier_uniform_(self.weight)

    def forward(self, features, targets=None):
        global_feat = self.pool_layer(features)
        bn_feat = self.bnneck(global_feat)
        if not self.training:
            return bn_feat

        # normalize features
        x = F.normalize(bn_feat)
        # normalize weights
        weight = F.normalize(self.weight)
        # dot product
        logits = F.linear(x, weight)
        # feature re-scale
        theta = torch.acos(torch.clamp(logits, -1.0 + 1e-7, 1.0 - 1e-7))
        one_hot = torch.zeros_like(logits)
        one_hot.scatter_(1, targets.view(-1, 1).long(), 1)
        with torch.no_grad():
            # B_avg: mean of exp(s * cos(theta)) over the non-target logits
            B_avg = torch.where(one_hot < 1, torch.exp(self._s * logits), torch.zeros_like(logits))
            B_avg = torch.sum(B_avg) / x.size(0)
            # median angle between features and their target class weights
            theta_med = torch.median(theta[one_hot == 1])
            # adaptive scale update; use self._s consistently so the next
            # iteration's B_avg sees the updated value
            self._s = torch.log(B_avg) / torch.cos(torch.min(math.pi / 4 * torch.ones_like(theta_med), theta_med))

        pred_class_logits = self._s * logits
        return pred_class_logits, global_feat
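

# ---------------------------------------------------------------------------
# Minimal usage sketch (illustration only, not part of the original module).
# The SimpleNamespace config stand-in and the tensor shapes are assumptions;
# fastreid normally builds the head from its own config node and backbone,
# and the relative imports above require the fastreid package on the path.
# ---------------------------------------------------------------------------
if __name__ == "__main__":
    from types import SimpleNamespace

    cfg = SimpleNamespace(MODEL=SimpleNamespace(HEADS=SimpleNamespace(NUM_CLASSES=751)))
    head = AdaCos(cfg, in_feat=2048)

    features = torch.randn(16, 2048, 16, 8)   # backbone feature map (N, C, H, W)
    targets = torch.randint(0, 751, (16,))    # identity labels

    head.train()
    pred_class_logits, global_feat = head(features, targets)  # scaled cosine logits

    head.eval()
    bn_feat = head(features)                  # inference: bnneck feature only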