Yixiao Fang 63d9f27fde
[Refactor] Add necks, heads and losses for the self-supervised task. (#1376)
* add necks

* refactor linear neck

* rename simmim neck

* add heads

* add losses

* fix

* add unittest

* update

* update cae

* remove mim head

* update config
2023-02-28 10:05:00 +08:00

34 lines
971 B
Python

# Copyright (c) OpenMMLab. All rights reserved.
import torch
import torch.nn as nn
from mmengine.model import BaseModule
from mmpretrain.registry import MODELS
@MODELS.register_module()
class SimMIMLinearDecoder(BaseModule):
    """Linear Decoder For SimMIM pretraining.

    This neck reconstructs the original image from the shrunk feature map.
    A 1x1 convolution expands every spatial location to
    ``encoder_stride**2 * out_channels`` values, and a pixel-shuffle layer
    then rearranges those values into an ``encoder_stride`` times larger
    spatial grid with ``out_channels`` channels.

    Args:
        in_channels (int): Channel dimension of the feature map.
        encoder_stride (int): The total stride of the encoder. It is used
            as the upscale factor of the pixel-shuffle layer.
        out_channels (int): Channel dimension of the reconstructed image.
            Defaults to 3 (RGB), which matches the previous hard-coded
            behaviour.
    """

    def __init__(self,
                 in_channels: int,
                 encoder_stride: int,
                 out_channels: int = 3) -> None:
        super().__init__()
        # PixelShuffle(r) folds groups of r**2 channels into an r x r
        # spatial patch, so the convolution has to emit
        # r**2 * out_channels channels to end up with out_channels.
        self.decoder = nn.Sequential(
            nn.Conv2d(
                in_channels=in_channels,
                out_channels=encoder_stride**2 * out_channels,
                kernel_size=1),
            nn.PixelShuffle(encoder_stride),
        )

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        """Forward function.

        Args:
            x (torch.Tensor): The feature map to decode. Presumably of
                shape (N, in_channels, H, W) -- confirm against the caller.

        Returns:
            torch.Tensor: The output of the convolution followed by the
            pixel-shuffle layer; its spatial size is ``encoder_stride``
            times that of ``x``.
        """
        return self.decoder(x)