PaddleClas/ppcls/arch/backbone/base/theseus_layer.py

83 lines
3.1 KiB
Python
Raw Normal View History

2021-05-24 11:42:24 +08:00
from abc import ABC
from paddle import nn
import re
class Identity(nn.Layer):
    """Pass-through layer: ``forward`` hands back exactly what it receives."""

    def __init__(self):
        super().__init__()

    def forward(self, inputs):
        """Return ``inputs`` unchanged."""
        return inputs
2021-05-25 16:47:33 +08:00
class TheseusLayer(nn.Layer):
    """Base layer that can capture sub-layer outputs and rewrite its sub-layers.

    Features provided on top of ``nn.Layer``:

    * ``return_patterns`` / ``res_dict``: direct sub-layers whose
      ``full_name()`` matches one of the regex patterns get a forward
      post-hook that stores their output into the ``res_dict`` supplied to
      ``forward``.
    * ``stop_after``: replace every sub-layer that follows a named layer with
      ``Identity``.
    * ``replace_sub``: replace sub-layers whose name matches a pattern with
      the result of a user-supplied function.
    """

    def __init__(self, *args, return_patterns=None, **kwargs):
        """Set up result capturing.

        Args:
            *args: Accepted for subclass convenience; not used here.
            return_patterns: Optional iterable of regex patterns (or a single
                pattern string) selecting the direct sub-layers whose outputs
                should be recorded. Only sub-layers that already exist when
                this constructor runs can be matched.
            **kwargs: Accepted for subclass convenience; not used here.
        """
        super().__init__()
        # Dict that receives captured outputs during one forward pass;
        # ``None`` means capturing is currently off.
        self.res_dict = None
        # Drop the reference to the caller's dict once forward has finished.
        self.register_forward_post_hook(self._disconnect_res_dict_hook)
        if return_patterns is not None:
            self._update_res(return_patterns)

    def forward(self, *input, res_dict=None, **kwargs):
        """Remember ``res_dict`` so sub-layer hooks can write into it.

        This base implementation only stores ``res_dict`` (when given) and
        returns ``None``.
        """
        if res_dict is not None:
            self.res_dict = res_dict

    # stop doesn't work when stop layer has a parallel branch.
    def stop_after(self, stop_layer_name: str):
        """Replace every sub-layer after ``stop_layer_name`` with ``Identity``.

        Sub-layers are visited in registration order. Nested ``TheseusLayer``
        children are searched recursively; once the stop layer has been found
        (directly or inside a nested child), all following sub-layers at this
        level are replaced.

        Args:
            stop_layer_name: ``full_name()`` of the last layer to keep.

        Returns:
            bool: ``True`` if the stop layer was found, ``False`` otherwise.
        """
        after_stop = False
        for layer_i in self._sub_layers:
            if after_stop:
                self._sub_layers[layer_i] = Identity()
                continue
            sub_layer = self._sub_layers[layer_i]
            if sub_layer.full_name() == stop_layer_name:
                after_stop = True
                continue
            if isinstance(sub_layer, TheseusLayer):
                after_stop = sub_layer.stop_after(stop_layer_name)
        return after_stop

    def _update_res(self, return_layers):
        """Attach the output-saving hook to direct sub-layers matching a pattern.

        Args:
            return_layers: Iterable of regex patterns, a single pattern
                string, or ``None`` (no-op). Patterns are applied with
                ``re.match`` against each sub-layer's ``full_name()``.
        """
        if return_layers is None:
            return
        if isinstance(return_layers, str):
            # A bare string would otherwise be iterated character by character.
            return_layers = [return_layers]
        for sub_layer in self._sub_layers.values():
            layer_name = sub_layer.full_name()
            # Register at most once per layer, even if several patterns match.
            if any(re.match(pattern, layer_name) for pattern in return_layers):
                sub_layer.register_forward_post_hook(self._save_sub_res_hook)

    def _save_sub_res_hook(self, layer, input, output):
        """Forward post-hook: store ``output`` under the sub-layer's full name."""
        if self.res_dict is not None:
            self.res_dict[layer.full_name()] = output

    def _disconnect_res_dict_hook(self, *hook_args):
        """Forward post-hook on this layer: forget the current ``res_dict``.

        Paddle invokes forward post-hooks as ``hook(layer, input, output)``.
        The arguments are not needed here, so they are accepted variadically;
        this also keeps the older two-argument call form working.
        """
        self.res_dict = None

    def replace_sub(self, layer_name_pattern, replace_function,
                    recursive=True):
        """Replace sub-layers whose name matches ``layer_name_pattern``.

        Args:
            layer_name_pattern: Regex applied with ``re.match`` to each direct
                sub-layer's ``full_name()``.
            replace_function: Callable that takes the matched layer and
                returns its replacement.
            recursive: If true, also descend into ``TheseusLayer`` children,
                and into ``TheseusLayer`` members of ``nn.Sequential`` /
                ``nn.LayerList`` children.
        """
        for layer_i in self._sub_layers:
            layer_name = self._sub_layers[layer_i].full_name()
            if re.match(layer_name_pattern, layer_name):
                self._sub_layers[layer_i] = replace_function(
                    self._sub_layers[layer_i])
            if not recursive:
                continue
            # Re-read the slot: it may hold the replacement created above.
            sub_layer = self._sub_layers[layer_i]
            if isinstance(sub_layer, TheseusLayer):
                sub_layer.replace_sub(layer_name_pattern, replace_function,
                                      recursive)
            elif isinstance(sub_layer, (nn.Sequential, nn.LayerList)):
                # NOTE(review): the container's direct members are not matched
                # against the pattern themselves, only searched recursively.
                for inner_layer in sub_layer._sub_layers.values():
                    # Plain nn.Layer members have no replace_sub; skip them
                    # instead of raising AttributeError.
                    if isinstance(inner_layer, TheseusLayer):
                        inner_layer.replace_sub(layer_name_pattern,
                                                replace_function, recursive)
2021-05-24 11:42:24 +08:00
'''
Example of a replace function:

def replace_conv(origin_conv: nn.Conv2D):
    new_conv = nn.Conv2D(
        in_channels=origin_conv._in_channels,
        out_channels=origin_conv._out_channels,
        kernel_size=origin_conv._kernel_size,
        stride=2
    )
    return new_conv
'''