2021-05-24 11:42:24 +08:00
|
|
|
from abc import ABC
|
|
|
|
from paddle import nn
|
|
|
|
import re
|
|
|
|
|
|
|
|
|
|
|
|
class Identity(nn.Layer):
    """Pass-through layer: ``forward`` hands its input back unchanged.

    ``TheseusLayer.stop_after`` installs instances of this class in place of
    the sub-layers that come after the requested stop layer.
    """

    def __init__(self):
        super().__init__()

    def forward(self, inputs):
        """Return ``inputs`` untouched."""
        return inputs
|
|
|
|
|
|
|
|
|
2021-05-25 16:47:33 +08:00
|
|
|
class TheseusLayer(nn.Layer):
    """Base layer whose direct sub-layers can be truncated, replaced, or
    tapped for their forward outputs.

    Attributes:
        res_dict: dict mapping a sub-layer's ``full_name()`` to the output
            saved by ``_save_sub_res_hook`` during forward.
    """

    def __init__(self, *args, **kwargs):
        # Extra arguments are accepted for subclass convenience but are not
        # forwarded to ``nn.Layer``.
        super(TheseusLayer, self).__init__()
        self.res_dict = {}

    # stop doesn't work when stop layer has a parallel branch.
    def stop_after(self, stop_layer_name: str) -> bool:
        """Replace every sub-layer after ``stop_layer_name`` with ``Identity``.

        Sub-layers are visited in registration order; nested ``TheseusLayer``
        children are searched recursively.

        Args:
            stop_layer_name: ``full_name()`` of the last layer to keep.

        Returns:
            True if the stop layer was found in this layer's subtree.
        """
        after_stop = False
        for key in self._sub_layers:
            if after_stop:
                self._sub_layers[key] = Identity()
                continue
            sub_layer = self._sub_layers[key]
            if sub_layer.full_name() == stop_layer_name:
                after_stop = True
                continue
            if isinstance(sub_layer, TheseusLayer):
                after_stop = sub_layer.stop_after(stop_layer_name)
        return after_stop

    def update_res(self, return_patterns):
        """Arrange for matching sub-layers to save their outputs in ``res_dict``.

        Args:
            return_patterns: iterable of regex patterns, each tested with
                ``re.match`` against a sub-layer's ``full_name()``. Nothing
                happens when it is empty or None.
        """
        if not return_patterns or isinstance(self, WrapLayer):
            return
        for key in self._sub_layers:
            sub_layer = self._sub_layers[key]
            layer_name = sub_layer.full_name()

            if isinstance(sub_layer, (nn.Sequential, nn.LayerList)):
                # Containers are wrapped so that they gain ``update_res`` and
                # can descend into their own children.
                wrapped = wrap_theseus(sub_layer)
                self._sub_layers[key] = wrapped
                wrapped.res_dict = self.res_dict
                wrapped.update_res(return_patterns)
                continue

            # Match once, however many patterns hit, so the hook is never
            # registered more than once per call.
            if any(re.match(pattern, layer_name) for pattern in return_patterns):
                if not isinstance(sub_layer, TheseusLayer):
                    sub_layer = wrap_theseus(sub_layer)
                    self._sub_layers[key] = sub_layer
                sub_layer.register_forward_post_hook(
                    sub_layer._save_sub_res_hook)
                sub_layer.res_dict = self.res_dict

            if isinstance(sub_layer, TheseusLayer):
                # Share one result dict down the tree so that outputs saved by
                # nested layers are visible from this layer.
                sub_layer.res_dict = self.res_dict
                sub_layer.update_res(return_patterns)

    def _save_sub_res_hook(self, layer, input, output):
        """Forward post-hook: store ``output`` under ``layer.full_name()``."""
        if self.res_dict is not None:
            self.res_dict[layer.full_name()] = output

    def replace_sub(self, layer_name_pattern, replace_function, recursive=True):
        """Replace sub-layers whose ``full_name()`` matches a pattern.

        Args:
            layer_name_pattern: regex tested with ``re.match`` against each
                direct sub-layer's ``full_name()``.
            replace_function: callable taking the matched layer and returning
                its replacement.
            recursive: when True, also descend into ``TheseusLayer`` children
                and into ``TheseusLayer`` members of ``nn.Sequential`` /
                ``nn.LayerList`` children.

        Example of a replace function::

            def replace_conv(origin_conv: nn.Conv2D):
                new_conv = nn.Conv2D(
                    in_channels=origin_conv._in_channels,
                    out_channels=origin_conv._out_channels,
                    kernel_size=origin_conv._kernel_size,
                    stride=2
                )
                return new_conv
        """
        for key in self._sub_layers:
            if re.match(layer_name_pattern, self._sub_layers[key].full_name()):
                self._sub_layers[key] = replace_function(self._sub_layers[key])

            if not recursive:
                continue

            # Re-read the slot: it may now hold the replacement layer.
            sub_layer = self._sub_layers[key]
            if isinstance(sub_layer, TheseusLayer):
                sub_layer.replace_sub(
                    layer_name_pattern, replace_function, recursive)
            elif isinstance(sub_layer, (nn.Sequential, nn.LayerList)):
                for child in sub_layer._sub_layers.values():
                    # Plain paddle layers have no ``replace_sub``; calling it
                    # on them would raise AttributeError.
                    if isinstance(child, TheseusLayer):
                        child.replace_sub(
                            layer_name_pattern, replace_function, recursive)
|
2021-08-08 14:57:29 +08:00
|
|
|
|
|
|
|
|
|
|
|
class WrapLayer(TheseusLayer):
    """Adapter that gives an arbitrary layer the ``TheseusLayer`` interface.

    The wrapper reports the wrapped layer's ``full_name()`` as its own, so
    name-based pattern matching sees the original name.
    """

    def __init__(self, sub_layer):
        super(WrapLayer, self).__init__()
        self.sub_layer = sub_layer
        # Captured once at wrap time; returned by ``full_name``.
        self.name = sub_layer.full_name()

    def full_name(self):
        """Return the name of the wrapped layer recorded at construction."""
        return self.name

    def forward(self, *inputs, **kwargs):
        """Delegate the call to the wrapped layer."""
        return self.sub_layer(*inputs, **kwargs)

    def update_res(self, return_patterns):
        """Set up output capture for children of a wrapped container.

        Does nothing unless the wrapped layer is an ``nn.Sequential`` or
        ``nn.LayerList`` and ``return_patterns`` is non-empty.

        Args:
            return_patterns: iterable of regex patterns, each tested with
                ``re.match`` against a child's ``full_name()``.
        """
        container = self.sub_layer
        if not return_patterns or not isinstance(
                container, (nn.Sequential, nn.LayerList)):
            return

        children = container._sub_layers
        for key in children:
            child = children[key]
            if isinstance(child, (nn.Sequential, nn.LayerList)):
                # Nested containers are wrapped so the recursion below can
                # reach their members.
                child = wrap_theseus(child)
                children[key] = child

            layer_name = child.full_name()
            if any(re.match(pattern, layer_name) for pattern in return_patterns):
                child.res_dict = self.res_dict
                # Use this wrapper's hook: the child may be a plain paddle
                # layer without ``_save_sub_res_hook``. The hook stores the
                # output in ``self.res_dict`` under the child's name.
                child.register_forward_post_hook(self._save_sub_res_hook)

            if isinstance(child, TheseusLayer):
                # Share the result dict, then recurse exactly once.
                child.res_dict = self.res_dict
                child.update_res(return_patterns)
|
|
|
|
|
|
|
|
|
|
|
|
def wrap_theseus(sub_layer):
    """Return ``sub_layer`` wrapped in a new ``WrapLayer``."""
    return WrapLayer(sub_layer)
|