mmrazor/tools/model_converters/convert_ofa_ckpt.py

# Copyright (c) OpenMMLab. All rights reserved.
import argparse
from pathlib import Path

import torch


def parse_args():
    parser = argparse.ArgumentParser(
        description='Process a checkpoint to be published')
    parser.add_argument('checkpoint', help='input checkpoint filename')
    parser.add_argument('--depth', nargs='+', type=int, help='layer depth')
    parser.add_argument(
        '--inplace', action='store_true', help='replace origin ckpt')
    args = parser.parse_args()
    return args


def block2layer_index_convert(layer_depth):
    """Build index_table from OFA blocks to MMRazor layers."""
    index_table = dict()
    i = 0
    first_index = 1
    second_index = 0
    for k in layer_depth:
        for _ in range(k):
            index_table[str(i)] = str(first_index) + '.' + str(second_index)
            i += 1
            second_index += 1
        second_index = 0
        first_index += 1

    return index_table


def main():
    args = parse_args()
    checkpoint = torch.load(args.checkpoint, map_location='cpu')
    new_state_dict = dict()

    index_table = block2layer_index_convert(args.depth)

    for key, value in checkpoint['state_dict'].items():
        if 'blocks' in key:
            index = key.split('.')[1]
            new_key = key.replace('blocks.' + index,
                                  'layer' + index_table[index])
        else:
            new_key = key

        if 'mobile_inverted_conv' in new_key:
            new_key = new_key.replace('mobile_inverted_conv.', '')
        if 'depth_conv' in key:
            new_key = new_key.replace('depth_conv', 'depthwise_conv')
        if 'point_linear' in key:
            new_key = new_key.replace('point_linear', 'linear_conv')
        if 'inverted_bottleneck' in key:
            new_key = new_key.replace('inverted_bottleneck', 'expand_conv')
        if '.conv.conv' in new_key:
            new_key = new_key.replace('.conv.conv', '.conv')
        if '.bn.bn' in new_key:
            new_key = new_key.replace('.bn.bn', '.bn')

        if 'layer1.0.depthwise_conv.weight' in new_key:
            new_key = new_key.replace('layer1.0.depthwise_conv.weight',
                                      'layer1.0.depthwise_conv.conv.weight')
        if 'layer1.0.linear_conv.weight' in new_key:
            new_key = new_key.replace('layer1.0.linear_conv.weight',
                                      'layer1.0.linear_conv.conv.weight')

        if 'depthwise_conv.se.fc.reduce' in new_key:
            new_key = new_key.replace('depthwise_conv.se.fc.reduce',
                                      'se.conv1.conv')
        if 'depthwise_conv.se.fc.expand' in new_key:
            new_key = new_key.replace('depthwise_conv.se.fc.expand',
                                      'se.conv2.conv')

        if 'final_expand_layer' in new_key:
            new_key = new_key.replace('final_expand_layer',
                                      'last_conv.final_expand_layer')
        if 'feature_mix_layer' in new_key:
            new_key = new_key.replace('feature_mix_layer',
                                      'last_conv.feature_mix_layer')

        if '5to3_matrix' in new_key:
            new_key = new_key.replace('5to3_matrix', 'trans_matrix_5to3')
        if '7to5_matrix' in new_key:
            new_key = new_key.replace('7to5_matrix', 'trans_matrix_7to5')

        new_key = 'architecture.backbone.' + new_key

        if 'classifier.linear' in new_key:
            new_key = new_key.replace('classifier.linear', 'head.fc')
            new_key = new_key.replace('backbone.', '')

        new_state_dict[new_key] = value

    checkpoint['state_dict'] = new_state_dict
    if args.inplace:
        torch.save(checkpoint, args.checkpoint)
    else:
        ckpt_path = Path(args.checkpoint)
        ckpt_name = ckpt_path.stem
        ckpt_dir = ckpt_path.parent
        new_ckpt_path = ckpt_dir / f'{ckpt_name}_latest.pth'
        torch.save(checkpoint, new_ckpt_path)


if __name__ == '__main__':
    main()
[Feature] Add BigNAS algorithm (#219) * add calibrate-bn-statistics * add test calibrate-bn-statistics * fix mixins * fix mixins * fix mixin tests * remove slimmable channel mutable and refactor dynamic op * refact dynamic batch norm * add progressive dynamic conv2d * add center crop dynamic conv2d * refactor dynamic directory * refactor dynamic sequential * rename length to depth in dynamic sequential * add test for derived mutable * refactor dynamic op * refactor api of dynamic op * add derive mutable mixin * addbignas algorithm * refactor bignas structure * add input resizer * add input resizer to bignas * move input resizer from algorithm into classifier * remove compnents * add attentive mobilenet * delete json file * nearly(less 0.2) align inference accuracy with gml * move mutate seperated in bignas mobilenet backbone * add zero_init_residual * add set_dropout * set dropout in bignas algorithm * fix registry * add subnet yaml and nearly align inference accuracy with gml * add rsb config for bignas * remove base in config * add gml bignas config * convert to iter based * bignas forward and backward fly * fix merge conflict * fix dynamicseq bug * fix bug and refactor bignas * arrange configs of bignas * fix typo * refactor attentive_mobilenet * fix channel mismatch due to registion of DerivedMutable * update bignas & fix se channel mismatch * add AutoAugmentV2 & remove unness configs * fix lint * recover channel assertion in channel unit * fix a group bug * fix comments * add docstring * add norm in dynamic_embed * fix search loop & other minor changes * fix se expansion * minor change * add ut for bignas & attentive_mobilenet * fix ut * update bignas readme * rm unness ut & supplement get_placeholder * fix lint * fix ut * add subnet deployment in downstream tasks. * minor change * update ofa backbone * minor fix * Continued improvements of searchable backbone * minor change * drop ratio in backbone * fix comments * fix ci test * fix test * add dynamic shortcut UT * modify strategy to fit bignas * fix test * fix bug in neck * fix error * fix error * fix yaml * save subnet ckpt * merge autoslim_val/test_loop into subnet_val_loop * move calibrate_bn_mixin to utils * fix bugs and add docstring * clean code * fix register bug * clean code * update Co-authored-by: wangshiguang <wangshiguang@sensetime.com> Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> Co-authored-by: sunyue1 <sunyue1@sensetime.com> 2022-12-07 11:28:10 +08:00			`# Copyright (c) OpenMMLab. All rights reserved.`
			`import argparse`
			`from pathlib import Path`

			`import torch`


			`def parse_args():`
			`parser = argparse.ArgumentParser(`
			`description='Process a checkpoint to be published')`
			`parser.add_argument('checkpoint', help='input checkpoint filename')`
[Improvement] Adapt OFA series with SearchableMobileNetV3 (#385) * fix mutable bug in AttentiveMobileNetV3 * remove unness code * update ATTENTIVE_SUBNET_A0-A6.yaml with optimized names * unify the sampling usage in sandwich_rule-based NAS * use alias to export subnet * update OFA configs * fix attr bug * fix comments * update convert_supernet2subnet.py * correct the way to dump DerivedMutable * fix convert index bug * update OFA configs & models * fix dynamic2static * generalize convert_ofa_ckpt.py * update input_resizer * update README.md * fix ut * update export_fix_subnet * update _dynamic_to_static * update fix_subnet UT & minor fix bugs * fix ut * add new autoaug compared to attentivenas * clean * fix act * fix act_cfg * update fix_subnet * fix lint * add docstring Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> 2022-12-15 22:19:55 +08:00			`parser.add_argument('--depth', nargs='+', type=int, help='layer depth')`
[Feature] Add BigNAS algorithm (#219) * add calibrate-bn-statistics * add test calibrate-bn-statistics * fix mixins * fix mixins * fix mixin tests * remove slimmable channel mutable and refactor dynamic op * refact dynamic batch norm * add progressive dynamic conv2d * add center crop dynamic conv2d * refactor dynamic directory * refactor dynamic sequential * rename length to depth in dynamic sequential * add test for derived mutable * refactor dynamic op * refactor api of dynamic op * add derive mutable mixin * addbignas algorithm * refactor bignas structure * add input resizer * add input resizer to bignas * move input resizer from algorithm into classifier * remove compnents * add attentive mobilenet * delete json file * nearly(less 0.2) align inference accuracy with gml * move mutate seperated in bignas mobilenet backbone * add zero_init_residual * add set_dropout * set dropout in bignas algorithm * fix registry * add subnet yaml and nearly align inference accuracy with gml * add rsb config for bignas * remove base in config * add gml bignas config * convert to iter based * bignas forward and backward fly * fix merge conflict * fix dynamicseq bug * fix bug and refactor bignas * arrange configs of bignas * fix typo * refactor attentive_mobilenet * fix channel mismatch due to registion of DerivedMutable * update bignas & fix se channel mismatch * add AutoAugmentV2 & remove unness configs * fix lint * recover channel assertion in channel unit * fix a group bug * fix comments * add docstring * add norm in dynamic_embed * fix search loop & other minor changes * fix se expansion * minor change * add ut for bignas & attentive_mobilenet * fix ut * update bignas readme * rm unness ut & supplement get_placeholder * fix lint * fix ut * add subnet deployment in downstream tasks. * minor change * update ofa backbone * minor fix * Continued improvements of searchable backbone * minor change * drop ratio in backbone * fix comments * fix ci test * fix test * add dynamic shortcut UT * modify strategy to fit bignas * fix test * fix bug in neck * fix error * fix error * fix yaml * save subnet ckpt * merge autoslim_val/test_loop into subnet_val_loop * move calibrate_bn_mixin to utils * fix bugs and add docstring * clean code * fix register bug * clean code * update Co-authored-by: wangshiguang <wangshiguang@sensetime.com> Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> Co-authored-by: sunyue1 <sunyue1@sensetime.com> 2022-12-07 11:28:10 +08:00			`parser.add_argument(`
			`'--inplace', action='store_true', help='replace origin ckpt')`
			`args = parser.parse_args()`
			`return args`


[Improvement] Adapt OFA series with SearchableMobileNetV3 (#385) * fix mutable bug in AttentiveMobileNetV3 * remove unness code * update ATTENTIVE_SUBNET_A0-A6.yaml with optimized names * unify the sampling usage in sandwich_rule-based NAS * use alias to export subnet * update OFA configs * fix attr bug * fix comments * update convert_supernet2subnet.py * correct the way to dump DerivedMutable * fix convert index bug * update OFA configs & models * fix dynamic2static * generalize convert_ofa_ckpt.py * update input_resizer * update README.md * fix ut * update export_fix_subnet * update _dynamic_to_static * update fix_subnet UT & minor fix bugs * fix ut * add new autoaug compared to attentivenas * clean * fix act * fix act_cfg * update fix_subnet * fix lint * add docstring Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> 2022-12-15 22:19:55 +08:00			`def block2layer_index_convert(layer_depth):`
			`"""Build index_table from OFA blocks to MMRazor layers."""`
			`index_table = dict()`
			`i = 0`
			`first_index = 1`
			`second_index = 0`
			`for k in layer_depth:`
			`for _ in range(k):`
			`index_table[str(i)] = str(first_index) + '.' + str(second_index)`
			`i += 1`
			`second_index += 1`
			`second_index = 0`
			`first_index += 1`

			`return index_table`


[Feature] Add BigNAS algorithm (#219) * add calibrate-bn-statistics * add test calibrate-bn-statistics * fix mixins * fix mixins * fix mixin tests * remove slimmable channel mutable and refactor dynamic op * refact dynamic batch norm * add progressive dynamic conv2d * add center crop dynamic conv2d * refactor dynamic directory * refactor dynamic sequential * rename length to depth in dynamic sequential * add test for derived mutable * refactor dynamic op * refactor api of dynamic op * add derive mutable mixin * addbignas algorithm * refactor bignas structure * add input resizer * add input resizer to bignas * move input resizer from algorithm into classifier * remove compnents * add attentive mobilenet * delete json file * nearly(less 0.2) align inference accuracy with gml * move mutate seperated in bignas mobilenet backbone * add zero_init_residual * add set_dropout * set dropout in bignas algorithm * fix registry * add subnet yaml and nearly align inference accuracy with gml * add rsb config for bignas * remove base in config * add gml bignas config * convert to iter based * bignas forward and backward fly * fix merge conflict * fix dynamicseq bug * fix bug and refactor bignas * arrange configs of bignas * fix typo * refactor attentive_mobilenet * fix channel mismatch due to registion of DerivedMutable * update bignas & fix se channel mismatch * add AutoAugmentV2 & remove unness configs * fix lint * recover channel assertion in channel unit * fix a group bug * fix comments * add docstring * add norm in dynamic_embed * fix search loop & other minor changes * fix se expansion * minor change * add ut for bignas & attentive_mobilenet * fix ut * update bignas readme * rm unness ut & supplement get_placeholder * fix lint * fix ut * add subnet deployment in downstream tasks. * minor change * update ofa backbone * minor fix * Continued improvements of searchable backbone * minor change * drop ratio in backbone * fix comments * fix ci test * fix test * add dynamic shortcut UT * modify strategy to fit bignas * fix test * fix bug in neck * fix error * fix error * fix yaml * save subnet ckpt * merge autoslim_val/test_loop into subnet_val_loop * move calibrate_bn_mixin to utils * fix bugs and add docstring * clean code * fix register bug * clean code * update Co-authored-by: wangshiguang <wangshiguang@sensetime.com> Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> Co-authored-by: sunyue1 <sunyue1@sensetime.com> 2022-12-07 11:28:10 +08:00			`def main():`
			`args = parse_args()`
			`checkpoint = torch.load(args.checkpoint, map_location='cpu')`
			`new_state_dict = dict()`

[Improvement] Adapt OFA series with SearchableMobileNetV3 (#385) * fix mutable bug in AttentiveMobileNetV3 * remove unness code * update ATTENTIVE_SUBNET_A0-A6.yaml with optimized names * unify the sampling usage in sandwich_rule-based NAS * use alias to export subnet * update OFA configs * fix attr bug * fix comments * update convert_supernet2subnet.py * correct the way to dump DerivedMutable * fix convert index bug * update OFA configs & models * fix dynamic2static * generalize convert_ofa_ckpt.py * update input_resizer * update README.md * fix ut * update export_fix_subnet * update _dynamic_to_static * update fix_subnet UT & minor fix bugs * fix ut * add new autoaug compared to attentivenas * clean * fix act * fix act_cfg * update fix_subnet * fix lint * add docstring Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> 2022-12-15 22:19:55 +08:00			`index_table = block2layer_index_convert(args.depth)`

[Feature] Add BigNAS algorithm (#219) * add calibrate-bn-statistics * add test calibrate-bn-statistics * fix mixins * fix mixins * fix mixin tests * remove slimmable channel mutable and refactor dynamic op * refact dynamic batch norm * add progressive dynamic conv2d * add center crop dynamic conv2d * refactor dynamic directory * refactor dynamic sequential * rename length to depth in dynamic sequential * add test for derived mutable * refactor dynamic op * refactor api of dynamic op * add derive mutable mixin * addbignas algorithm * refactor bignas structure * add input resizer * add input resizer to bignas * move input resizer from algorithm into classifier * remove compnents * add attentive mobilenet * delete json file * nearly(less 0.2) align inference accuracy with gml * move mutate seperated in bignas mobilenet backbone * add zero_init_residual * add set_dropout * set dropout in bignas algorithm * fix registry * add subnet yaml and nearly align inference accuracy with gml * add rsb config for bignas * remove base in config * add gml bignas config * convert to iter based * bignas forward and backward fly * fix merge conflict * fix dynamicseq bug * fix bug and refactor bignas * arrange configs of bignas * fix typo * refactor attentive_mobilenet * fix channel mismatch due to registion of DerivedMutable * update bignas & fix se channel mismatch * add AutoAugmentV2 & remove unness configs * fix lint * recover channel assertion in channel unit * fix a group bug * fix comments * add docstring * add norm in dynamic_embed * fix search loop & other minor changes * fix se expansion * minor change * add ut for bignas & attentive_mobilenet * fix ut * update bignas readme * rm unness ut & supplement get_placeholder * fix lint * fix ut * add subnet deployment in downstream tasks. * minor change * update ofa backbone * minor fix * Continued improvements of searchable backbone * minor change * drop ratio in backbone * fix comments * fix ci test * fix test * add dynamic shortcut UT * modify strategy to fit bignas * fix test * fix bug in neck * fix error * fix error * fix yaml * save subnet ckpt * merge autoslim_val/test_loop into subnet_val_loop * move calibrate_bn_mixin to utils * fix bugs and add docstring * clean code * fix register bug * clean code * update Co-authored-by: wangshiguang <wangshiguang@sensetime.com> Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> Co-authored-by: sunyue1 <sunyue1@sensetime.com> 2022-12-07 11:28:10 +08:00			`for key, value in checkpoint['state_dict'].items():`
[Improvement] Adapt OFA series with SearchableMobileNetV3 (#385) * fix mutable bug in AttentiveMobileNetV3 * remove unness code * update ATTENTIVE_SUBNET_A0-A6.yaml with optimized names * unify the sampling usage in sandwich_rule-based NAS * use alias to export subnet * update OFA configs * fix attr bug * fix comments * update convert_supernet2subnet.py * correct the way to dump DerivedMutable * fix convert index bug * update OFA configs & models * fix dynamic2static * generalize convert_ofa_ckpt.py * update input_resizer * update README.md * fix ut * update export_fix_subnet * update _dynamic_to_static * update fix_subnet UT & minor fix bugs * fix ut * add new autoaug compared to attentivenas * clean * fix act * fix act_cfg * update fix_subnet * fix lint * add docstring Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> 2022-12-15 22:19:55 +08:00			`if 'blocks' in key:`
			`index = key.split('.')[1]`
			`new_key = key.replace('blocks.' + index,`
			`'layer' + index_table[index])`
[Feature] Add BigNAS algorithm (#219) * add calibrate-bn-statistics * add test calibrate-bn-statistics * fix mixins * fix mixins * fix mixin tests * remove slimmable channel mutable and refactor dynamic op * refact dynamic batch norm * add progressive dynamic conv2d * add center crop dynamic conv2d * refactor dynamic directory * refactor dynamic sequential * rename length to depth in dynamic sequential * add test for derived mutable * refactor dynamic op * refactor api of dynamic op * add derive mutable mixin * addbignas algorithm * refactor bignas structure * add input resizer * add input resizer to bignas * move input resizer from algorithm into classifier * remove compnents * add attentive mobilenet * delete json file * nearly(less 0.2) align inference accuracy with gml * move mutate seperated in bignas mobilenet backbone * add zero_init_residual * add set_dropout * set dropout in bignas algorithm * fix registry * add subnet yaml and nearly align inference accuracy with gml * add rsb config for bignas * remove base in config * add gml bignas config * convert to iter based * bignas forward and backward fly * fix merge conflict * fix dynamicseq bug * fix bug and refactor bignas * arrange configs of bignas * fix typo * refactor attentive_mobilenet * fix channel mismatch due to registion of DerivedMutable * update bignas & fix se channel mismatch * add AutoAugmentV2 & remove unness configs * fix lint * recover channel assertion in channel unit * fix a group bug * fix comments * add docstring * add norm in dynamic_embed * fix search loop & other minor changes * fix se expansion * minor change * add ut for bignas & attentive_mobilenet * fix ut * update bignas readme * rm unness ut & supplement get_placeholder * fix lint * fix ut * add subnet deployment in downstream tasks. * minor change * update ofa backbone * minor fix * Continued improvements of searchable backbone * minor change * drop ratio in backbone * fix comments * fix ci test * fix test * add dynamic shortcut UT * modify strategy to fit bignas * fix test * fix bug in neck * fix error * fix error * fix yaml * save subnet ckpt * merge autoslim_val/test_loop into subnet_val_loop * move calibrate_bn_mixin to utils * fix bugs and add docstring * clean code * fix register bug * clean code * update Co-authored-by: wangshiguang <wangshiguang@sensetime.com> Co-authored-by: gaoyang07 <1546308416@qq.com> Co-authored-by: aptsunny <aptsunny@tongji.edu.cn> Co-authored-by: sunyue1 <sunyue1@sensetime.com> 2022-12-07 11:28:10 +08:00			`else:`
			`new_key = key`

			`if 'mobile_inverted_conv' in new_key:`
			`new_key = new_key.replace('mobile_inverted_conv.', '')`
			`if 'depth_conv' in key:`
			`new_key = new_key.replace('depth_conv', 'depthwise_conv')`
			`if 'point_linear' in key:`
			`new_key = new_key.replace('point_linear', 'linear_conv')`
			`if 'inverted_bottleneck' in key:`
			`new_key = new_key.replace('inverted_bottleneck', 'expand_conv')`
			`if '.conv.conv' in new_key:`
			`new_key = new_key.replace('.conv.conv', '.conv')`
			`if '.bn.bn' in new_key:`
			`new_key = new_key.replace('.bn.bn', '.bn')`

			`if 'layer1.0.depthwise_conv.weight' in new_key:`
			`new_key = new_key.replace('layer1.0.depthwise_conv.weight',`
			`'layer1.0.depthwise_conv.conv.weight')`
			`if 'layer1.0.linear_conv.weight' in new_key:`
			`new_key = new_key.replace('layer1.0.linear_conv.weight',`
			`'layer1.0.linear_conv.conv.weight')`

			`if 'depthwise_conv.se.fc.reduce' in new_key:`
			`new_key = new_key.replace('depthwise_conv.se.fc.reduce',`
			`'se.conv1.conv')`
			`if 'depthwise_conv.se.fc.expand' in new_key:`
			`new_key = new_key.replace('depthwise_conv.se.fc.expand',`
			`'se.conv2.conv')`

			`if 'final_expand_layer' in new_key:`
			`new_key = new_key.replace('final_expand_layer',`
			`'last_conv.final_expand_layer')`
			`if 'feature_mix_layer' in new_key:`
			`new_key = new_key.replace('feature_mix_layer',`
			`'last_conv.feature_mix_layer')`

			`if '5to3_matrix' in new_key:`
			`new_key = new_key.replace('5to3_matrix', 'trans_matrix_5to3')`
			`if '7to5_matrix' in new_key:`
			`new_key = new_key.replace('7to5_matrix', 'trans_matrix_7to5')`

			`new_key = 'architecture.backbone.' + new_key`

			`if 'classifier.linear' in new_key:`
			`new_key = new_key.replace('classifier.linear', 'head.fc')`
			`new_key = new_key.replace('backbone.', '')`

			`new_state_dict[new_key] = value`

			`checkpoint['state_dict'] = new_state_dict`
			`if args.inplace:`
			`torch.save(checkpoint, args.checkpoint)`
			`else:`
			`ckpt_path = Path(args.checkpoint)`
			`ckpt_name = ckpt_path.stem`
			`ckpt_dir = ckpt_path.parent`
			`new_ckpt_path = ckpt_dir / f'{ckpt_name}_latest.pth'`
			`torch.save(checkpoint, new_ckpt_path)`


			`if __name__ == '__main__':`
			`main()`