mmclassification/tools/model_converters/levit2mmpretrain.py

# Copyright (c) OpenMMLab. All rights reserved.
import argparse
import os.path as osp
from collections import OrderedDict

import mmengine
import torch


def convert_levit(args, ckpt):
    new_ckpt = OrderedDict()
    stage = 0
    block = 0
    change = True
    for k, v in list(ckpt.items()):
        new_v = v
        if k.startswith('head_dist'):
            new_k = k.replace('head_dist.', 'head.head_dist.')
            new_k = new_k.replace('.l.', '.linear.')
            new_ckpt[new_k] = new_v
            continue
        elif k.startswith('head'):
            new_k = k.replace('head.', 'head.head.')
            new_k = new_k.replace('.l.', '.linear.')
            new_ckpt[new_k] = new_v
            continue
        elif k.startswith('patch_embed'):
            new_k = k.replace('patch_embed.',
                              'patch_embed.patch_embed.').replace(
                                  '.c.', '.conv.')
        elif k.startswith('blocks'):
            strs = k.split('.')
            # new_k = k.replace('.c.', '.').replace('.bn.', '.')
            new_k = k
            if '.m.' in k:
                new_k = new_k.replace('.m.0', '.m.linear1')
                new_k = new_k.replace('.m.2', '.m.linear2')
                new_k = new_k.replace('.m.', '.block.')
                change = True
            elif change:
                stage += 1
                block = int(strs[1])
                change = False
            new_k = new_k.replace(
                'blocks.%s.' % (strs[1]),
                'stages.%d.%d.' % (stage, int(strs[1]) - block))
            new_k = new_k.replace('.c.', '.linear.')
        else:
            new_k = k
        # print(new_k)
        new_k = 'backbone.' + new_k
        new_ckpt[new_k] = new_v

    return new_ckpt


def main():
    parser = argparse.ArgumentParser(
        description='Convert keys in timm pretrained vit models to '
        'MMPretrain style.')
    parser.add_argument('src', help='src model path or url')
    # The dst path must be a full path of the new checkpoint.
    parser.add_argument('dst', help='save path')
    args = parser.parse_args()

    checkpoint = torch.load(args.src, map_location='cpu')
    checkpoint = checkpoint['model']
    if 'state_dict' in checkpoint:
        # timm checkpoint
        state_dict = checkpoint['state_dict']
    else:
        state_dict = checkpoint

    weight = convert_levit(args, state_dict)
    mmengine.mkdir_or_exist(osp.dirname(args.dst))
    torch.save(weight, args.dst)


if __name__ == '__main__':
    main()
[Feature] Support LeViT backbone. (#1238) * 网络搭建完成、能正常推理 * 网络搭建完成、能正常推理 * 网络搭建完成、能正常推理 * 添加了模型转换未验证，配置文件但有无法运行 * 模型转换、结构验证完成，可以推理出正确答案 * 推理精度与原论文一致已完成转化 * 三个方法改为class 暂存 * 完成推理精度对齐误差0.04 * 暂时使用的levit2mmcls * 训练跑通，训练相关参数未对齐 * '训练相关参数对齐'参数' * '修复训练时验证导致模型结构改变无法复原问题' * '修复训练时验证导致模型结构改变无法复原问题' * '添加mixup和labelsmooth' * '配置文件补齐' * 添加模型转换 * 添加meta文件 * 添加meta文件 * 删除demo.py测试文件 * 添加模型README文件 * docs文件回滚 * model-index删除末行空格 * 更新模型metafile * 更新metafile * 更新metafile * 更新README和metafile * 更新模型README * 更新模型metafile * Delete the model class and get_LeViT_model methods in the mmcls.models.backone.levit file * Change the class name to Google Code Style * use arch to provide default architectures * use nn.Conv2d * mmcv.cnn.fuse_conv_bn * modify some details * remove down_ops from the architectures. * remove init_weight function * Modify ambiguous variable names * Change the drop_path in config to drop_path_rate * Add unit test * remove train function * add unit test * modify nn.norm1d to build_norm_layer * update metafile and readme * Update configs and LeViT implementations. * Update README. * Add docstring and update unit tests. * Revert irrelative modification. * Fix unit tests * minor fix Co-authored-by: mzr1996 <mzr1996@163.com> 2023-01-17 17:43:42 +08:00			`# Copyright (c) OpenMMLab. All rights reserved.`
			`import argparse`
			`import os.path as osp`
			`from collections import OrderedDict`

			`import mmengine`
			`import torch`


			`def convert_levit(args, ckpt):`
			`new_ckpt = OrderedDict()`
			`stage = 0`
			`block = 0`
			`change = True`
			`for k, v in list(ckpt.items()):`
			`new_v = v`
			`if k.startswith('head_dist'):`
			`new_k = k.replace('head_dist.', 'head.head_dist.')`
			`new_k = new_k.replace('.l.', '.linear.')`
			`new_ckpt[new_k] = new_v`
			`continue`
			`elif k.startswith('head'):`
			`new_k = k.replace('head.', 'head.head.')`
			`new_k = new_k.replace('.l.', '.linear.')`
			`new_ckpt[new_k] = new_v`
			`continue`
			`elif k.startswith('patch_embed'):`
			`new_k = k.replace('patch_embed.',`
			`'patch_embed.patch_embed.').replace(`
			`'.c.', '.conv.')`
			`elif k.startswith('blocks'):`
			`strs = k.split('.')`
			`# new_k = k.replace('.c.', '.').replace('.bn.', '.')`
			`new_k = k`
			`if '.m.' in k:`
			`new_k = new_k.replace('.m.0', '.m.linear1')`
			`new_k = new_k.replace('.m.2', '.m.linear2')`
			`new_k = new_k.replace('.m.', '.block.')`
			`change = True`
			`elif change:`
			`stage += 1`
			`block = int(strs[1])`
			`change = False`
			`new_k = new_k.replace(`
			`'blocks.%s.' % (strs[1]),`
			`'stages.%d.%d.' % (stage, int(strs[1]) - block))`
			`new_k = new_k.replace('.c.', '.linear.')`
			`else:`
			`new_k = k`
			`# print(new_k)`
			`new_k = 'backbone.' + new_k`
			`new_ckpt[new_k] = new_v`

			`return new_ckpt`


			`def main():`
			`parser = argparse.ArgumentParser(`
			`description='Convert keys in timm pretrained vit models to '`
Rename the package name to `mmpretrain`. 2023-02-17 11:31:08 +08:00			`'MMPretrain style.')`
[Feature] Support LeViT backbone. (#1238) * 网络搭建完成、能正常推理 * 网络搭建完成、能正常推理 * 网络搭建完成、能正常推理 * 添加了模型转换未验证，配置文件但有无法运行 * 模型转换、结构验证完成，可以推理出正确答案 * 推理精度与原论文一致已完成转化 * 三个方法改为class 暂存 * 完成推理精度对齐误差0.04 * 暂时使用的levit2mmcls * 训练跑通，训练相关参数未对齐 * '训练相关参数对齐'参数' * '修复训练时验证导致模型结构改变无法复原问题' * '修复训练时验证导致模型结构改变无法复原问题' * '添加mixup和labelsmooth' * '配置文件补齐' * 添加模型转换 * 添加meta文件 * 添加meta文件 * 删除demo.py测试文件 * 添加模型README文件 * docs文件回滚 * model-index删除末行空格 * 更新模型metafile * 更新metafile * 更新metafile * 更新README和metafile * 更新模型README * 更新模型metafile * Delete the model class and get_LeViT_model methods in the mmcls.models.backone.levit file * Change the class name to Google Code Style * use arch to provide default architectures * use nn.Conv2d * mmcv.cnn.fuse_conv_bn * modify some details * remove down_ops from the architectures. * remove init_weight function * Modify ambiguous variable names * Change the drop_path in config to drop_path_rate * Add unit test * remove train function * add unit test * modify nn.norm1d to build_norm_layer * update metafile and readme * Update configs and LeViT implementations. * Update README. * Add docstring and update unit tests. * Revert irrelative modification. * Fix unit tests * minor fix Co-authored-by: mzr1996 <mzr1996@163.com> 2023-01-17 17:43:42 +08:00			`parser.add_argument('src', help='src model path or url')`
			`# The dst path must be a full path of the new checkpoint.`
			`parser.add_argument('dst', help='save path')`
			`args = parser.parse_args()`

			`checkpoint = torch.load(args.src, map_location='cpu')`
			`checkpoint = checkpoint['model']`
			`if 'state_dict' in checkpoint:`
			`# timm checkpoint`
			`state_dict = checkpoint['state_dict']`
			`else:`
			`state_dict = checkpoint`

			`weight = convert_levit(args, state_dict)`
			`mmengine.mkdir_or_exist(osp.dirname(args.dst))`
			`torch.save(weight, args.dst)`


			`if __name__ == '__main__':`
			`main()`