mmdeploy/tools/onnx2ncnn_quant_table.py

# Copyright (c) OpenMMLab. All rights reserved.
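"""Generate an ncnn int8 quantization table from an ONNX model.

Runs post-training quantization with ppq over a calibration dataloader built
either from a directory of images or from the dataset in the model config,
then exports the quantized graph and the quant table that ncnn consumes.
"""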
import argparse
import logging

from mmcv import Config

from mmdeploy.utils import Task, get_root_logger, get_task_type, load_config


def get_table(onnx_path: str,
              deploy_cfg: Config,
              model_cfg: Config,
              output_onnx_path: str,
              output_quant_table_path: str,
              image_dir: str = None,
              device: str = 'cuda',
              dataset_type: str = 'val'):
    input_shape = None
    # setup input_shape if it exists in `onnx_config`
    if 'onnx_config' in deploy_cfg and 'input_shape' in deploy_cfg.onnx_config:
        input_shape = deploy_cfg.onnx_config.input_shape

    # build calibration dataloader. If the image dir is not specified, use
    # the dataset from the model config (`val` split by default).
    if image_dir is not None:
        # `QuantizationImageDataset` is expected to live in
        # quant_image_dataset.py next to this script.
        from quant_image_dataset import QuantizationImageDataset
        from torch.utils.data import DataLoader

        dataset = QuantizationImageDataset(
            path=image_dir, deploy_cfg=deploy_cfg, model_cfg=model_cfg)
        dataloader = DataLoader(dataset, batch_size=1)
    else:
        from mmdeploy.apis.utils import build_task_processor
        task_processor = build_task_processor(model_cfg, deploy_cfg, device)
        dataset = task_processor.build_dataset(model_cfg, dataset_type)
        dataloader = task_processor.build_dataloader(dataset, 1, 1)

    # get an available input shape from the first batch. Super-resolution
    # datasets store the network input under 'lq' (low quality); other tasks
    # use 'img'.
    task = get_task_type(deploy_cfg)
    for _, input_data in enumerate(dataloader):
        if task != Task.SUPER_RESOLUTION:
            if isinstance(input_data['img'], list):
                input_shape = input_data['img'][0].shape
                collate_fn = lambda x: x['img'][0].to(device)  # noqa: E731
            else:
                input_shape = input_data['img'].shape
                collate_fn = lambda x: x['img'].to(device)  # noqa: E731
        else:
            if isinstance(input_data['lq'], list):
                input_shape = input_data['lq'][0].shape
                collate_fn = lambda x: x['lq'][0].to(device)  # noqa: E731
            else:
                input_shape = input_data['lq'].shape
                collate_fn = lambda x: x['lq'].to(device)  # noqa: E731
        break
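
    # ppq applies `collate_fn` to each batch drawn from the dataloader to
    # extract the input tensor and move it onto `device` during calibration.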

    from ppq import QuantizationSettingFactory, TargetPlatform
    from ppq.api import export_ppq_graph, quantize_onnx_model

    # settings for ncnn quantization
    quant_setting = QuantizationSettingFactory.default_setting()
    quant_setting.equalization = False
    quant_setting.dispatcher = 'conservative'

    # quantize the model
    quantized = quantize_onnx_model(
        onnx_import_file=onnx_path,
        calib_dataloader=dataloader,
        calib_steps=max(8, min(512, len(dataset))),
        input_shape=input_shape,
        setting=quant_setting,
        collate_fn=collate_fn,
        platform=TargetPlatform.NCNN_INT8,
        device=device,
        verbose=1)
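
    # In a typical ncnn int8 workflow the exported table is later fed to
    # ncnn's offline quantization tooling together with the converted model;
    # this script only produces the two artifacts.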

    # export quantized graph and quant table
    export_ppq_graph(
        graph=quantized,
        platform=TargetPlatform.NCNN_INT8,
        graph_save_to=output_onnx_path,
        config_save_to=output_quant_table_path)


def parse_args():
    parser = argparse.ArgumentParser(
        description='Generate ncnn quant table from ONNX.')
    parser.add_argument('--onnx', help='ONNX model path')
    parser.add_argument('--deploy-cfg', help='Input deploy config path')
    parser.add_argument('--model-cfg', help='Input model config path')
    parser.add_argument('--out-onnx', help='Output onnx path')
    parser.add_argument('--out-table', help='Output quant table path')
    parser.add_argument(
        '--image-dir',
        type=str,
        default=None,
        help='Calibration image directory.')
    parser.add_argument(
        '--log-level',
        help='set log level',
        default='INFO',
        choices=list(logging._nameToLevel.keys()))
    args = parser.parse_args()
    return args
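

# Example invocation (the file names below are illustrative, not shipped
# defaults):
#   python tools/onnx2ncnn_quant_table.py \
#       --onnx end2end.onnx \
#       --deploy-cfg configs/mmcls/classification_ncnn-int8_static.py \
#       --model-cfg resnet18_8xb32_in1k.py \
#       --out-onnx end2end_quant.onnx \
#       --out-table ncnn.table \
#       --image-dir ./calibration_images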


def main():
    args = parse_args()
    logger = get_root_logger(log_level=args.log_level)

    onnx_path = args.onnx
    deploy_cfg, model_cfg = load_config(args.deploy_cfg, args.model_cfg)
    quant_table_path = args.out_table
    quant_onnx_path = args.out_onnx
    image_dir = args.image_dir

    try:
        get_table(onnx_path, deploy_cfg, model_cfg, quant_onnx_path,
                  quant_table_path, image_dir)
        logger.info('onnx2ncnn_quant_table success.')
    except Exception as e:
        logger.error(e)
        logger.error('onnx2ncnn_quant_table failed.')


if __name__ == '__main__':
    main()