rewrite torch.cat for TensorRT when input is dynamic (#1851)
parent 847a906e6f
commit 8e2f6556be
@@ -2,6 +2,7 @@
 from . import adaptive_pool  # noqa: F401,F403
 from . import any  # noqa: F401,F403
 from . import atan2  # noqa: F401,F403
+from . import cat  # noqa: F401,F403
 from . import chunk  # noqa: F401,F403
 from . import clip  # noqa: F401,F403
 from . import expand  # noqa: F401,F403
@@ -0,0 +1,24 @@
+# Copyright (c) OpenMMLab. All rights reserved.
+from typing import Sequence
+
+import torch
+from torch import Tensor
+
+from mmdeploy.core import FUNCTION_REWRITER
+from mmdeploy.utils import get_dynamic_axes
+
+
+@FUNCTION_REWRITER.register_rewriter(func_name='torch.cat', backend='tensorrt')
+def cat__tensorrt(tensors: Sequence[Tensor], *args, **kwargs) -> torch.Tensor:
+    """Rewrite `cat` for TensorRT backend.
+
+    cat in TensorRT does not support bool or uint8 type when input is dynamic.
+    """
+    ctx = FUNCTION_REWRITER.get_context()
+    if get_dynamic_axes(ctx.cfg) is None:
+        return ctx.origin_func(tensors, *args, **kwargs)
+    if len(tensors) > 0 and (tensors[0].dtype in [torch.bool, torch.uint8]):
+        original_dtype = tensors[0].dtype
+        tensors = [i.to(torch.int32) for i in tensors]
+        return ctx.origin_func(tensors, *args, **kwargs).to(original_dtype)
+    return ctx.origin_func(tensors, *args, **kwargs)
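For reference, a standalone eager-mode sketch of the workaround the new rewriter applies (the helper name cat_bool_uint8_workaround is illustrative, not part of the patch): TensorRT's concat rejects bool/uint8 inputs when shapes are dynamic, so those tensors are concatenated as int32 and the result is cast back to the original dtype.

# Illustrative only: same dtype round-trip as cat__tensorrt, in plain PyTorch.
import torch

def cat_bool_uint8_workaround(tensors, dim=0):
    if len(tensors) > 0 and tensors[0].dtype in (torch.bool, torch.uint8):
        original_dtype = tensors[0].dtype
        # concatenate as int32, then restore the original dtype
        tensors = [t.to(torch.int32) for t in tensors]
        return torch.cat(tensors, dim).to(original_dtype)
    return torch.cat(tensors, dim)

# cat_bool_uint8_workaround([torch.zeros(2, 4, dtype=torch.bool)] * 2, -1)
# returns a bool tensor of shape (2, 8), matching eager torch.cat behaviour.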
@@ -19,10 +19,13 @@ deploy_cfg_ncnn = Config(
         codebase_config=dict(type='mmdet', task='ObjectDetection')))
 
 
-def get_trt_config(output_names, shape):
+def get_trt_config(output_names, shape, dynamic_axes=None):
     deploy_cfg_tensorrt = Config(
         dict(
-            onnx_config=dict(input_shape=None, output_names=output_names),
+            onnx_config=dict(
+                input_shape=None,
+                output_names=output_names,
+                dynamic_axes=dynamic_axes),
             backend_config=dict(
                 type='tensorrt',
                 common_config=dict(
@@ -615,3 +618,30 @@ def test_linspace__default():
 
     assert np.allclose(
         model_output, rewrite_outputs, rtol=1e-03, atol=1e-05)
+
+
+@backend_checker(Backend.TENSORRT)
+@pytest.mark.parametrize('dtype', [torch.bool, torch.float32])
+@pytest.mark.parametrize('dynamic_axes',
+                         [None, dict(input=dict({
+                             0: 'dim0',
+                             1: 'dim1'
+                         }))])
+def test_cat__tensorrt(dtype, dynamic_axes):
+    input = torch.rand(2, 4)
+    model = WrapFunction(lambda input: torch.cat(
+        [input.to(dtype), input.to(dtype)], -1))
+    pytorch_output = model(input)
+    rewrite_output, _ = get_rewrite_outputs(
+        model,
+        model_inputs={'input': input},
+        deploy_cfg=get_trt_config(['output'],
+                                  shape=[2, 4],
+                                  dynamic_axes=dynamic_axes),
+        run_with_backend=True)
+    assert pytorch_output.dtype == rewrite_output[0].dtype
+    assert torch.allclose(
+        pytorch_output.cpu().float(),
+        rewrite_output[0].cpu().float(),
+        rtol=1e-3,
+        atol=1e-5)
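The rewrite only takes effect when the deploy config declares dynamic axes; with dynamic_axes unset, get_dynamic_axes(ctx.cfg) returns None and the original torch.cat is called unchanged. A minimal onnx_config fragment matching the dynamic case exercised by test_cat__tensorrt above (the axis names dim0/dim1 are just the labels used in the test):

# Presence of dynamic_axes is what routes torch.cat through cat__tensorrt's
# int32 cast; omit it (or pass None) to fall back to the original torch.cat.
onnx_config = dict(
    input_shape=None,
    output_names=['output'],
    dynamic_axes=dict(input={0: 'dim0', 1: 'dim1'}))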