Cherry-pick #1439 to fix 'topk' on different devices for onnxruntime-gpu inference (#1603)

Co-authored-by: grimoire <yaoqian@sensetime.com>
This commit is contained in:
hanrui1sensetime 2023-01-04 23:10:19 +08:00 committed by GitHub
parent c67e2db68e
commit 8a05b8d62d
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@@ -28,7 +28,8 @@ def topk__dynamic(input: torch.Tensor,
     k = torch.tensor(k, device=input.device, dtype=torch.long)
     # Always keep topk op for dynamic input
     if isinstance(size, torch.Tensor):
-        size = size.to(input.device)
+        # size would be treated as cpu tensor, trick to avoid that.
+        size = k.new_zeros(()) + size
     k = torch.where(k < size, k, size)
     return ctx.origin_func(input, k, dim=dim, largest=largest, sorted=sorted)