[Enhance] Enable full precision training on Ascend NPU (#1109)
commit fed0e3821a
parent 6cd7a43a7f
--- a/mmengine/device/__init__.py
+++ b/mmengine/device/__init__.py
@@ -1,8 +1,10 @@
 # Copyright (c) OpenMMLab. All rights reserved.
 from .utils import (get_device, get_max_cuda_memory, is_cuda_available,
-                    is_mlu_available, is_mps_available, is_npu_available)
+                    is_mlu_available, is_mps_available, is_npu_available,
+                    is_npu_support_full_precision)
 
 __all__ = [
     'get_max_cuda_memory', 'get_device', 'is_cuda_available',
-    'is_mlu_available', 'is_mps_available', 'is_npu_available'
+    'is_mlu_available', 'is_mps_available', 'is_npu_available',
+    'is_npu_support_full_precision'
 ]
--- a/mmengine/device/utils.py
+++ b/mmengine/device/utils.py
@@ -6,6 +6,7 @@ import torch
 
 try:
     import torch_npu  # noqa: F401
+    import torch_npu.npu.utils as npu_utils
 
     # Enable operator support for dynamic shape and
     # binary operator support on the NPU.
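The new import is placed inside the existing try block so that installs without torch_npu continue to import cleanly. A minimal sketch of that guarded-import pattern follows; the IS_NPU_AVAILABLE fallback shown here is an assumption about the surrounding file, not a quote of it. The next hunk, in the same mmengine/device/utils.py, adds the helper that consumes npu_utils.

    import torch

    # Sketch of the guarded-import pattern (assumed surrounding logic):
    # torch_npu is optional, so probing it must not break CPU/GPU-only setups.
    try:
        import torch_npu  # noqa: F401
        import torch_npu.npu.utils as npu_utils  # consumed by the helper below
        IS_NPU_AVAILABLE = hasattr(torch, 'npu') and torch.npu.is_available()
    except Exception:
        IS_NPU_AVAILABLE = False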
@@ -62,6 +63,13 @@ def is_mps_available() -> bool:
     return hasattr(torch.backends, 'mps') and torch.backends.mps.is_available()
 
 
+def is_npu_support_full_precision() -> bool:
+    """Returns True if npu devices support full precision training."""
+    version_of_support_full_precision = 220
+    return IS_NPU_AVAILABLE and npu_utils.get_soc_version(
+    ) >= version_of_support_full_precision
+
+
 DEVICE = 'cpu'
 if is_npu_available():
     DEVICE = 'npu'
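For illustration, a hedged sketch of how the new helper might be used by downstream code. Only the 220 threshold comes from the commit; which concrete Ascend chips report which SoC numbers is not stated here and is left as an assumption.

    from mmengine.device import is_npu_available, is_npu_support_full_precision

    # npu_utils.get_soc_version() reports the Ascend SoC as an integer, and
    # the commit treats values >= 220 as full-precision capable.
    if is_npu_available() and not is_npu_support_full_precision():
        print('Older NPU SoC: mixed precision (AMP) is required.')
    else:
        print('Full precision training is supported on this device.')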
--- a/mmengine/optim/optimizer/builder.py
+++ b/mmengine/optim/optimizer/builder.py
@@ -7,7 +7,7 @@ import torch
 import torch.nn as nn
 
 from mmengine.config import Config, ConfigDict
-from mmengine.device import is_npu_available
+from mmengine.device import is_npu_available, is_npu_support_full_precision
 from mmengine.registry import OPTIM_WRAPPER_CONSTRUCTORS, OPTIMIZERS
 from .optimizer_wrapper import OptimWrapper
 
@@ -128,9 +128,9 @@ def build_optim_wrapper(model: nn.Module,
     paramwise_cfg = optim_wrapper_cfg.pop('paramwise_cfg', None)
 
     # Since the current generation of NPU(Ascend 910) only supports
-    # mixed precision training, here we turn on mixed precision by default
-    # on the NPU to make the training normal
-    if is_npu_available():
+    # mixed precision training, here we turn on mixed precision
+    # to make the training normal
+    if is_npu_available() and not is_npu_support_full_precision():
         optim_wrapper_cfg['type'] = 'AmpOptimWrapper'
 
     optim_wrapper_constructor = OPTIM_WRAPPER_CONSTRUCTORS.build(
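The net effect: an optimizer wrapper config is now coerced to AmpOptimWrapper only on NPUs that cannot train in full precision. A short usage sketch follows; the toy model and SGD settings are illustrative and not part of the commit.

    import torch.nn as nn
    from mmengine.optim import build_optim_wrapper

    model = nn.Linear(8, 4)  # toy model, illustrative only
    cfg = dict(
        type='OptimWrapper',
        optimizer=dict(type='SGD', lr=0.01, momentum=0.9))

    # On an NPU whose SoC supports full precision (or on CPU/GPU), the
    # requested OptimWrapper is kept; on older NPUs the builder overrides
    # the type to 'AmpOptimWrapper'.
    wrapper = build_optim_wrapper(model, cfg)
    print(type(wrapper).__name__)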