@@ -21,11 +21,6 @@
 
 aten = torch.ops.aten
 
-try:
-    import torch_npu
-except ImportError:
-    torch_npu = None
-
 
 class Int4PlainInt32TensorNPU(TorchAOBaseTensor):
     """
@@ -93,9 +88,6 @@ def from_hp(
         w: torch.Tensor,
         block_size: List[int],
     ):
-        if torch_npu is None:
-            raise ImportError("Requires torch_npu but it is not installed")
-
         assert w.ndim == 2 and w.device.type == "npu", (
            f"Expecting 2D tensor on NPU, but got: {w.shape} on {w.device.type}"
        )
@@ -143,7 +135,7 @@ def from_hp(
            f"torch_npu.npu_convert_weight_to_int4pack expects last dim must be aligned to 8,but got {int_data.shape[-1]}"
        )
 
-        packed_weight = torch_npu.npu_convert_weight_to_int4pack(
+        packed_weight = torch.ops.npu.npu_convert_weight_to_int4pack(
            int_data.contiguous(), 0
        )
 
@@ -174,9 +166,6 @@ def _(func, types, args, kwargs):
        args[2] if len(args) > 2 else None,
    )
 
-    if torch_npu is None:
-        raise ImportError("Requires torch_npu but it is not installed")
-
    assert input_tensor.device.type == "npu", (
        f"For NPU device only but got: {input_tensor.device.type}"
    )
@@ -219,7 +208,7 @@ def _(func, types, args, kwargs):
    # groupwise int4 quantization
    groupsize = weight_tensor.block_size[1]
 
-    y = torch_npu.npu_weight_quant_batchmatmul(
+    y = torch.ops.npu.npu_weight_quant_batchmatmul(
        x=act_mat,
        weight=packed_weight.contiguous().transpose(-1, -2),
        antiquant_scale=scale,
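For reference, a minimal sketch of the call-time op lookup this diff switches to. The helper name and the availability check below are illustrative assumptions, not part of the diff: the NPU custom op is resolved through torch.ops only when it is actually needed, so the module imports cleanly without torch_npu, while the call itself still requires torch_npu to have been imported and to have registered its operators.

import torch

def _convert_weight_to_int4pack(int_data: torch.Tensor) -> torch.Tensor:
    # Resolve the Ascend custom op lazily through the dispatcher; it only
    # exists once torch_npu has been imported and registered its ops.
    try:
        convert = torch.ops.npu.npu_convert_weight_to_int4pack
    except (AttributeError, RuntimeError) as err:
        raise ImportError(
            "torch.ops.npu.npu_convert_weight_to_int4pack is not registered; "
            "install and import torch_npu first"
        ) from err
    # Mirrors the call in the diff; the trailing 0 is passed through unchanged.
    return convert(int_data.contiguous(), 0)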