diff --git a/torch_npu/meta/_meta_registrations.py b/torch_npu/meta/_meta_registrations.py index dc245410ffe3579c54a89c214a010c15fae06a54..0fdad4db80f4c5cf6a8db3fd0a62075d464d8728 100644 --- a/torch_npu/meta/_meta_registrations.py +++ b/torch_npu/meta/_meta_registrations.py @@ -759,9 +759,11 @@ def npu_group_quant_meta(x, scale, group_index, *, offset=None, dst_dtype=None): return torch.empty_like(x, dtype=torch.int8) elif dst_dtype == torch.quint4x2: dim_num = x.dim() + if dim_num == 0: + raise RuntimeError("Input x can't be scalar" + ops_error(ErrCode.PARAM)) if x.size(dim_num - 1) % 8: - raise RuntimeError("If dst_dtype is quint4x2, last dim must be divisible by 8" + - ops_error(ErrCode.NOT_SUPPORT)) + raise RuntimeError("If dst_dtype is quint4x2, x last dim must be divisible by 8" + + ops_error(ErrCode.PARAM)) output_shape = [] for dim in range(dim_num - 1): output_shape.append(x.size(dim))