diff --git a/torch_npu/meta/_meta_registrations.py b/torch_npu/meta/_meta_registrations.py index 4c8bdebf73f8a0ac0266824d96633f4ab0f3dfea..487da245865003ad1d3f945865b02b7de9269fc9 100644 --- a/torch_npu/meta/_meta_registrations.py +++ b/torch_npu/meta/_meta_registrations.py @@ -636,9 +636,11 @@ def npu_group_quant_meta(x, scale, group_index, *, offset=None, dst_dtype=None): return torch.empty_like(x, dtype=torch.int8) elif dst_dtype == torch.quint4x2: dim_num = x.dim() + if dim_num == 0: + raise RuntimeError("Input x can't be scalar" + ops_error(ErrCode.PARAM)) if x.size(dim_num - 1) % 8: - raise RuntimeError("If dst_dtype is quint4x2, last dim must be divisible by 8" + - ops_error(ErrCode.NOT_SUPPORT)) + raise RuntimeError("If dst_dtype is quint4x2, x last dim must be divisible by 8" + + ops_error(ErrCode.PARAM)) output_shape = [] for dim in range(dim_num - 1): output_shape.append(x.size(dim))