diff --git a/src/kernels/kernels/elewise/quant/quant_tiling/quant_tiling.cpp b/src/kernels/kernels/elewise/quant/quant_tiling/quant_tiling.cpp index 7ebefcb5d31d1eba0b681df46b6fd6e9d8a075c7..5431f956c3562f4f205b0f288fc64d1ab82c4f32 100644 --- a/src/kernels/kernels/elewise/quant/quant_tiling/quant_tiling.cpp +++ b/src/kernels/kernels/elewise/quant/quant_tiling/quant_tiling.cpp @@ -33,6 +33,8 @@ Status QuantF16Tiling(const LaunchParam &launchParam, KernelInfo &kernelInfo) Status ret = PostLayerNormPtrFunc(tilingDataPtr, quantPtrCon, launchParam, kernelInfo); OP_TILING_CHECK_STATUS_RETURN(ret); int32_t scalarUsed = 256; + MKI_CHECK(quantPtrCon.numCol % 32 == 0, "last dim is not 32 bytes align", + return Status::FailStatus(ERROR_INVALID_VALUE, "last dim is not 32 bytes align")); // 32: 算子约束最后一维32字节对齐要求 MKI_CHECK(quantPtrCon.nlFirstdimPerCoreNum < (static_cast(std::numeric_limits::max()) / 2) / quantPtrCon.numCol, "numCol or nlFirstdimPerCoreNum is not invalid",