diff --git a/impl/matmul/matmul_impl.h b/impl/matmul/matmul_impl.h index 09d44c628e464b2ec1a91422f074e1733c7589ea..24e89bbc2348b4d4fb088161020a8520710b333b 100644 --- a/impl/matmul/matmul_impl.h +++ b/impl/matmul/matmul_impl.h @@ -7939,6 +7939,7 @@ __aicore__ inline void MatmulImpl bias; for (int k = 0; k < var.kIter_; k++) { // start reduce K axis var.baseUseK_ = ToMatmulConfig(MM_CFG).basicK; // Disassemble into main tail block. constexpr uint16_t blockUseK = ToMatmulConfig(MM_CFG).basicK / c0Size_; @@ -7958,7 +7959,6 @@ __aicore__ inline void MatmulImpl bias; if constexpr (A_TYPE::layout == LayoutMode::NONE || ToMatmulConfig(MM_CFG).batchMode == BatchMode::SINGLE_LARGE_THAN_L1) { bias = var.qidBias_.template DeQue(); @@ -7966,16 +7966,16 @@ __aicore__ inline void MatmulImpl