From bcb6c302ede533ca14da3651f89f8b379ae448b8 Mon Sep 17 00:00:00 2001 From: y30062407 Date: Wed, 18 Jun 2025 16:16:58 +0800 Subject: [PATCH] =?UTF-8?q?=E3=80=90mindspore=E3=80=91=E3=80=90bugfix?= =?UTF-8?q?=E3=80=91Fix=20error=20enabling=20moe-zerc=20+=20dualpipe=20in?= =?UTF-8?q?=20full=20recompute=20for=20deepseek=5Fv3?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- mindspeed_llm/mindspore/mindspore_adaptor.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/mindspeed_llm/mindspore/mindspore_adaptor.py b/mindspeed_llm/mindspore/mindspore_adaptor.py index cd3992a2b..55b90b723 100644 --- a/mindspeed_llm/mindspore/mindspore_adaptor.py +++ b/mindspeed_llm/mindspore/mindspore_adaptor.py @@ -190,10 +190,11 @@ class MindSporeAdaptation(MegatronAdaptationABC): MindSporeAdaptation.register('megatron.core.pipeline_parallel.schedules.forward_backward_pipelining_without_interleaving', forward_backward_pipelining_with_cutinhalf) - - from mindspeed.mindspore.core.pipeline_parallel.fb_overlap.transformer_layer import transformer_layer_backward - MindSporeAdaptation.register('mindspeed.core.pipeline_parallel.fb_overlap.transformer_layer.transformer_layer_backward', - transformer_layer_backward) + from mindspeed.mindspore.core.pipeline_parallel.fb_overlap.transformer_layer import \ + transformer_layer_recompute + MindSporeAdaptation.register( + 'mindspeed.core.pipeline_parallel.fb_overlap.transformer_layer.transformer_layer_recompute', + transformer_layer_recompute) from mindspeed.mindspore.core.pipeline_parallel.fb_overlap.transformer_block import transformer_block_forward, transformer_block_forward_backward_overlaping MindSporeAdaptation.register('mindspeed.core.pipeline_parallel.fb_overlap.transformer_block.transformer_block_forward', -- Gitee