From 67d74b5178104f4b2b53cc26518c7a0e83e0c793 Mon Sep 17 00:00:00 2001 From: YiYang <15594999221@163.com> Date: Thu, 26 Jun 2025 22:24:36 +0800 Subject: [PATCH] =?UTF-8?q?[Refactor][develop]=E5=B0=8FEP=E5=9C=BA?= =?UTF-8?q?=E6=99=AFgating=E6=A8=A1=E5=9D=97=E6=80=A7=E8=83=BD=E4=BC=98?= =?UTF-8?q?=E5=8C=96?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../models/mf_models/deepseekv3_weight_processor.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/vllm_mindspore/model_executor/models/mf_models/deepseekv3_weight_processor.py b/vllm_mindspore/model_executor/models/mf_models/deepseekv3_weight_processor.py index c63abe69..6e4d1e61 100644 --- a/vllm_mindspore/model_executor/models/mf_models/deepseekv3_weight_processor.py +++ b/vllm_mindspore/model_executor/models/mf_models/deepseekv3_weight_processor.py @@ -1140,6 +1140,14 @@ class DeepseekV3WeightProcessor(BaseWeightProcessor): router_dense_ms_name = self.convert_weight_name(router_dense_hf_name) router_dense_ms_param, _ = self.get_safetensor_from_file( router_dense_hf_name, src_hf_dir, hf_weight_map) + + if self.moe_split_ep and self.ep_method != EPMethod.ALLTOALL: + expert_idx = [idx for idx in range(router_dense_ms_param.shape[0])] + in_start_expert_idx = self.ep_group_nums * self.moe_ep_rank_id + expert_idx = expert_idx[ + in_start_expert_idx:] + expert_idx[:in_start_expert_idx] + router_dense_ms_param = np.array(router_dense_ms_param)[expert_idx] + self.parameter_dict[router_dense_ms_name] = ms.Parameter( ms.from_numpy(router_dense_ms_param).astype(ms.bfloat16), name=router_dense_ms_name, -- Gitee