diff --git a/tests/mindspore/st/st_run.sh b/tests/mindspore/st/st_run.sh index 57946854c1bc7a10a78e82f0398cf90896e47fbf..268aba5a61630c151813d9eb3f66fda0a117f5c3 100644 --- a/tests/mindspore/st/st_run.sh +++ b/tests/mindspore/st/st_run.sh @@ -21,12 +21,6 @@ rm -f "$ERROR_FLAG" # step 2: enable deterministic computation and insert modification points MindSpeed_LLM_PATH=$BASE_DIR/../../../../MindSpeed-LLM -Megatron_LM_PATH=$BASE_DIR/../../../../Megatron-LM -addbias() { - fname=$1 - lineNum=$(grep -n 'config.perform_initialization' ${fname} | cut -d: -f1) - sed -i $((lineNum))'i\ \ \ \ \ \ \ \ self.bias = torch.zeros((self.config.num_moe_experts), dtype=torch.bfloat16)' $fname -} addSeedAll() { fname=$1 lineNumMain=$(grep -n '__main__' ${fname} | cut -d: -f1) @@ -60,9 +54,6 @@ modifyTrainingLogs() { modifyTrainingLogs ${MindSpeed_LLM_PATH}/mindspeed_llm/training/training.py addSeedAll ${MindSpeed_LLM_PATH}/pretrain_gpt.py addSeedAll ${MindSpeed_LLM_PATH}/posttrain_gpt.py -sed -i 's/\ \ \ \ \ \ \ \ logits = F.linear(input, self.weight)/\ \ \ \ \ \ \ \ logits = F.linear(input, self.weight, self.bias)/g' ${MindSpeed_LLM_PATH}/mindspeed_llm/core/transformer/moe/router.py -addbias ${Megatron_LM_PATH}/megatron/core/transformer/moe/router.py -sed -i 's/ device=freqs.device, dtype=torch.float32/ dtype=torch.float32/g' ${MindSpeed_LLM_PATH}/mindspeed_llm/core/models/common/embeddings/rotary_pos_embedding.py export HCCL_DETERMINISTIC=true export ASCEND_LAUNCH_BLOCKING=1 export NCCL_DETERMINISTIC=1