diff --git a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_16p.sh b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_16p.sh index b358516d854ffd002b0b879011cb8823713d365d..b3d615854ef5b51bec3f5137ff5d06f20e7e331c 100644 --- a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_16p.sh +++ b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_16p.sh @@ -75,6 +75,8 @@ export ASCEND_SLOG_PRINT_TO_STDOUT=0 export ASCEND_GLOBAL_LOG_LEVEL=3 export PTCOPY_ENABLE=1 export TASK_QUEUE_ENABLE=1 +export COMBINED_ENABLE=1 +export SCALAR_TO_HOST_MEM=1 export DYNAMIC_OP="ADD#MUL" start_time=$(date +%s) NPUS=($(seq 0 7)) @@ -109,7 +111,7 @@ do --min-lr 0.0 \ --dropout 0.1 \ --weight-decay 0.0 \ - --criterion label_smoothed_cross_entropy \ + --criterion cross_entropy \ --label-smoothing 0.1 \ --max-sentences 128\ --max-tokens 102400 \ diff --git a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh index 71a10edeead5c15b9abe30d1cd7d3fdcb83147b7..ef46a3a63a22faa4caf5bedf189f562696cc9e72 100644 --- a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh +++ b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh @@ -64,6 +64,8 @@ export ASCEND_SLOG_PRINT_TO_STDOUT=0 export ASCEND_GLOBAL_LOG_LEVEL_ETP=3 export PTCOPY_ENABLE=1 export TASK_QUEUE_ENABLE=1 +export COMBINED_ENABLE=1 +export SCALAR_TO_HOST_MEM=1 export DYNAMIC_OP="ADD#MUL" start_time=$(date +%s) NPUS=($(seq 0 7)) @@ -96,7 +98,7 @@ do --min-lr 0.0 \ --dropout 0.1 \ --weight-decay 0.0 \ - --criterion label_smoothed_cross_entropy \ + --criterion cross_entropy \ --label-smoothing 0.1 \ --max-sentences 128\ --max-tokens 102400 \