diff --git a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_1p.sh b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_1p.sh index be569813bfd793d973ea794bbf292a32258461a2..c24ddbb326813374ec4869f955f766e799d2c0db 100644 --- a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_1p.sh +++ b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_1p.sh @@ -61,7 +61,9 @@ export ASCEND_SLOG_PRINT_TO_STDOUT=0 export ASCEND_GLOBAL_LOG_LEVEL_ETP=3 export PTCOPY_ENABLE=1 export TASK_QUEUE_ENABLE=1 -export DYNAMIC_OP="ADD#MUL" +#export DYNAMIC_OP="ADD#MUL" +export COMBINED_ENABLE=1 +export SCALAR_TO_HOST_MEM=1 start_time=$(date +%s) python3 -u train_1p.py \ $data_path \ @@ -80,7 +82,7 @@ python3 -u train_1p.py \ --min-lr 0.0 \ --dropout 0.1 \ --weight-decay 0.0 \ - --criterion label_smoothed_cross_entropy \ + --criterion cross_entropy \ --label-smoothing 0.1 \ --max-sentences 128\ --max-tokens 102400\ diff --git a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_8p.sh b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_8p.sh index 17208843fcb2540fb3a3eadd4db37b09d1e11945..72cd7550b92bba7717c8113d9f1c356018ddcf58 100644 --- a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_8p.sh +++ b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_full_8p.sh @@ -17,7 +17,13 @@ train_epochs=30 #训练batch_size,,需要模型审视修改 batch_size=128 - +export ASCEND_SLOG_PRINT_TO_STDOUT=0 +export ASCEND_GLOBAL_LOG_LEVEL_ETP=3 +export PTCOPY_ENABLE=1 +export TASK_QUEUE_ENABLE=1 +#export DYNAMIC_OP="ADD#MUL" +export COMBINED_ENABLE=1 +export SCALAR_TO_HOST_MEM=1 # 参数校验,data_path为必传参数,其他参数的增删由模型自身决定;此处新增参数需在上面有定义并赋值 for para in $* @@ -88,7 +94,7 @@ do --min-lr 0.0 \ --dropout 0.1 \ --weight-decay 0.0 \ - --criterion label_smoothed_cross_entropy \ + --criterion cross_entropy \ --label-smoothing 0.1 \ --max-sentences 128\ --max-tokens 102400 \ diff --git a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh index 71a10edeead5c15b9abe30d1cd7d3fdcb83147b7..8ab4566f18e36b74410f3abe52c68bbabe7182ab 100644 --- a/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh +++ b/PyTorch/dev/nlp/Transformer_ID0105_for_PyTorch/test/train_performance_8p.sh @@ -64,7 +64,9 @@ export ASCEND_SLOG_PRINT_TO_STDOUT=0 export ASCEND_GLOBAL_LOG_LEVEL_ETP=3 export PTCOPY_ENABLE=1 export TASK_QUEUE_ENABLE=1 -export DYNAMIC_OP="ADD#MUL" +#export DYNAMIC_OP="ADD#MUL" +export COMBINED_ENABLE=1 +export SCALAR_TO_HOST_MEM=1 start_time=$(date +%s) NPUS=($(seq 0 7)) export NPU_WORLD_SIZE=${#NPUS[@]} @@ -96,7 +98,7 @@ do --min-lr 0.0 \ --dropout 0.1 \ --weight-decay 0.0 \ - --criterion label_smoothed_cross_entropy \ + --criterion cross_entropy \ --label-smoothing 0.1 \ --max-sentences 128\ --max-tokens 102400 \