From 3f086adf86e79d7945b7ce6e43ea33baa6842e1f Mon Sep 17 00:00:00 2001 From: Ryan Date: Tue, 10 May 2022 13:55:56 +0800 Subject: [PATCH] =?UTF-8?q?=E4=BF=AE=E6=94=B9bert=E7=B3=BB=E5=88=978p?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .../test/train_ID1641_BertLarge-128_full_8p.sh | 4 ++-- .../test/train_ID1641_BertLarge-128_performance_8p.sh | 4 ++-- .../test/train_ID1642_BertLarge-128_full_8p.sh | 4 ++-- .../test/train_ID1642_BertLarge-128_performance_8p.sh | 4 ++-- .../test/train_ID1643_BertLarge-128_full_8p.sh | 4 ++-- .../test/train_ID1643_BertLarge-128_performance_8p.sh | 4 ++-- .../test/train_ID3232_BertBase-128_full_8p.sh | 4 ++-- .../test/train_ID3232_BertBase-128_performance_8p.sh | 4 ++-- .../test/train_ID3233_BertBase-128_full_8p.sh | 4 ++-- .../test/train_ID3233_BertBase-128_performance_8p.sh | 4 ++-- .../test/train_ID3234_BertBase-128_full_8p.sh | 4 ++-- .../test/train_ID3234_BertBase-128_performance_8p.sh | 4 ++-- 12 files changed, 24 insertions(+), 24 deletions(-) diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_full_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_full_8p.sh index 47c464bba..33ab18762 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_full_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_full_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_performance_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_performance_8p.sh index 5896c0930..91390a6b4 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_performance_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1641_BertLarge-128_performance_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_full_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_full_8p.sh index 815433976..981113eea 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_full_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_full_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_performance_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_performance_8p.sh index 44533e68c..cd444351f 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_performance_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1642_BertLarge-128_performance_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_full_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_full_8p.sh index a2cdedb05..4a455c4f9 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_full_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_full_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_performance_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_performance_8p.sh index acab05790..3f87a6f34 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_performance_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID1643_BertLarge-128_performance_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_full_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_full_8p.sh index be49ce9e5..08c291031 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_full_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_full_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_performance_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_performance_8p.sh index c88a324d7..cd8e00931 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_performance_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3232_BertBase-128_performance_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_full_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_full_8p.sh index 4362d42a9..6680bd3fd 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_full_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_full_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_performance_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_performance_8p.sh index 154cedd58..20f1a04e3 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_performance_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3233_BertBase-128_performance_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_full_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_full_8p.sh index 046dae77f..e24d1f7e4 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_full_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_full_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} diff --git a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_performance_8p.sh b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_performance_8p.sh index f1811c234..cdc579016 100644 --- a/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_performance_8p.sh +++ b/TensorFlow/built-in/nlp/BertNV_Series_for_TensorFlow/test/train_ID3234_BertBase-128_performance_8p.sh @@ -4,7 +4,7 @@ cur_path=`pwd` #集合通信参数,不需要修改 export RANK_SIZE=8 -export RANK_TABLE_FILE=#cur_path/../configs/${RANK_SIZE}p.json +export RANK_TABLE_FILE=$cur_path/../configs/${RANK_SIZE}p.json export JOB_ID=10087 export GE_USE_STATIC_MEMORY=1 export HCCL_CONNECT_TIMEOUT=600 @@ -139,7 +139,7 @@ cd $cur_path/../ for((RANK_ID=$RANK_ID_START;RANK_ID<$((RANK_SIZE+RANK_ID_START));RANK_ID++)); do #设置环境变量,不需要修改 - echo "Device ID: $ASCEND_DEVICE_ID" + echo "Device ID: $RANK_ID" export RANK_ID=$RANK_ID export ASCEND_DEVICE_ID=$RANK_ID ASCEND_DEVICE_ID=${ASCEND_DEVICE_ID} -- Gitee