From df6b43355018d127ef4f7eb1f71cbd9caf330076 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:17:34 +0000 Subject: [PATCH 1/9] update PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh. MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh b/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh index a3cbfa8e8d..1bd00cf0d1 100644 --- a/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh +++ b/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh @@ -11,7 +11,7 @@ if [ x"${cur_path_last_dirname}" == x"test" ];then else test_path_dir=${cur_path}/test fi - +export INF_NAN_MODE_ENABLE=1 #集合通信参数,不需要修改 export RANK_SIZE=1 -- Gitee From 99a5555f16f5276e39c79b7ae28a61ea245ba80d Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:18:05 +0000 Subject: [PATCH 2/9] update PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_full_8p.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../detection/YoloV3_ID1790_for_PyTorch/test/train_full_8p.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_full_8p.sh b/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_full_8p.sh index 2373e4cafa..2ba76aca4c 100644 --- a/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_full_8p.sh +++ b/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_full_8p.sh @@ -11,7 +11,7 @@ if [ x"${cur_path_last_dirname}" == x"test" ];then else test_path_dir=${cur_path}/test fi - +export INF_NAN_MODE_ENABLE=0 #集合通信参数,不需要修改 export RANK_SIZE=8 RANK_ID_START=0 -- Gitee From 2b33070dc71a4f981e4bc0e95299081c10898c9b Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:22:20 +0000 Subject: [PATCH 3/9] update PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh b/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh index 1bd00cf0d1..d2e5fda1bc 100644 --- a/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh +++ b/PyTorch/built-in/cv/detection/YoloV3_ID1790_for_PyTorch/test/train_performance_1p.sh @@ -11,7 +11,7 @@ if [ x"${cur_path_last_dirname}" == x"test" ];then else test_path_dir=${cur_path}/test fi -export INF_NAN_MODE_ENABLE=1 +export INF_NAN_MODE_ENABLE=0 #集合通信参数,不需要修改 export RANK_SIZE=1 -- Gitee From f22f2be7519e85b5bcc5a66e414c70fa714f095a Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:38:36 +0000 Subject: [PATCH 4/9] update train_ID4042_FairSeq_Transformer_RT2_full_1p.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../test/train_ID4042_FairSeq_Transformer_RT2_full_1p.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_1p.sh b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_1p.sh index 53e3f46a39..f146671e54 100644 --- a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_1p.sh +++ b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_1p.sh @@ -12,7 +12,8 @@ RANK_ID_START=0 #进入到conda环境 #source activate py8 - +#关闭inf/nan +export INF_NAN_MODE_ENABLE=0 # 数据集路径,保持为空,不需要修改 data_path="" -- Gitee From a22a52cfa0c8ee453b59b3c880099e0658e3aa1c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:39:09 +0000 Subject: [PATCH 5/9] update train_ID4042_FairSeq_Transformer_RT2_full_8p.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../test/train_ID4042_FairSeq_Transformer_RT2_full_8p.sh | 2 ++ 1 file changed, 2 insertions(+) diff --git a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_8p.sh b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_8p.sh index 3c485e3aa1..2d7c126b49 100644 --- a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_8p.sh +++ b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_full_8p.sh @@ -13,6 +13,8 @@ RANK_ID_START=0 #进入到conda环境 #source activate py8 +#关闭inf/nan +export INF_NAN_MODE_ENABLE=0 # 数据集路径,保持为空,不需要修改 -- Gitee From e71becdec6e76bcb992cb2fea017fadc51044b94 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:39:34 +0000 Subject: [PATCH 6/9] update train_ID4042_FairSeq_Transformer_RT2_performance_1p.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../train_ID4042_FairSeq_Transformer_RT2_performance_1p.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_1p.sh b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_1p.sh index 5882fe122f..08c8bcfcc1 100644 --- a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_1p.sh +++ b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_1p.sh @@ -12,7 +12,8 @@ RANK_ID_START=0 #进入到conda环境 #source activate py8 - +#关闭inf/nan +export INF_NAN_MODE_ENABLE=0 # 数据集路径,保持为空,不需要修改 data_path="" -- Gitee From 5aefeb5330ee3759016176ce7b89f7a62e3ae902 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:39:59 +0000 Subject: [PATCH 7/9] update train_ID4042_FairSeq_Transformer_RT2_performance_8p.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../test/train_ID4042_FairSeq_Transformer_RT2_performance_8p.sh | 2 ++ 1 file changed, 2 insertions(+) diff --git a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_8p.sh b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_8p.sh index 0d2d3394cb..a28c410e10 100644 --- a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_8p.sh +++ b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_ID4042_FairSeq_Transformer_RT2_performance_8p.sh @@ -14,6 +14,8 @@ RANK_ID_START=0 #进入到conda环境 #source activate py8 +#关闭inf/nan +export INF_NAN_MODE_ENABLE=0 # 数据集路径,保持为空,不需要修改 -- Gitee From 0487f7df7f83c17ed456234caed234a3f6d663c0 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:40:27 +0000 Subject: [PATCH 8/9] update train_full_1p_bs512.sh. 
MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../test/train_full_1p_bs512.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_full_1p_bs512.sh b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_full_1p_bs512.sh index b06ea7b807..dc18efbe0b 100644 --- a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_full_1p_bs512.sh +++ b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_full_1p_bs512.sh @@ -13,7 +13,8 @@ RANK_ID_START=0 #进入到conda环境 #source activate py8 - +#关闭inf/nan +export INF_NAN_MODE_ENABLE=0 # 数据集路径,保持为空,不需要修改 data_path="" -- Gitee From be7d26aa7f343f17dc25de8a96bc86c31bfe4544 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E4=BF=8A=E8=BE=89?= <11181965+zhujunhui1@user.noreply.gitee.com> Date: Mon, 16 Oct 2023 09:40:58 +0000 Subject: [PATCH 9/9] update train_performance_1p_bs512.sh. MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: 朱俊辉 <11181965+zhujunhui1@user.noreply.gitee.com> --- .../test/train_performance_1p_bs512.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_performance_1p_bs512.sh b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_performance_1p_bs512.sh index 30d2968b5e..c054c342f9 100644 --- a/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_performance_1p_bs512.sh +++ b/PyTorch/dev/nlp/FairSeq_Transformer_ID0496_for_PyTorch/test/train_performance_1p_bs512.sh @@ -13,7 +13,8 @@ RANK_ID_START=0 #进入到conda环境 #source activate py8 - +#关闭inf/nan +export INF_NAN_MODE_ENABLE=0 # 数据集路径,保持为空,不需要修改 data_path="" -- Gitee