From 009ef1582a7ede3341445549d0739bd9168cb75a Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 01:15:04 +0000 Subject: [PATCH 01/12] =?UTF-8?q?update=20=20ResNet50=5FID0360=5Ffor=5FTen?= =?UTF-8?q?sorFlow2.X/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20?= =?UTF-8?q?=E5=8E=BB=E9=99=A4=E6=B3=A8=E9=87=8A?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 6c1b65fd7..095b0e3fc 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -200,7 +200,7 @@ echo "RankSize = ${RANK_SIZE}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName} echo "BatchSize = ${BatchSize}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "DeviceType = ${DeviceType}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "CaseName = ${CaseName}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -#echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainingTime = ${TrainingTime}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainAccuracy = ${train_accuracy}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "ActualLoss = ${ActualLoss}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -- Gitee From b48f2395d097a564f98a0d4a8a3252afb6889ad0 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 01:34:41 +0000 Subject: [PATCH 02/12] =?UTF-8?q?update=20ResNet50=5FID0360=5Ffor=5FTensor?= =?UTF-8?q?Flow2.X/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20?= =?UTF-8?q?=E6=96=B0=E5=A2=9Eprofiling=5Fresult=E7=BB=93=E6=9E=9C=E5=88=A4?= =?UTF-8?q?=E6=96=AD?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 095b0e3fc..9f61b9304 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -182,9 +182,9 @@ TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then - echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_resuit="True" else - echo "ActualFPS = " >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_resuit="False" fi @@ -195,7 +195,7 @@ grep train_loss $cur_path/output/$ASCEND_DEVICE_ID/train_$ASCEND_DEVICE_ID.log|g ActualLoss=`awk 'END {print}' $cur_path/output/$ASCEND_DEVICE_ID/train_${CaseName}_loss.txt` #关键信息打印到${CaseName}.log中,不需要修改 -echo "Network = ${Network}" > $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "Network = ${Network}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "RankSize = ${RANK_SIZE}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "BatchSize = ${BatchSize}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "DeviceType = ${DeviceType}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log @@ -205,6 +205,6 @@ echo "TrainingTime = ${TrainingTime}" >> $cur_path/output/$ASCEND_DEVICE_ID/${Ca echo "TrainAccuracy = ${train_accuracy}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "ActualLoss = ${ActualLoss}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "E2ETrainingTime = ${e2e_time}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log - +echo "profiling_result = ${profiling_result}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log sed -i "/AttributeError/d" $cur_path/output/${ASCEND_DEVICE_ID}/train_${ASCEND_DEVICE_ID}.log sed -i "/MLL/d" $cur_path/output/${ASCEND_DEVICE_ID}/train_${ASCEND_DEVICE_ID}.log \ No newline at end of file -- Gitee From 38db45ca9a80140cb17cae481353c5da9bf3dc2b Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 02:54:31 +0000 Subject: [PATCH 03/12] update /ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh. Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 9f61b9304..c0730c32e 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -182,9 +182,9 @@ TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then - profiling_resuit="True" + profiling_result="True" else - profiling_resuit="False" + profiling_result="False" fi -- Gitee From ad39eaa994ee2f46bc487a7ae23f368ccdb43c00 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 05:58:05 +0000 Subject: [PATCH 04/12] update ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh. Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 1 + 1 file changed, 1 insertion(+) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index c0730c32e..697e7daba 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -178,6 +178,7 @@ CaseName=${Network}_bs${BatchSize}_${RANK_SIZE}'p'_'profiling1'_'perf' ActualFPS=${FPS} #单迭代训练时长 TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` +sleep 5m op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static -- Gitee From 98c2071a25ef096a119fbbbeeb06e66f19e0b1d2 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 06:37:14 +0000 Subject: [PATCH 05/12] =?UTF-8?q?update=20ResNet50=5FID0360=5Ffor=5FTensor?= =?UTF-8?q?Flow2.X/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20?= =?UTF-8?q?=E4=BF=AE=E6=94=B9profiling=E5=88=A4=E5=AE=9A=E9=80=BB=E8=BE=91?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 21 +++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 697e7daba..13a9a203d 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -178,17 +178,26 @@ CaseName=${Network}_bs${BatchSize}_${RANK_SIZE}'p'_'profiling1'_'perf' ActualFPS=${FPS} #单迭代训练时长 TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` -sleep 5m -op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` -echo $op_static -if [ $op_static -eq 1 ]; then - profiling_result="True" +cur_path=`pwd` +if [ -d ${cur_path}/etp_output/profiling ];then + for((i=0;i<100;i++)); + do + op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` + echo $op_static + if [ $op_static -eq 1 ]; then + profiling_result="True" + break + else + sleep 10 + fi + done else - profiling_result="False" + profiling_result="False" fi + #从train_$ASCEND_DEVICE_ID.log提取Loss到train_${CaseName}_loss.txt中,需要根据模型审视 grep train_loss $cur_path/output/$ASCEND_DEVICE_ID/train_$ASCEND_DEVICE_ID.log|grep -v BatchTimestamp|awk '{print $10}'|sed 's/,//g'|sed '/^$/d' >> $cur_path/output/$ASCEND_DEVICE_ID/train_${CaseName}_loss.txt -- Gitee From 5cdd12d61d5a5becb1b98b1d04906ccdffff24c9 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 07:23:22 +0000 Subject: [PATCH 06/12] update ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh. Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 13a9a203d..844dbb2d7 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -179,7 +179,7 @@ ActualFPS=${FPS} #单迭代训练时长 TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` -cur_path=`pwd` + if [ -d ${cur_path}/etp_output/profiling ];then for((i=0;i<100;i++)); do -- Gitee From fa83d8a58651de6da98eb691e3c266a260f54646 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 08:34:07 +0000 Subject: [PATCH 07/12] =?UTF-8?q?update=20ResNet50=5FID0360=5Ffor=5FTensor?= =?UTF-8?q?Flow2.X/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20?= =?UTF-8?q?=E4=BF=AE=E6=94=B9?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 844dbb2d7..86cfb2f9a 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -178,18 +178,18 @@ CaseName=${Network}_bs${BatchSize}_${RANK_SIZE}'p'_'profiling1'_'perf' ActualFPS=${FPS} #单迭代训练时长 TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` - +profiling_result="False" if [ -d ${cur_path}/etp_output/profiling ];then for((i=0;i<100;i++)); do - op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` + op_static=echo $i`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then profiling_result="True" break else - sleep 10 + sleep 30 fi done else -- Gitee From 19693c2e4b5f701dee72900a432672d6c366677e Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 08:36:11 +0000 Subject: [PATCH 08/12] =?UTF-8?q?update=20=20/ResNet50=5FID0360=5Ffor=5FTe?= =?UTF-8?q?nsorFlow2.X/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20?= =?UTF-8?q?=E4=BF=AE=E6=94=B9?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 86cfb2f9a..0ae9181ca 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -183,7 +183,8 @@ profiling_result="False" if [ -d ${cur_path}/etp_output/profiling ];then for((i=0;i<100;i++)); do - op_static=echo $i`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` + echo $i + op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then profiling_result="True" -- Gitee From 4f41b5961894064af2c60ea3914d2494efd91cc2 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 09:24:17 +0000 Subject: [PATCH 09/12] =?UTF-8?q?update=20ResNet50=5FID0360=5Ffor=5FTensor?= =?UTF-8?q?Flow2.X/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20?= =?UTF-8?q?=E4=BF=AE=E6=94=B9profiling=E7=BB=B4=E6=B5=8B=E9=80=82=E9=85=8D?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 23 ++++++------------- 1 file changed, 7 insertions(+), 16 deletions(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh index 0ae9181ca..e2c324a69 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling1.sh @@ -178,27 +178,18 @@ CaseName=${Network}_bs${BatchSize}_${RANK_SIZE}'p'_'profiling1'_'perf' ActualFPS=${FPS} #单迭代训练时长 TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` -profiling_result="False" - -if [ -d ${cur_path}/etp_output/profiling ];then - for((i=0;i<100;i++)); - do - echo $i - op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` - echo $op_static - if [ $op_static -eq 1 ]; then - profiling_result="True" - break - else - sleep 30 - fi - done + +op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` +echo $op_static +if [ $op_static -eq 1 ]; then + profiling_result="True" else - profiling_result="False" + profiling_result="False" fi + #从train_$ASCEND_DEVICE_ID.log提取Loss到train_${CaseName}_loss.txt中,需要根据模型审视 grep train_loss $cur_path/output/$ASCEND_DEVICE_ID/train_$ASCEND_DEVICE_ID.log|grep -v BatchTimestamp|awk '{print $10}'|sed 's/,//g'|sed '/^$/d' >> $cur_path/output/$ASCEND_DEVICE_ID/train_${CaseName}_loss.txt -- Gitee From eb43e0a9fc077a52da7324e3bb311e6b445f9da8 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 09:27:38 +0000 Subject: [PATCH 10/12] =?UTF-8?q?update=20ResNet50=5FID0360=5Ffor=5FTensor?= =?UTF-8?q?Flow2.X/test/train=5Fperformance=5F1p=5Fprofiling2.sh.=20?= =?UTF-8?q?=E4=BF=AE=E6=94=B9profiling=E7=BB=B4=E6=B5=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling2.sh | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling2.sh b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling2.sh index dd07ca5fa..fc79b71f2 100644 --- a/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling2.sh +++ b/TensorFlow2/built-in/cv/image_classification/ResNet50_ID0360_for_TensorFlow2.X/test/train_performance_1p_profiling2.sh @@ -187,9 +187,9 @@ TrainingTime=`awk 'BEGIN{printf "%.2f\n",'${BatchSize}'*1000/'${FPS}'}'` op_static=`find $cur_path/../tensorflow/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then - echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_result="True" else - echo "ActualFPS = " >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_result="False" fi #从train_$ASCEND_DEVICE_ID.log提取Loss到train_${CaseName}_loss.txt中,需要根据模型审视 @@ -204,8 +204,9 @@ echo "RankSize = ${RANK_SIZE}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName} echo "BatchSize = ${BatchSize}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "DeviceType = ${DeviceType}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "CaseName = ${CaseName}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -#echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainingTime = ${TrainingTime}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "profiling_result = ${profiling_result}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainAccuracy = ${train_accuracy}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "ActualLoss = ${ActualLoss}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "E2ETrainingTime = ${e2e_time}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -- Gitee From ab7d2cd8f9dfed681a365c3ecc4daedfb73da6ce Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 09:33:35 +0000 Subject: [PATCH 11/12] =?UTF-8?q?update=20WideDeep=5FID2712=5Ffor=5FTensor?= =?UTF-8?q?Flow/test/train=5Fperformance=5F1p=5Fprofiling1.sh.=20=E4=BF=AE?= =?UTF-8?q?=E6=94=B9profiling=E5=88=A4=E5=AE=9A?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling1.sh | 8 +++++--- 1 file changed, 5 insertions(+), 3 deletions(-) diff --git a/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling1.sh b/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling1.sh index 27dacebd6..c798c77a3 100644 --- a/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling1.sh +++ b/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling1.sh @@ -145,10 +145,11 @@ echo "TrainingTime(ms/step) : $TrainingTime" op_static=`find ${cur_path}/etp_output/profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then - echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_result="True" else - echo "ActualFPS = " >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_result="False" fi + #从train_$ASCEND_DEVICE_ID.log提取Loss到train_${CaseName}_loss.txt中,需要根据模型审视 loss=`grep 'loss =' $cur_path/output/${ASCEND_DEVICE_ID}/train_${ASCEND_DEVICE_ID}.log | tr -d '\b\r' | awk -F' ' '{print $9}'|sed 's/,$//'` echo "${loss}"> $cur_path/output/$ASCEND_DEVICE_ID/train_${CaseName}_loss.txt @@ -162,7 +163,8 @@ echo "RankSize = ${RANK_SIZE}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName} echo "BatchSize = ${BatchSize}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "DeviceType = ${DeviceType}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "CaseName = ${CaseName}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -#echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "profiling_result = ${profiling_result}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainingTime = ${TrainingTime}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainAccuracy = ${train_accuracy}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "ActualLoss = ${ActualLoss}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -- Gitee From 7d6a0deca253e0f0dff184df46101e90e635ea23 Mon Sep 17 00:00:00 2001 From: yongchao1 <297389370@qq.com> Date: Fri, 26 Jul 2024 09:40:46 +0000 Subject: [PATCH 12/12] update WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling2.sh. Signed-off-by: yongchao1 <297389370@qq.com> --- .../test/train_performance_1p_profiling2.sh | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling2.sh b/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling2.sh index 6e91f09ec..d037b91ed 100644 --- a/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling2.sh +++ b/TensorFlow/built-in/recommendation/WideDeep_ID2712_for_TensorFlow/test/train_performance_1p_profiling2.sh @@ -151,9 +151,9 @@ echo "TrainingTime(ms/step) : $TrainingTime" op_static=`find ${cur_path}/../profiling/PROF*/mindstudio_profiler_output/ -name op_statistic*.csv | wc -l` echo $op_static if [ $op_static -eq 1 ]; then - echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_result="True" else - echo "ActualFPS = " >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log + profiling_result="False" fi #从train_$ASCEND_DEVICE_ID.log提取Loss到train_${CaseName}_loss.txt中,需要根据模型审视 loss=`grep 'loss =' $cur_path/output/${ASCEND_DEVICE_ID}/train_${ASCEND_DEVICE_ID}.log | tr -d '\b\r' | awk -F' ' '{print $9}'|sed 's/,$//'` @@ -168,7 +168,8 @@ echo "RankSize = ${RANK_SIZE}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName} echo "BatchSize = ${BatchSize}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "DeviceType = ${DeviceType}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "CaseName = ${CaseName}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -#echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "ActualFPS = ${ActualFPS}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log +echo "profiling_result = ${profiling_result}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainingTime = ${TrainingTime}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "TrainAccuracy = ${train_accuracy}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log echo "ActualLoss = ${ActualLoss}" >> $cur_path/output/$ASCEND_DEVICE_ID/${CaseName}.log -- Gitee