From 8566e01af97eb4a6234253962c6c6162b73d3c75 Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Thu, 7 Jul 2022 12:41:20 +0000
Subject: [PATCH 1/7] update
TensorFlow2/built-in/cv/image_classification/MNIST_ID2481_for_TensorFlow2.X/README.md.
---
.../MNIST_ID2481_for_TensorFlow2.X/README.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/TensorFlow2/built-in/cv/image_classification/MNIST_ID2481_for_TensorFlow2.X/README.md b/TensorFlow2/built-in/cv/image_classification/MNIST_ID2481_for_TensorFlow2.X/README.md
index 42959f171..837522b1a 100644
--- a/TensorFlow2/built-in/cv/image_classification/MNIST_ID2481_for_TensorFlow2.X/README.md
+++ b/TensorFlow2/built-in/cv/image_classification/MNIST_ID2481_for_TensorFlow2.X/README.md
@@ -94,7 +94,7 @@ pip3 install requirements.txt
## 数据集准备
-1. 用户需自行下载ml-1m训练数据集,应有如下结构
+1. 用户需自行下载MNIST训练数据集,应有如下结构
```
dataset/
├── mnist
--
Gitee
From 0f03b93b7f4941a60dba1a7281dc6d6edc49bb92 Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Fri, 8 Jul 2022 06:44:07 +0000
Subject: [PATCH 2/7] update
TensorFlow2/built-in/nlp/Word2vec_ID2350_for_TensorFlow2.X/README.md.
---
.../built-in/nlp/Word2vec_ID2350_for_TensorFlow2.X/README.md | 3 ++-
1 file changed, 2 insertions(+), 1 deletion(-)
diff --git a/TensorFlow2/built-in/nlp/Word2vec_ID2350_for_TensorFlow2.X/README.md b/TensorFlow2/built-in/nlp/Word2vec_ID2350_for_TensorFlow2.X/README.md
index 378741945..be1ce0246 100644
--- a/TensorFlow2/built-in/nlp/Word2vec_ID2350_for_TensorFlow2.X/README.md
+++ b/TensorFlow2/built-in/nlp/Word2vec_ID2350_for_TensorFlow2.X/README.md
@@ -32,7 +32,8 @@
## 简述
-本项目是基于TensorFlow2.X的文本分类任务,通过直接配置可以支持:TextCNN/TextRNN/TextRCNN/Transformer/Bert/Albert/DistilBert基本分类模型;TextCNN/TextRNN/TextRCNN/Transformer的token可选用词粒度/子粒度;Word2Vec特征增强后接TextCNN/TextRNN/TextRCNN/Transformer;支持Attention-TextCNN/TextRNN;FGM和PGD两种对抗方法的引入训练;对比学习方法R-drop引入;支持二分类和多分类,支持FocalLoss;保存为pb文件可供部署;项目代码支持交互式测试和批量测试。
+本项目是基于TensorFlow2.X的文本分类任务,使用Word2vec词向量训练模型进行文本分类。Word2vec是一种将词转化成向量的方法,其中包含两种算法,分别是skip-gram和CBOW,它们最大的区别是skip-gram是通过中心词去预测中心词周围的词,而CBOW是通过周围的词去预测中心词。
+
- 参考论文:
--
Gitee
From 0fcf419f8e22ba087704cb2f77f9016c9e731378 Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Tue, 12 Jul 2022 06:09:12 +0000
Subject: [PATCH 3/7] modify
---
.../test/train_full_1p_4096bs_dynamic_noeval.sh | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
index 632d4525f..e5e95a7b0 100644
--- a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
+++ b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
@@ -22,7 +22,7 @@ Network="Transformer_ID0633_for_TensorFlow2.X"
#训练batch_size
batch_size=4096
#训练step
-train_steps=400000
+train_steps=10000
#TF2.X独有,不需要修改
#export NPU_ENABLE_PERF=true
--
Gitee
From 0f1fee3679d97af592179ef9df6d2cb9fa9ddb35 Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Tue, 12 Jul 2022 06:30:54 +0000
Subject: [PATCH 4/7] modify
---
.../test/train_full_1p_4096bs_dynamic_noeval.sh | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
index e5e95a7b0..80074912a 100644
--- a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
+++ b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
@@ -120,7 +120,7 @@ do
--param_set=big \
--train_steps=${train_steps} \
--batch_size=${batch_size} \
- --steps_between_evals=10000 \
+ --steps_between_evals=1000 \
--max_length=64 \
--mode=train \
--decode_batch_size=32 \
--
Gitee
From dc5afe55d4b5dcb32e845175b2bf5cdd6bf2c32e Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Tue, 12 Jul 2022 07:56:31 +0000
Subject: [PATCH 5/7] modify
---
.../test/train_full_1p_4096bs_dynamic_noeval.sh | 7 ++++---
1 file changed, 4 insertions(+), 3 deletions(-)
diff --git a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
index 80074912a..4e00200ac 100644
--- a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
+++ b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
@@ -4,7 +4,8 @@
cur_path=`pwd`
#集合通信参数,不需要修改
-
+export DUMP_GE_GRAPH=2
+export DUMP_GRAPH_LEVEL=3
export RANK_SIZE=1
export JOB_ID=10087
export RANK_ID_START=0
@@ -30,7 +31,7 @@ train_steps=10000
#维测参数,precision_mode需要模型审视修改
precision_mode="allow_mix_precision"
#维持参数,以下不需要修改
-over_dump=False
+over_dump=True
data_dump_flag=False
data_dump_step="10"
profiling=False
@@ -120,7 +121,7 @@ do
--param_set=big \
--train_steps=${train_steps} \
--batch_size=${batch_size} \
- --steps_between_evals=1000 \
+ --steps_between_evals=10000 \
--max_length=64 \
--mode=train \
--decode_batch_size=32 \
--
Gitee
From 28567d282d9dfd26f67edceda0f590dbc8ce782a Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Tue, 12 Jul 2022 08:04:16 +0000
Subject: [PATCH 6/7] modify
---
.../test/train_full_1p_4096bs_dynamic_noeval.sh | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
index 4e00200ac..70e04b160 100644
--- a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
+++ b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
@@ -31,7 +31,7 @@ train_steps=10000
#维测参数,precision_mode需要模型审视修改
precision_mode="allow_mix_precision"
#维持参数,以下不需要修改
-over_dump=True
+over_dump=False
data_dump_flag=False
data_dump_step="10"
profiling=False
--
Gitee
From b6614ee98939cf6b3b09833f3178b1a58050961a Mon Sep 17 00:00:00 2001
From: jieliang cai <975092674@qq.com>
Date: Wed, 13 Jul 2022 06:11:32 +0000
Subject: [PATCH 7/7] modify
---
.../test/train_full_1p_4096bs_dynamic_noeval.sh | 6 +++---
1 file changed, 3 insertions(+), 3 deletions(-)
diff --git a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
index 70e04b160..1f48774f0 100644
--- a/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
+++ b/TensorFlow2/built-in/nlp/Transformer_ID0633_for_TensorFlow2.X/test/train_full_1p_4096bs_dynamic_noeval.sh
@@ -23,7 +23,7 @@ Network="Transformer_ID0633_for_TensorFlow2.X"
#训练batch_size
batch_size=4096
#训练step
-train_steps=10000
+train_steps=300
#TF2.X独有,不需要修改
#export NPU_ENABLE_PERF=true
@@ -121,7 +121,7 @@ do
--param_set=big \
--train_steps=${train_steps} \
--batch_size=${batch_size} \
- --steps_between_evals=10000 \
+ --steps_between_evals=100 \
--max_length=64 \
--mode=train \
--decode_batch_size=32 \
@@ -131,7 +131,7 @@ do
--dtype=fp16 \
--distribution_strategy='one_device' \
--enable_time_history=true \
- --log_steps=1000 \
+ --log_steps=100 \
--loss_scale='dynamic' \
--precision_mode=${precision_mode} \
--over_dump=${over_dump} \
--
Gitee