From 160f7494929684795acf0aeeb17c007049a3f45f Mon Sep 17 00:00:00 2001
From: wangxingzhen <wangxingzhen@huawei.com>
Date: Mon, 25 Apr 2022 14:44:26 +0800
Subject: [PATCH 1/3] augru: add seq_length input to DynamicAUGRUGrad and forward it from DynamicAUGRU

---
 tf_adapter/ops/aicore/npu_aicore_ops.cc                       | 1 +
 tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py | 2 ++
 tf_adapter/python/npu_bridge/estimator/npu_ops.py             | 1 +
 3 files changed, 4 insertions(+)

diff --git a/tf_adapter/ops/aicore/npu_aicore_ops.cc b/tf_adapter/ops/aicore/npu_aicore_ops.cc
index 9734c7ba7..353834228 100644
--- a/tf_adapter/ops/aicore/npu_aicore_ops.cc
+++ b/tf_adapter/ops/aicore/npu_aicore_ops.cc
@@ -226,6 +226,7 @@ REGISTER_OP("DynamicAUGRUGrad")
 .Input("reset: T")
 .Input("new: T")
 .Input("hidden_new: T")
+.Input("seq_length: int32")
 .Output("dw_input: T")
 .Output("dw_hidden: T")
 .Output("db_input: T")
diff --git a/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py b/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py
index 3804be9cd..ea1f57473 100644
--- a/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py
+++ b/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py
@@ -326,6 +326,8 @@ class DynamicAUGRU(_DynamicBasic):
         self._args["weight_att"] = weight_att
         self._args["bias_input"] = self._bias_input
         self._args["bias_hidden"] = self._bias_hidden
+        if seq_length is not None:
+            self._args["seq_length"] = seq_length
         return gen_npu_ops.dynamic_augru(**self._args)
 
 
diff --git a/tf_adapter/python/npu_bridge/estimator/npu_ops.py b/tf_adapter/python/npu_bridge/estimator/npu_ops.py
index 93a3b1803..5ca6effbc 100644
--- a/tf_adapter/python/npu_bridge/estimator/npu_ops.py
+++ b/tf_adapter/python/npu_bridge/estimator/npu_ops.py
@@ -272,6 +272,7 @@ def dynamic_augru_grad(op, dy, doutput_h, dupdate, dupdate_att, dreset, dnew, dh
                                                                                                      update, update_att,
                                                                                                      reset, new,
                                                                                                      hidden_new,
+                                                                                                     seq_length,
                                                                                                      direction=op.get_attr(
                                                                                                          "direction"),
                                                                                                      cell_depth=op.get_attr(
-- 
Gitee


From 456dce732e783d8b33d6f7c104cea6197b8f9738 Mon Sep 17 00:00:00 2001
From: wangxingzhen <wangxingzhen@huawei.com>
Date: Mon, 2 May 2022 09:22:28 +0800
Subject: [PATCH 2/3] augru/gru_v2 bugfix: pass doutput_h[-1] instead of doutput_h to the grad ops

---
 tf_adapter/python/npu_bridge/estimator/npu_ops.py | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/tf_adapter/python/npu_bridge/estimator/npu_ops.py b/tf_adapter/python/npu_bridge/estimator/npu_ops.py
index 5ca6effbc..8cbcbbd29 100644
--- a/tf_adapter/python/npu_bridge/estimator/npu_ops.py
+++ b/tf_adapter/python/npu_bridge/estimator/npu_ops.py
@@ -230,7 +230,8 @@ def dynamic_gru_v2_grad(op, dy, doutput_h, dupdate, dreset, dnew, dhidden_new):
     (y, output_h, update, reset, new, hidden_new) = op.outputs
     (dw_input, dw_hidden, db_input, db_hidden, dx, dh_prev) = gen_npu_ops.dynamic_gru_v2_grad(x, weight_input,
                                                                                               weight_hidden, y, init_h,
-                                                                                              output_h, dy, doutput_h,
+                                                                                              output_h, dy,
+                                                                                              doutput_h[-1],
                                                                                               update, reset, new,
                                                                                               hidden_new,
                                                                                               direction=op.get_attr(
@@ -268,7 +269,7 @@ def dynamic_augru_grad(op, dy, doutput_h, dupdate, dupdate_att, dreset, dnew, dh
                                                                                                      weight_hidden,
                                                                                                      weight_att, y,
                                                                                                      init_h, output_h,
-                                                                                                     dy, doutput_h,
+                                                                                                     dy, doutput_h[-1],
                                                                                                      update, update_att,
                                                                                                      reset, new,
                                                                                                      hidden_new,
-- 
Gitee


From 1339658a1ab241b84ade59194255379018cb8dff Mon Sep 17 00:00:00 2001
From: wangxingzhen <wangxingzhen@huawei.com>
Date: Fri, 6 May 2022 10:21:45 +0800
Subject: [PATCH 3/3] gru_v2: add seq_length input to DynamicGruV2Grad; st/ut testcase bugfix for the new int32 input

---
 tf_adapter/ops/aicore/npu_aicore_ops.cc       |   1 +
 .../estimator/npu/npu_dynamic_rnn.py          |   2 +
 .../python/npu_bridge/estimator/npu_ops.py    |   1 +
 .../testcase/dynamic_augru_grad_test.cc       |   5 +-
 .../testcase/dynamic_gruv2_grad_test.cc       |   5 +-
 .../testcase/dynamic_augru_grad_test.cc       | 104 +++++++++---------
 .../testcase/dynamic_gruv2_grad_test.cc       |   5 +-
 7 files changed, 64 insertions(+), 59 deletions(-)

diff --git a/tf_adapter/ops/aicore/npu_aicore_ops.cc b/tf_adapter/ops/aicore/npu_aicore_ops.cc
index 353834228..c72bf9c05 100644
--- a/tf_adapter/ops/aicore/npu_aicore_ops.cc
+++ b/tf_adapter/ops/aicore/npu_aicore_ops.cc
@@ -113,6 +113,7 @@ REGISTER_OP("DynamicGruV2Grad")
     .Input("reset: T")
     .Input("new: T")
     .Input("hidden_new: T")
+    .Input("seq_length: int32")
     .Output("dw_input: T")
     .Output("dw_hidden: T")
     .Output("db_input: T")
diff --git a/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py b/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py
index ea1f57473..5d17344ee 100644
--- a/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py
+++ b/tf_adapter/python/npu_bridge/estimator/npu/npu_dynamic_rnn.py
@@ -231,6 +231,8 @@ class DynamicGRUV2(_DynamicBasic):
         self._args["weight_hidden"] = self._gruv2_weight_hidden
         self._args["bias_input"] = self._bias_input
         self._args["bias_hidden"] = self._bias_hidden
+        if seq_length is not None:
+            self._args["seq_length"] = seq_length
         return gen_npu_ops.dynamic_gru_v2(**self._args)
 
 
diff --git a/tf_adapter/python/npu_bridge/estimator/npu_ops.py b/tf_adapter/python/npu_bridge/estimator/npu_ops.py
index 8cbcbbd29..907479c76 100644
--- a/tf_adapter/python/npu_bridge/estimator/npu_ops.py
+++ b/tf_adapter/python/npu_bridge/estimator/npu_ops.py
@@ -234,6 +234,7 @@ def dynamic_gru_v2_grad(op, dy, doutput_h, dupdate, dreset, dnew, dhidden_new):
                                                                                               doutput_h[-1],
                                                                                               update, reset, new,
                                                                                               hidden_new,
+                                                                                              seq_length,
                                                                                               direction=op.get_attr(
                                                                                                   "direction"),
                                                                                               cell_depth=op.get_attr(
diff --git a/tf_adapter/tests/st/kernels/testcase/dynamic_augru_grad_test.cc b/tf_adapter/tests/st/kernels/testcase/dynamic_augru_grad_test.cc
index 6cf752c5e..71febcbd1 100644
--- a/tf_adapter/tests/st/kernels/testcase/dynamic_augru_grad_test.cc
+++ b/tf_adapter/tests/st/kernels/testcase/dynamic_augru_grad_test.cc
@@ -29,7 +29,7 @@ FakeInputFunctor FakeInputStub(DataType dt) {
 TEST(DynamicAUGRUGradTest, TestDynamicAUGRUGrad) {
   DataTypeSlice input_types({DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
                              DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
-                             DT_FLOAT, DT_FLOAT});
+                             DT_FLOAT, DT_FLOAT, DT_INT32});
   MemoryTypeSlice input_memory_types;
   DataTypeSlice output_types(
       {DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT});
@@ -72,13 +72,14 @@ TEST(DynamicAUGRUGradOpTest, TestDynamicAUGRUGradShapeInference) {
                   .Input(FakeInputStub(DT_FLOAT))
                   .Input(FakeInputStub(DT_FLOAT))
                   .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_INT32))
                   .Finalize(&def));
   shape_inference::InferenceContext c(
       0, &def, op_def,
       {TShape({1, 16, 16}), TShape({16, 48}), TShape({16, 48}), TShape({1, 16}),
        TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
        TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
-       TShape({16, 16})},
+       TShape({16, 16}), TShape({16})},
       {}, {}, {});
   TF_CHECK_OK(reg->shape_inference_fn(&c));
 }
diff --git a/tf_adapter/tests/st/kernels/testcase/dynamic_gruv2_grad_test.cc b/tf_adapter/tests/st/kernels/testcase/dynamic_gruv2_grad_test.cc
index d53e4d0bc..b60069e51 100644
--- a/tf_adapter/tests/st/kernels/testcase/dynamic_gruv2_grad_test.cc
+++ b/tf_adapter/tests/st/kernels/testcase/dynamic_gruv2_grad_test.cc
@@ -29,7 +29,7 @@ FakeInputFunctor FakeInputStub(DataType dt) {
 TEST(DynamicGruV2GradTest, TestDynamicGruV2Grad) {
   DataTypeSlice input_types({DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
                              DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
-                             DT_FLOAT, DT_FLOAT});
+                             DT_FLOAT, DT_FLOAT, DT_INT32});
   MemoryTypeSlice input_memory_types;
   DataTypeSlice output_types(
       {DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT});
@@ -70,13 +70,14 @@ TEST(DynamicGruV2GradOpTest, TestDynamicGruV2GradShapeInference) {
                   .Input(FakeInputStub(DT_FLOAT))
                   .Input(FakeInputStub(DT_FLOAT))
                   .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_INT32))
                   .Finalize(&def));
   shape_inference::InferenceContext c(
       0, &def, op_def,
       {TShape({1, 16, 16}), TShape({16, 48}), TShape({16, 48}),
        TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
        TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
-       TShape({16, 16})},
+       TShape({16, 16}), TShape({16})},
       {}, {}, {});
   TF_CHECK_OK(reg->shape_inference_fn(&c));
 }
diff --git a/tf_adapter/tests/ut/kernels/testcase/dynamic_augru_grad_test.cc b/tf_adapter/tests/ut/kernels/testcase/dynamic_augru_grad_test.cc
index 7f9dcc4da..1cec26db5 100644
--- a/tf_adapter/tests/ut/kernels/testcase/dynamic_augru_grad_test.cc
+++ b/tf_adapter/tests/ut/kernels/testcase/dynamic_augru_grad_test.cc
@@ -27,60 +27,58 @@ FakeInputFunctor FakeInputStub(DataType dt) {
 }
 
 TEST(DynamicAUGRUGradTest, TestDynamicAUGRUGrad) {
-DataTypeSlice input_types({DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
-                           DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
-                           DT_FLOAT, DT_FLOAT});
-MemoryTypeSlice input_memory_types;
-DataTypeSlice output_types(
-    {DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT});
-MemoryTypeSlice output_memory_types;
-DeviceBase *device = new DeviceBase(Env::Default());
-NodeDef *node_def = new NodeDef();
-OpDef *op_def = new OpDef();
-OpKernelConstruction *context = new OpKernelConstruction(
-    DEVICE_CPU, device, nullptr, node_def, op_def, nullptr, input_types,
-    input_memory_types, output_types, output_memory_types, 1, nullptr);
-DynamicAUGRUGradOP<int> dynamic_augru_grad(context);
-OpKernelContext *ctx = nullptr;
-dynamic_augru_grad.Compute(ctx);
-dynamic_augru_grad.IsExpensive();
-delete device;
-delete node_def;
-delete op_def;
-delete context;
+  DataTypeSlice input_types({DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
+                             DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_INT32});
+  MemoryTypeSlice input_memory_types;
+  DataTypeSlice output_types({DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT});
+  MemoryTypeSlice output_memory_types;
+  DeviceBase *device = new DeviceBase(Env::Default());
+  NodeDef *node_def = new NodeDef();
+  OpDef *op_def = new OpDef();
+  OpKernelConstruction *context =
+      new OpKernelConstruction(DEVICE_CPU, device, nullptr, node_def, op_def, nullptr, input_types, input_memory_types,
+                               output_types, output_memory_types, 1, nullptr);
+  DynamicAUGRUGradOP<int> dynamic_augru_grad(context);
+  OpKernelContext *ctx = nullptr;
+  dynamic_augru_grad.Compute(ctx);
+  dynamic_augru_grad.IsExpensive();
+  delete device;
+  delete node_def;
+  delete op_def;
+  delete context;
 }
 
 TEST(DynamicAUGRUGradOpTest, TestDynamicAUGRUGradShapeInference) {
-const OpRegistrationData *reg;
-TF_CHECK_OK(OpRegistry::Global()->LookUp("DynamicAUGRUGrad", &reg));
-OpDef op_def = reg->op_def;
-NodeDef def;
-TF_CHECK_OK(NodeDefBuilder("dummy", &op_def)
-.Attr("T", DT_FLOAT)
-.Attr("direction", "BIDIRECTIONAL")
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Input(FakeInputStub(DT_FLOAT))
-.Finalize(&def));
-shape_inference::InferenceContext c(
-    0, &def, op_def,
-    {TShape({1, 16, 16}), TShape({16, 48}), TShape({16, 48}), TShape({1, 16}),
-     TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
-     TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
-     TShape({16, 16})},
-    {}, {}, {});
-TF_CHECK_OK(reg->shape_inference_fn(&c));
+  const OpRegistrationData *reg;
+  TF_CHECK_OK(OpRegistry::Global()->LookUp("DynamicAUGRUGrad", &reg));
+  OpDef op_def = reg->op_def;
+  NodeDef def;
+  TF_CHECK_OK(NodeDefBuilder("dummy", &op_def)
+                  .Attr("T", DT_FLOAT)
+                  .Attr("direction", "BIDIRECTIONAL")
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_INT32))
+                  .Finalize(&def));
+  shape_inference::InferenceContext c(0, &def, op_def,
+                                      {TShape({1, 16, 16}), TShape({16, 48}), TShape({16, 48}), TShape({1, 16}),
+                                       TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
+                                       TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
+                                       TShape({16, 16}), TShape({16, 16}), TShape({16})},
+                                      {}, {}, {});
+  TF_CHECK_OK(reg->shape_inference_fn(&c));
 }
-} // namespace
-} // namespace tensorflow
\ No newline at end of file
+}  // namespace
+}  // namespace tensorflow
\ No newline at end of file
diff --git a/tf_adapter/tests/ut/kernels/testcase/dynamic_gruv2_grad_test.cc b/tf_adapter/tests/ut/kernels/testcase/dynamic_gruv2_grad_test.cc
index d53e4d0bc..b60069e51 100644
--- a/tf_adapter/tests/ut/kernels/testcase/dynamic_gruv2_grad_test.cc
+++ b/tf_adapter/tests/ut/kernels/testcase/dynamic_gruv2_grad_test.cc
@@ -29,7 +29,7 @@ FakeInputFunctor FakeInputStub(DataType dt) {
 TEST(DynamicGruV2GradTest, TestDynamicGruV2Grad) {
   DataTypeSlice input_types({DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
                              DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT,
-                             DT_FLOAT, DT_FLOAT});
+                             DT_FLOAT, DT_FLOAT, DT_INT32});
   MemoryTypeSlice input_memory_types;
   DataTypeSlice output_types(
       {DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT, DT_FLOAT});
@@ -70,13 +70,14 @@ TEST(DynamicGruV2GradOpTest, TestDynamicGruV2GradShapeInference) {
                   .Input(FakeInputStub(DT_FLOAT))
                   .Input(FakeInputStub(DT_FLOAT))
                   .Input(FakeInputStub(DT_FLOAT))
+                  .Input(FakeInputStub(DT_INT32))
                   .Finalize(&def));
   shape_inference::InferenceContext c(
       0, &def, op_def,
       {TShape({1, 16, 16}), TShape({16, 48}), TShape({16, 48}),
        TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
        TShape({16, 16}), TShape({16, 16}), TShape({16, 16}), TShape({16, 16}),
-       TShape({16, 16})},
+       TShape({16, 16}), TShape({16})},
       {}, {}, {});
   TF_CHECK_OK(reg->shape_inference_fn(&c));
 }
-- 
Gitee