update gru grad op

test=develop

update gru grad op
test=develop
e10af895 · Qiao Longfei · 78ec7c0f · e10af895
隐藏空白更改
内联并排

Showing 1 changed file with 6 additions and 3 deletions

paddle/fluid/operators/gru_unit_op.h +6 -3

未找到文件。
--- a/paddle/fluid/operators/gru_unit_op.h
+++ b/paddle/fluid/operators/gru_unit_op.h
@@ -113,8 +113,7 @@ class GRUUnitKernel : public framework::OpKernel<T> {
    auto c = g.slice(c_offsets, extents);  // output candidate
    // calculate final output
-    bool origin_mode = context.Attr<bool>("origin_mode");
+    if (context.Attr<bool>("origin_mode")) {
-    if (origin_mode) {
      h.device(place) = c + u * (h_p - c);  // (1 - u) * c + u * h_p
    } else {
      h.device(place) = u * (c - h_p) + h_p;  // u * c + (1 - u) * h_p
@@ -218,7 +217,11 @@ class GRUUnitGradKernel : public framework::OpKernel<T> {
      T* hidden_prev_grad_data =
          hidden_prev_grad->mutable_data<T>(context.GetPlace());
      auto d_h_p = EigenMatrix<T>::From(*hidden_prev_grad);
-      d_h_p.device(place) = d_r_h_p * r + d_h * (u.constant(T(1)) - u);
+      if (context.Attr<bool>("origin_mode")) {
+        d_h_p.device(place) = d_r_h_p * (u.constant(T(1)) - u) + d_h * r;
+      } else {
+        d_h_p.device(place) = d_r_h_p * r + d_h * (u.constant(T(1)) - u);
+      }
      blas.GEMM(false, true, batch_size, frame_size, frame_size * 2, 1,
                gate_grad_data, frame_size * 3, weight_data, frame_size * 2, 1,
                hidden_prev_grad_data, frame_size);