From 6a82c5cf60d43b1c408831e9aa05662491375e96 Mon Sep 17 00:00:00 2001
From: miraiwk <miraiwk@gmail.com>
Date: Fri, 18 Sep 2020 19:39:17 +0800
Subject: [PATCH] update spectral norm

---
 paddle/fluid/operators/spectral_norm_op.cc    |  2 ++
 paddle/fluid/operators/spectral_norm_op.h     | 10 +++---
 python/paddle/fluid/dygraph/nn.py             | 26 +++++++++++++-
 python/paddle/fluid/layers/nn.py              |  4 ++-
 .../tests/unittests/test_spectral_norm_op.py  | 34 +++++++++++++++++++
 5 files changed, 68 insertions(+), 8 deletions(-)
diff --git a/paddle/fluid/operators/spectral_norm_op.cc b/paddle/fluid/operators/spectral_norm_op.cc
index 8e083fa05c7..8d486341b34 100644
--- a/paddle/fluid/operators/spectral_norm_op.cc
+++ b/paddle/fluid/operators/spectral_norm_op.cc
@@ -205,6 +205,8 @@ class SpectralNormGradOpMaker : public framework::SingleGradOpMaker<T> {
     op->SetInput("Weight", this->Input("Weight"));
     op->SetInput("U", this->Input("U"));
     op->SetInput("V", this->Input("V"));
+    op->SetInput("UOut", this->Output("UOut"));
+    op->SetInput("VOut", this->Output("VOut"));
 
     op->SetOutput(framework::GradVarName("Weight"), this->InputGrad("Weight"));
 
diff --git a/paddle/fluid/operators/spectral_norm_op.h b/paddle/fluid/operators/spectral_norm_op.h
index 15d637a495b..fa334942b13 100644
--- a/paddle/fluid/operators/spectral_norm_op.h
+++ b/paddle/fluid/operators/spectral_norm_op.h
@@ -64,6 +64,7 @@ template <typename DeviceContext, typename T>
 static inline void UpdateUandV(
     Tensor* u, Tensor* v, Tensor* weight, const int power_iters,
     const float eps, const framework::ExecutionContext& ctx) {
+  if (power_iters <= 0) return;
   auto& place = *ctx.template device_context<DeviceContext>().eigen_device();
   auto blas = math::GetBlas<DeviceContext, T>(ctx);
   auto u_t = EigenTensor<T, 2>::From(*u);
@@ -92,8 +93,7 @@ static inline void UpdateUandV(
 template <typename DeviceContext, typename T>
 static inline void CalcMatrixSigmaAndNormWeight(
     Tensor* sigma, const Tensor* u, const Tensor* v,
-    Tensor* weight, const int power_iters,
-    const float eps, const framework::ExecutionContext& ctx) {
+    Tensor* weight, const framework::ExecutionContext& ctx) {
   auto& place = *ctx.template device_context<DeviceContext>().eigen_device();
   auto blas = math::GetBlas<DeviceContext, T>(ctx);
   auto sigma_t = EigenTensor<T, 2>::From(*sigma);
@@ -168,7 +168,7 @@ class SpectralNormKernel : public framework::OpKernel<T> {
         power_iters, eps, ctx);
     CalcMatrixSigmaAndNormWeight<DeviceContext, T>(
         &sigma, &(u_out->Resize({h, 1})), &(v_out->Resize({w, 1})), &weight_mat,
-        power_iters, eps, ctx);
+        ctx);
 
     if (dim != 0) {
       std::vector<int> perm;
@@ -205,8 +205,6 @@ class SpectralNormGradKernel : public framework::OpKernel<T> {
     auto weight_grad = ctx.Output<Tensor>(framework::GradVarName("Weight"));
 
     int dim = ctx.Attr<int>("dim");
-    int power_iters = ctx.Attr<int>("power_iters");
-    float eps = ctx.Attr<float>("eps");
 
     const int h = u_out->dims()[0];
     const int w = v_out->dims()[0];
@@ -251,7 +249,7 @@ class SpectralNormGradKernel : public framework::OpKernel<T> {
 
     CalcMatrixSigmaAndNormWeight<DeviceContext, T>(
         &sigma, &(u_mat.Resize({h, 1})), &(v_mat.Resize({w, 1})), &weight_mat,
-        power_iters, eps, ctx);
+        ctx);
 
     Tensor uv;
     uv.mutable_data<T>({h, w}, ctx.GetPlace());
diff --git a/python/paddle/fluid/dygraph/nn.py b/python/paddle/fluid/dygraph/nn.py
index a14c3a81c12..fc76dbc216f 100644
--- a/python/paddle/fluid/dygraph/nn.py
+++ b/python/paddle/fluid/dygraph/nn.py
@@ -3031,6 +3031,7 @@ class SpectralNorm(layers.Layer):
         dim(int, optional): The index of dimension which should be permuted to the first before reshaping Input(Weight) to matrix, it should be set as 0 if Input(Weight) is the weight of fc layer, and should be set as 1 if Input(Weight) is the weight of conv layer. Default: 0.
         power_iters(int, optional): The number of power iterations to calculate spectral norm. Default: 1.
         eps(float, optional): The epsilon for numerical stability in calculating norms. Default: 1e-12.
+        fix_state(bool, optional): whether to update the two vectors `u` and `v`. Default: True.
         name (str, optional): The default value is None.  Normally there is no need for user to set this property.  For more information, please refer to :ref:`api_guide_Name` .
         dtype (str, optional): Data type, it can be "float32" or "float64". Default: "float32".
 
@@ -3055,10 +3056,12 @@ class SpectralNorm(layers.Layer):
                  dim=0,
                  power_iters=1,
                  eps=1e-12,
+                 fix_state=True,
                  dtype='float32'):
         super(SpectralNorm, self).__init__()
         self._power_iters = power_iters
         self._eps = eps
+        self._fix_state = fix_state
         self._dim = dim
         self._dtype = dtype
 
@@ -3080,10 +3083,31 @@ class SpectralNorm(layers.Layer):
             default_initializer=Normal(0., 1.))
         self.weight_v.stop_gradient = True
 
+        if fix_state:
+            self.out_weight_u = self.create_parameter(
+                attr=ParamAttr(),
+                shape=[h],
+                dtype=self._dtype,
+                default_initializer=Normal(0., 1.))
+            self.out_weight_u.stop_gradient = True
+
+            self.out_weight_v = self.create_parameter(
+                attr=ParamAttr(),
+                shape=[w],
+                dtype=self._dtype,
+                default_initializer=Normal(0., 1.))
+            self.out_weight_v.stop_gradient = True
+        else:
+            self.out_weight_u = self.weight_u
+            self.out_weight_v = self.weight_v
+
     def forward(self, weight):
         check_variable_and_dtype(weight, "weight", ['float32', 'float64'],
                                  'SpectralNorm')
-        inputs = {'Weight': weight, 'U': self.weight_u, 'V': self.weight_v}
+        inputs = {
+            'Weight': weight, 'U': self.weight_u, 'V': self.weight_v,
+            'UOut': self.out_weight_u, 'VOut': self.out_weight_v,
+        }
         out = self._helper.create_variable_for_type_inference(self._dtype)
         self._helper.append_op(
             type="spectral_norm",
diff --git a/python/paddle/fluid/layers/nn.py b/python/paddle/fluid/layers/nn.py
index 9313de8c64f..61a6b0ad994 100755
--- a/python/paddle/fluid/layers/nn.py
+++ b/python/paddle/fluid/layers/nn.py
@@ -3720,11 +3720,13 @@ def spectral_norm(weight, dim=0, power_iters=1, eps=1e-12, name=None):
 
     # create output
     out = helper.create_variable(dtype=dtype)
+    u_out = helper.create_variable(dtype=dtype)
+    v_out = helper.create_variable(dtype=dtype)
 
     helper.append_op(
         type="spectral_norm",
         inputs=inputs,
-        outputs={"Out": out, },
+        outputs={"Out": out, "UOut": u_out, "VOut": v_out},
         attrs={
             "dim": dim,
             "power_iters": power_iters,
diff --git a/python/paddle/fluid/tests/unittests/test_spectral_norm_op.py b/python/paddle/fluid/tests/unittests/test_spectral_norm_op.py
index 227ed1d2ff0..c080583cec0 100644
--- a/python/paddle/fluid/tests/unittests/test_spectral_norm_op.py
+++ b/python/paddle/fluid/tests/unittests/test_spectral_norm_op.py
@@ -132,6 +132,40 @@ class TestSpectralNormOp2(TestSpectralNormOp):
         self.fix_state = True
 
 
+class TestSpectralNormOpFixState(TestSpectralNormOpNoGrad):
+    def test_check_grad_ignore_uv(self):
+        self.check_grad(
+            ['Weight'],
+            'Out',
+            no_grad_set=set(["U", "V"]), )
+
+    def initTestCase(self):
+        self.weight_shape = (10, 12)
+        self.u_shape = (10, )
+        self.v_shape = (12, )
+        self.dim = 0
+        self.power_iters = 3
+        self.eps = 1e-12
+        self.fix_state = False
+
+
+class TestSpectralNormOpUpdateState(TestSpectralNormOpNoGrad):
+    def test_check_grad_ignore_uv(self):
+        self.check_grad(
+            ['Weight'],
+            'Out',
+            no_grad_set=set(["U", "V"]), )
+
+    def initTestCase(self):
+        self.weight_shape = (10, 12)
+        self.u_shape = (10, )
+        self.v_shape = (12, )
+        self.dim = 0
+        self.power_iters = 3
+        self.eps = 1e-12
+        self.fix_state = True
+
+
 class TestSpectralNormOpError(unittest.TestCase):
     def test_errors(self):
         with program_guard(Program(), Program()):
-- 
GitLab