From 02df634da2cda1a0cdb2c320da95e5f0ae63008e Mon Sep 17 00:00:00 2001
From: Megvii Engine Team <megengine@megvii.com>
Date: Wed, 3 Feb 2021 18:21:12 +0800
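Subject: [PATCH] fix(mge/quantization): set ``q_dict`` as an instance property

``Tensor.q_dict`` was a class-level dict, so by default all tensors
shared one object and writing ``x.q_dict["scale"]`` was visible on every
other tensor. It is now created lazily per instance on first access.
Tests are updated to assign with ``[...] =`` instead of ``set_value``.
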
GitOrigin-RevId: 2f32008aadd9d0302285fda8667f71cbfb9552b4
---
 .../python/megengine/quantization/observer.py |  2 +-
 imperative/python/megengine/tensor.py         | 10 ++-
 .../test/unit/core/test_serialization.py      | 14 ++--
 .../test/unit/functional/test_tensor.py       | 16 ++++
 .../test/unit/module/test_module_tensor.py    |  1 +
 .../test/unit/quantization/test_module.py     | 83 +++++++++++--------
 .../test/unit/quantization/test_quantize.py   | 23 +++--
 7 files changed, 93 insertions(+), 56 deletions(-)

diff --git a/imperative/python/megengine/quantization/observer.py b/imperative/python/megengine/quantization/observer.py
index 5d3c4ca9..8da70581 100644
--- a/imperative/python/megengine/quantization/observer.py
+++ b/imperative/python/megengine/quantization/observer.py
@@ -467,7 +467,7 @@ class PassiveObserver(Observer):
     @scale.setter
     def scale(self, value):
         assert value > 0
-        self.q_dict["scale"].set_value(value)
+        self.q_dict["scale"][...] = Tensor(value)
 
     def get_qparams(self):
         return self.q_dict
diff --git a/imperative/python/megengine/tensor.py b/imperative/python/megengine/tensor.py
index 3c7f909a..2da9c774 100644
--- a/imperative/python/megengine/tensor.py
+++ b/imperative/python/megengine/tensor.py
@@ -25,7 +25,7 @@ from .utils.deprecation import deprecated
 class Tensor(_Tensor, ArrayMethodMixin):
     grad = None
     dmap_callback = None
-    q_dict = {"mode": None, "scale": None, "zero_point": None}
+    _q_dict = None
 
     def __new__(cls, data, dtype=None, device=None, is_const=False, no_cache=False):
         if device is None:
@@ -70,6 +70,12 @@ class Tensor(_Tensor, ArrayMethodMixin):
     def dtype(self) -> np.dtype:
         return super().dtype
 
+    @property
+    def q_dict(self):
+        if self._q_dict is None:
+            self._q_dict = {"mode": None, "scale": None, "zero_point": None}
+        return self._q_dict
+
     def numpy(self) -> np.ndarray:
         return super().numpy()
 
@@ -135,7 +141,7 @@ class Tensor(_Tensor, ArrayMethodMixin):
         return state
 
     def __setstate__(self, state):
-        self.q_dict = state.pop("qdict")
+        self._q_dict = state.pop("qdict")
 
 
 tensor = Tensor
diff --git a/imperative/python/test/unit/core/test_serialization.py b/imperative/python/test/unit/core/test_serialization.py
index 0a974fac..72e79c5c 100644
--- a/imperative/python/test/unit/core/test_serialization.py
+++ b/imperative/python/test/unit/core/test_serialization.py
@@ -16,11 +16,6 @@ from megengine import Parameter, Tensor
 
 
 def test_tensor_serialization():
-    def tensor_eq(a, b):
-        assert a.dtype == b.dtype
-        assert a.device == b.device
-        np.testing.assert_equal(a.numpy(), b.numpy())
-
     with TemporaryFile() as f:
         data = np.random.randint(low=0, high=7, size=[233])
         a = Tensor(data, device="xpux", dtype=np.int32)
@@ -67,3 +62,12 @@ def test_tensor_serialization():
             assert "cpu0" in str(b.device)
             np.testing.assert_equal(a.numpy(), b.numpy())
             mge.set_default_device(device_org)
+
+    with TemporaryFile() as f:
+        a = Tensor(0)
+        a.q_dict["scale"] = Tensor(1.0)
+        pickle.dump(a, f)
+        f.seek(0)
+        b = pickle.load(f)
+        assert isinstance(b.q_dict["scale"], Tensor)
+        np.testing.assert_equal(b.q_dict["scale"].numpy(), 1.0)
diff --git a/imperative/python/test/unit/functional/test_tensor.py b/imperative/python/test/unit/functional/test_tensor.py
index b4039fc7..2703c67e 100644
--- a/imperative/python/test/unit/functional/test_tensor.py
+++ b/imperative/python/test/unit/functional/test_tensor.py
@@ -379,3 +379,19 @@ def test_copy_d2h():
 def test_copy_d2d():
     copy_test("gpu0", "gpu1")
     copy_test("gpu0:0", "gpu0:1")
+
+
+def test_q_dict():
+    x = tensor(1)
+    assert x.q_dict["scale"] is None
+    x.q_dict["scale"] = tensor(1.0)
+
+    y = tensor(1)
+    assert y.q_dict["scale"] is None
+    y.q_dict["scale"] = tensor(2.0)
+
+    assert x.q_dict["scale"].numpy() == 1.0
+    assert y.q_dict["scale"].numpy() == 2.0
+
+    z = x + y
+    assert z.q_dict["scale"] is None
diff --git a/imperative/python/test/unit/module/test_module_tensor.py b/imperative/python/test/unit/module/test_module_tensor.py
index bbc9698b..6f700ebc 100644
--- a/imperative/python/test/unit/module/test_module_tensor.py
+++ b/imperative/python/test/unit/module/test_module_tensor.py
@@ -17,6 +17,7 @@ from megengine import Parameter, Tensor
 from megengine.module import Conv2d
 
 
+# TODO: remove this test once ``set_value`` itself has been removed
 def test_set_value():
     v0 = np.random.random((2, 3)).astype(np.float32)
     param = Parameter(v0)
diff --git a/imperative/python/test/unit/quantization/test_module.py b/imperative/python/test/unit/quantization/test_module.py
index 0fa13082..12e0d27c 100644
--- a/imperative/python/test/unit/quantization/test_module.py
+++ b/imperative/python/test/unit/quantization/test_module.py
@@ -1,3 +1,5 @@
+from functools import partial
+
 import numpy as np
 import pytest
 
@@ -6,17 +8,21 @@ import megengine.functional as F
 import megengine.module as Float
 import megengine.module.qat as QAT
 import megengine.module.quantized as Q
+from megengine import Parameter, Tensor
 from megengine.core.tensor import dtype
-from megengine.quantization import min_max_fakequant_qconfig
+from megengine.quantization import FakeQuantize, MinMaxObserver, QConfig
 from megengine.quantization.quantize import (
     disable_fake_quant,
     disable_observer,
     propagate_qconfig,
 )
 
-"""
-Calculate testing scales based on ``min_max_fakequant_qconfig``
-"""
+min_max_fakequant_qconfig = QConfig(
+    weight_observer=partial(MinMaxObserver, dtype="qint8", narrow_range=True),
+    act_observer=partial(MinMaxObserver, dtype="qint8", narrow_range=False),
+    weight_fake_quant=partial(FakeQuantize, dtype="qint8", narrow_range=True),
+    act_fake_quant=partial(FakeQuantize, dtype="qint8", narrow_range=False),
+)
 
 inp_scale = np.float32(np.random.rand() + 1)
 
@@ -31,21 +37,26 @@ def quant(x, scale):
     return x.astype(inp_dtype)
 
 
-def fake_quant(x, scale):
+def fake_quant(x, scale, qmin, qmax):
     x = x / scale
     x = F.round(x)
-    x = F.clip(x, -128, 127)
+    x = F.clip(x, qmin, qmax)
     x = x * scale
     return x
 
 
+fake_quant_act = partial(fake_quant, qmin=-128, qmax=127)
+fake_quant_weight = partial(fake_quant, qmin=-127, qmax=127)
+fake_quant_bias = partial(fake_quant, qmin=-(2 ** 31), qmax=2 ** 31 - 1)
+
+
 def init_qat_net(net):
     if net.with_weight:
-        net.weight_observer.min_val.set_value(min_val[0])
-        net.weight_observer.max_val.set_value(max_val[0])
+        net.weight_observer.min_val[...] = Tensor(min_val[0])
+        net.weight_observer.max_val[...] = Tensor(max_val[0])
     if net.with_act:
-        net.act_observer.min_val.set_value(min_val[1])
-        net.act_observer.max_val.set_value(max_val[1])
+        net.act_observer.min_val[...] = Tensor(min_val[1])
+        net.act_observer.max_val[...] = Tensor(max_val[1])
 
 
 def test_quant_stub():
@@ -71,7 +82,7 @@ def test_quant_stub():
 
     normal = normal_net(x)
     qat_without_fakequant = qat_from_float(x)
-    fake_quant_normal = fake_quant(normal_net(x), act_scale)
+    fake_quant_normal = fake_quant_act(normal_net(x), act_scale)
     qat = qat_net(x)
     q = q_net(x).numpy() * act_scale
     np.testing.assert_allclose(qat_without_fakequant, normal)
@@ -99,7 +110,7 @@ def test_dequant_stub():
     q_net.eval()
 
     x = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x = fake_quant(x, inp_scale)
+    x = fake_quant_act(x, inp_scale)
     x.q_dict["scale"] = inp_scale
 
     normal = normal_net(x)
@@ -134,12 +145,12 @@ def test_elemwise(kind):
 
     x1_scale = np.float32(np.random.rand() + 1)
     x1 = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x1 = fake_quant(x1, x1_scale)
+    x1 = fake_quant_act(x1, x1_scale)
     x1.q_dict["scale"] = x1_scale
 
     x2_scale = np.float32(np.random.rand() + 1)
     x2 = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x2 = fake_quant(x2, x2_scale)
+    x2 = fake_quant_act(x2, x2_scale)
     x2.q_dict["scale"] = x2_scale
 
     x1_int8 = quant(x1, x1_scale)
@@ -149,13 +160,13 @@ def test_elemwise(kind):
     if kind in ("ADD", "MUL", "FUSE_ADD_RELU"):
         normal = normal_net(x1, x2)
         qat_without_fakequant = qat_from_float(x1, x2)
-        fake_quant_normal = fake_quant(normal_net(x1, x2), act_scale)
+        fake_quant_normal = fake_quant_act(normal_net(x1, x2), act_scale)
         qat = qat_net(x1, x2)
         q = q_net(x1_int8, x2_int8).numpy() * act_scale
     else:
         normal = normal_net(x1)
         qat_without_fakequant = qat_from_float(x1)
-        fake_quant_normal = fake_quant(normal_net(x1), act_scale)
+        fake_quant_normal = fake_quant_act(normal_net(x1), act_scale)
         qat = qat_net(x1)
         q = q_net(x1_int8).numpy() * act_scale
     np.testing.assert_allclose(qat_without_fakequant, normal)
@@ -175,17 +186,17 @@ def test_linear():
     init_qat_net(qat_net)
 
     x = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x = fake_quant(x, inp_scale)
+    x = fake_quant_act(x, inp_scale)
     x.q_dict["scale"] = inp_scale
 
     x_int8 = quant(x, inp_scale)
 
     weight = np.random.normal(size=(3, 3)).astype("float32")
     bias = np.random.normal(size=(3,)).astype("float32")
-    normal_net.weight.set_value(fake_quant(weight, weight_scale))
-    normal_net.bias.set_value(fake_quant(bias, inp_scale * weight_scale))
-    qat_net.weight.set_value(weight)
-    qat_net.bias.set_value(bias)
+    normal_net.weight[...] = fake_quant_weight(weight, weight_scale)
+    normal_net.bias[...] = fake_quant_bias(bias, inp_scale * weight_scale)
+    qat_net.weight[...] = Parameter(weight)
+    qat_net.bias[...] = Parameter(bias)
 
     qat_from_float = QAT.Linear.from_float_module(normal_net)
     qat_from_float.eval()
@@ -197,11 +208,11 @@ def test_linear():
 
     normal = normal_net(x)
     qat_without_fakequant = qat_from_float(x)
-    fake_quant_normal = fake_quant(normal_net(x), act_scale)
+    fake_quant_normal = fake_quant_act(normal_net(x), act_scale)
     qat = qat_net(x)
     q = q_net(x_int8).numpy() * act_scale
     np.testing.assert_allclose(qat_without_fakequant, normal)
-    np.testing.assert_allclose(qat, fake_quant_normal)
+    np.testing.assert_allclose(qat, fake_quant_normal.numpy())
     np.testing.assert_allclose(q, fake_quant_normal.numpy())
 
 
@@ -218,7 +229,7 @@ def test_conv(module):
     init_qat_net(qat_net)
 
     x = mge.tensor(np.random.normal(size=(1, 3, 3, 3)).astype("float32"))
-    x = fake_quant(x, inp_scale)
+    x = fake_quant_act(x, inp_scale)
     x.q_dict["scale"] = inp_scale
 
     x_int8 = quant(x, inp_scale)
@@ -226,15 +237,15 @@ def test_conv(module):
     weight = np.random.normal(size=(3, 3, 3, 3)).astype("float32")
     bias = np.random.normal(size=(1, 3, 1, 1)).astype("float32")
     if module in ("ConvBn2d", "ConvBnRelu2d"):
-        normal_net.conv.weight.set_value(fake_quant(weight, weight_scale))
-        normal_net.conv.bias.set_value(fake_quant(bias, inp_scale * weight_scale))
-        qat_net.conv.weight.set_value(weight)
-        qat_net.conv.bias.set_value(bias)
+        normal_net.conv.weight[...] = fake_quant_weight(weight, weight_scale)
+        normal_net.conv.bias[...] = fake_quant_bias(bias, inp_scale * weight_scale)
+        qat_net.conv.weight[...] = Parameter(weight)
+        qat_net.conv.bias[...] = Parameter(bias)
     else:
-        normal_net.weight.set_value(fake_quant(weight, weight_scale))
-        normal_net.bias.set_value(fake_quant(bias, inp_scale * weight_scale))
-        qat_net.weight.set_value(weight)
-        qat_net.bias.set_value(bias)
+        normal_net.weight[...] = fake_quant_weight(weight, weight_scale)
+        normal_net.bias[...] = fake_quant_bias(bias, inp_scale * weight_scale)
+        qat_net.weight[...] = Parameter(weight)
+        qat_net.bias[...] = Parameter(bias)
 
     qat_from_float = getattr(QAT, module).from_float_module(normal_net)
     qat_from_float.eval()
@@ -246,9 +257,9 @@ def test_conv(module):
 
     normal = normal_net(x)
     qat_without_fakequant = qat_from_float(x)
-    fake_quant_normal = fake_quant(normal_net(x), act_scale)
+    fake_quant_normal = fake_quant_act(normal_net(x), act_scale)
     qat = qat_net(x)
     q = q_net(x_int8).numpy() * act_scale
-    np.testing.assert_allclose(qat_without_fakequant, normal, atol=1e-6)
-    np.testing.assert_allclose(qat, fake_quant_normal)
-    np.testing.assert_allclose(q, fake_quant_normal.numpy())
+    np.testing.assert_allclose(qat_without_fakequant, normal, atol=1e-5)
+    np.testing.assert_allclose(qat, fake_quant_normal, atol=act_scale)
+    np.testing.assert_allclose(q, fake_quant_normal.numpy(), atol=act_scale)
diff --git a/imperative/python/test/unit/quantization/test_quantize.py b/imperative/python/test/unit/quantization/test_quantize.py
index 65953543..ed561bc1 100644
--- a/imperative/python/test/unit/quantization/test_quantize.py
+++ b/imperative/python/test/unit/quantization/test_quantize.py
@@ -8,9 +8,8 @@
 import numpy as np
 import pytest
 
-from megengine import functional
+from megengine import Parameter, Tensor
 from megengine import module as Float
-from megengine import tensor
 from megengine.module import qat as QAT
 from megengine.module import quantized as Q
 from megengine.quantization import (
@@ -40,7 +39,7 @@ class Net(Float.Module):
         self.quant = Float.QuantStub()
         self.linear = Float.Linear(3, 3)
         self.dequant = Float.DequantStub()
-        self.linear.bias.set_value(np.random.rand(3))
+        self.linear.bias[...] = Parameter(np.random.rand(3))
 
     def forward(self, x):
         x = self.quant(x)
@@ -55,7 +54,7 @@ class QATNet(Float.Module):
         self.quant = QAT.QuantStub()
         self.linear = QAT.Linear(3, 3)
         self.dequant = QAT.DequantStub()
-        self.linear.bias.set_value(np.random.rand(3))
+        self.linear.bias[...] = Parameter(np.random.rand(3))
 
     def forward(self, x):
         x = self.quant(x)
@@ -90,12 +89,12 @@ def init_qat_net():
     propagate_qconfig(net, min_max_fakequant_qconfig)
     min_val = np.random.randint(-127, 0, size=(3,))
     max_val = np.random.randint(1, 127, size=(3,))
-    net.quant.act_observer.min_val.set_value(min_val[0])
-    net.quant.act_observer.max_val.set_value(max_val[0])
-    net.linear.weight_observer.min_val.set_value(min_val[1])
-    net.linear.weight_observer.max_val.set_value(max_val[1])
-    net.linear.act_observer.min_val.set_value(min_val[2])
-    net.linear.act_observer.max_val.set_value(max_val[2])
+    net.quant.act_observer.min_val[...] = Parameter(min_val[0])
+    net.quant.act_observer.max_val[...] = Parameter(max_val[0])
+    net.linear.weight_observer.min_val[...] = Parameter(min_val[1])
+    net.linear.weight_observer.max_val[...] = Parameter(max_val[1])
+    net.linear.act_observer.min_val[...] = Parameter(min_val[2])
+    net.linear.act_observer.max_val[...] = Parameter(max_val[2])
     return net
 
 
@@ -144,7 +143,7 @@ def init_observer(module, data):
 
 
 def test_enable_and_disable_all():
-    x = tensor(np.random.randint(1, 10, size=(3, 3)).astype(np.float32))
+    x = Tensor(np.random.randint(1, 10, size=(3, 3)).astype(np.float32))
     net = Net()
     y1 = net(x).numpy()
     net = quantize_qat(net, min_max_fakequant_qconfig)
@@ -180,7 +179,7 @@ def test_quantize():
 
 def test_apply_easy_quant():
     qat_net = init_qat_net()
-    data = tensor(np.random.rand(2, 3, 3, 3), dtype=np.float32)
+    data = Tensor(np.random.rand(2, 3, 3, 3), dtype=np.float32)
     eq_net = reset_qconfig(qat_net, passive_qconfig, inplace=False)
     apply_easy_quant(eq_net, data, 0.9, 1.1, 10)
     assert isinstance(eq_net.quant.act_observer, PassiveObserver)
-- 
GitLab