fix(mge/quantization): set ``q_dict`` as an instance property

GitOrigin-RevId: 2f32008aadd9d0302285fda8667f71cbfb9552b4

fix(mge/quantization): set ``q_dict`` as an instance property
GitOrigin-RevId: 2f32008aadd9d0302285fda8667f71cbfb9552b4
02df634d · Megvii Engine Team · 193e77d4 · 02df634d · 02df634d · 02df634d
7 changed files
--- a/imperative/python/megengine/quantization/observer.py
+++ b/imperative/python/megengine/quantization/observer.py
@@ -467,7 +467,7 @@ class PassiveObserver(Observer):
    @scale.setter
    def scale(self, value):
        assert value > 0
-        self.q_dict["scale"].set_value(value)
+        self.q_dict["scale"][...] = Tensor(value)
    def get_qparams(self):
        return self.q_dict

--- a/imperative/python/megengine/tensor.py
+++ b/imperative/python/megengine/tensor.py
@@ -25,7 +25,7 @@ from .utils.deprecation import deprecated
 class Tensor(_Tensor, ArrayMethodMixin):
    grad = None
    dmap_callback = None
-    q_dict = {"mode": None, "scale": None, "zero_point": None}
+    _q_dict = None
    def __new__(cls, data, dtype=None, device=None, is_const=False, no_cache=False):
        if device is None:
@@ -70,6 +70,12 @@ class Tensor(_Tensor, ArrayMethodMixin):
    def dtype(self) -> np.dtype:
        return super().dtype
+    @property
+    def q_dict(self):
+        if self._q_dict is None:
+            self._q_dict = {"mode": None, "scale": None, "zero_point": None}
+        return self._q_dict
    def numpy(self) -> np.ndarray:
        return super().numpy()
@@ -135,7 +141,7 @@ class Tensor(_Tensor, ArrayMethodMixin):
        return state
    def __setstate__(self, state):
-        self.q_dict = state.pop("qdict")
+        self._q_dict = state.pop("qdict")
 tensor = Tensor

--- a/imperative/python/test/unit/core/test_serialization.py
+++ b/imperative/python/test/unit/core/test_serialization.py
@@ -16,11 +16,6 @@ from megengine import Parameter, Tensor
 def test_tensor_serialization():
-    def tensor_eq(a, b):
-        assert a.dtype == b.dtype
-        assert a.device == b.device
-        np.testing.assert_equal(a.numpy(), b.numpy())
    with TemporaryFile() as f:
        data = np.random.randint(low=0, high=7, size=[233])
        a = Tensor(data, device="xpux", dtype=np.int32)
@@ -67,3 +62,12 @@ def test_tensor_serialization():
            assert "cpu0" in str(b.device)
            np.testing.assert_equal(a.numpy(), b.numpy())
            mge.set_default_device(device_org)
+    with TemporaryFile() as f:
+        a = Tensor(0)
+        a.q_dict["scale"] = Tensor(1.0)
+        pickle.dump(a, f)
+        f.seek(0)
+        b = pickle.load(f)
+        assert isinstance(b.q_dict["scale"], Tensor)
+        np.testing.assert_equal(b.q_dict["scale"].numpy(), 1.0)
--- a/imperative/python/test/unit/functional/test_tensor.py
+++ b/imperative/python/test/unit/functional/test_tensor.py
@@ -379,3 +379,19 @@ def test_copy_d2h():
 def test_copy_d2d():
    copy_test("gpu0", "gpu1")
    copy_test("gpu0:0", "gpu0:1")
+def test_q_dict():
+    x = tensor(1)
+    assert x.q_dict["scale"] is None
+    x.q_dict["scale"] = tensor(1.0)
+    y = tensor(1)
+    assert y.q_dict["scale"] is None
+    y.q_dict["scale"] = tensor(2.0)
+    assert x.q_dict["scale"].numpy() == 1.0
+    assert y.q_dict["scale"].numpy() == 2.0
+    z = x + y
+    assert z.q_dict["scale"] is None
--- a/imperative/python/test/unit/module/test_module_tensor.py
+++ b/imperative/python/test/unit/module/test_module_tensor.py
@@ -17,6 +17,7 @@ from megengine import Parameter, Tensor
 from megengine.module import Conv2d
+# TODO: delete this test after deleting set_value
 def test_set_value():
    v0 = np.random.random((2, 3)).astype(np.float32)
    param = Parameter(v0)

--- a/imperative/python/test/unit/quantization/test_module.py
+++ b/imperative/python/test/unit/quantization/test_module.py
+from functools import partial
 import numpy as np
 import pytest
@@ -6,17 +8,21 @@ import megengine.functional as F
 import megengine.module as Float
 import megengine.module.qat as QAT
 import megengine.module.quantized as Q
+from megengine import Parameter, Tensor
 from megengine.core.tensor import dtype
-from megengine.quantization import min_max_fakequant_qconfig
+from megengine.quantization import FakeQuantize, MinMaxObserver, QConfig
 from megengine.quantization.quantize import (
    disable_fake_quant,
    disable_observer,
    propagate_qconfig,
 )
-"""
+min_max_fakequant_qconfig = QConfig(
-Calculate testing scales based on ``min_max_fakequant_qconfig``
+    weight_observer=partial(MinMaxObserver, dtype="qint8", narrow_range=True),
-"""
+    act_observer=partial(MinMaxObserver, dtype="qint8", narrow_range=False),
+    weight_fake_quant=partial(FakeQuantize, dtype="qint8", narrow_range=True),
+    act_fake_quant=partial(FakeQuantize, dtype="qint8", narrow_range=False),
+)
 inp_scale = np.float32(np.random.rand() + 1)
@@ -31,21 +37,26 @@ def quant(x, scale):
    return x.astype(inp_dtype)
-def fake_quant(x, scale):
+def fake_quant(x, scale, qmin, qmax):
    x = x / scale
    x = F.round(x)
-    x = F.clip(x, -128, 127)
+    x = F.clip(x, qmin, qmax)
    x = x * scale
    return x
+fake_quant_act = partial(fake_quant, qmin=-128, qmax=127)
+fake_quant_weight = partial(fake_quant, qmin=-127, qmax=127)
+fake_quant_bias = partial(fake_quant, qmin=-(2 ** 31), qmax=2 ** 31 - 1)
 def init_qat_net(net):
    if net.with_weight:
-        net.weight_observer.min_val.set_value(min_val[0])
+        net.weight_observer.min_val[...] = Tensor(min_val[0])
-        net.weight_observer.max_val.set_value(max_val[0])
+        net.weight_observer.max_val[...] = Tensor(max_val[0])
    if net.with_act:
-        net.act_observer.min_val.set_value(min_val[1])
+        net.act_observer.min_val[...] = Tensor(min_val[1])
-        net.act_observer.max_val.set_value(max_val[1])
+        net.act_observer.max_val[...] = Tensor(max_val[1])
 def test_quant_stub():
@@ -71,7 +82,7 @@ def test_quant_stub():
    normal = normal_net(x)
    qat_without_fakequant = qat_from_float(x)
-    fake_quant_normal = fake_quant(normal_net(x), act_scale)
+    fake_quant_normal = fake_quant_act(normal_net(x), act_scale)
    qat = qat_net(x)
    q = q_net(x).numpy() * act_scale
    np.testing.assert_allclose(qat_without_fakequant, normal)
@@ -99,7 +110,7 @@ def test_dequant_stub():
    q_net.eval()
    x = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x = fake_quant(x, inp_scale)
+    x = fake_quant_act(x, inp_scale)
    x.q_dict["scale"] = inp_scale
    normal = normal_net(x)
@@ -134,12 +145,12 @@ def test_elemwise(kind):
    x1_scale = np.float32(np.random.rand() + 1)
    x1 = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x1 = fake_quant(x1, x1_scale)
+    x1 = fake_quant_act(x1, x1_scale)
    x1.q_dict["scale"] = x1_scale
    x2_scale = np.float32(np.random.rand() + 1)
    x2 = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x2 = fake_quant(x2, x2_scale)
+    x2 = fake_quant_act(x2, x2_scale)
    x2.q_dict["scale"] = x2_scale
    x1_int8 = quant(x1, x1_scale)
@@ -149,13 +160,13 @@ def test_elemwise(kind):
    if kind in ("ADD", "MUL", "FUSE_ADD_RELU"):
        normal = normal_net(x1, x2)
        qat_without_fakequant = qat_from_float(x1, x2)
-        fake_quant_normal = fake_quant(normal_net(x1, x2), act_scale)
+        fake_quant_normal = fake_quant_act(normal_net(x1, x2), act_scale)
        qat = qat_net(x1, x2)
        q = q_net(x1_int8, x2_int8).numpy() * act_scale
    else:
        normal = normal_net(x1)
        qat_without_fakequant = qat_from_float(x1)
-        fake_quant_normal = fake_quant(normal_net(x1), act_scale)
+        fake_quant_normal = fake_quant_act(normal_net(x1), act_scale)
        qat = qat_net(x1)
        q = q_net(x1_int8).numpy() * act_scale
    np.testing.assert_allclose(qat_without_fakequant, normal)
@@ -175,17 +186,17 @@ def test_linear():
    init_qat_net(qat_net)
    x = mge.tensor(np.random.normal(size=(3, 3)).astype("float32"))
-    x = fake_quant(x, inp_scale)
+    x = fake_quant_act(x, inp_scale)
    x.q_dict["scale"] = inp_scale
    x_int8 = quant(x, inp_scale)
    weight = np.random.normal(size=(3, 3)).astype("float32")
    bias = np.random.normal(size=(3,)).astype("float32")
-    normal_net.weight.set_value(fake_quant(weight, weight_scale))
+    normal_net.weight[...] = fake_quant_weight(weight, weight_scale)
-    normal_net.bias.set_value(fake_quant(bias, inp_scale * weight_scale))
+    normal_net.bias[...] = fake_quant_bias(bias, inp_scale * weight_scale)
-    qat_net.weight.set_value(weight)
+    qat_net.weight[...] = Parameter(weight)
-    qat_net.bias.set_value(bias)
+    qat_net.bias[...] = Parameter(bias)
    qat_from_float = QAT.Linear.from_float_module(normal_net)
    qat_from_float.eval()
@@ -197,11 +208,11 @@ def test_linear():
    normal = normal_net(x)
    qat_without_fakequant = qat_from_float(x)
-    fake_quant_normal = fake_quant(normal_net(x), act_scale)
+    fake_quant_normal = fake_quant_act(normal_net(x), act_scale)
    qat = qat_net(x)
    q = q_net(x_int8).numpy() * act_scale
    np.testing.assert_allclose(qat_without_fakequant, normal)
-    np.testing.assert_allclose(qat, fake_quant_normal)
+    np.testing.assert_allclose(qat, fake_quant_normal.numpy())
    np.testing.assert_allclose(q, fake_quant_normal.numpy())
@@ -218,7 +229,7 @@ def test_conv(module):
    init_qat_net(qat_net)
    x = mge.tensor(np.random.normal(size=(1, 3, 3, 3)).astype("float32"))
-    x = fake_quant(x, inp_scale)
+    x = fake_quant_act(x, inp_scale)
    x.q_dict["scale"] = inp_scale
    x_int8 = quant(x, inp_scale)
@@ -226,15 +237,15 @@ def test_conv(module):
    weight = np.random.normal(size=(3, 3, 3, 3)).astype("float32")
    bias = np.random.normal(size=(1, 3, 1, 1)).astype("float32")
    if module in ("ConvBn2d", "ConvBnRelu2d"):
-        normal_net.conv.weight.set_value(fake_quant(weight, weight_scale))
+        normal_net.conv.weight[...] = fake_quant_weight(weight, weight_scale)
-        normal_net.conv.bias.set_value(fake_quant(bias, inp_scale * weight_scale))
+        normal_net.conv.bias[...] = fake_quant_bias(bias, inp_scale * weight_scale)
-        qat_net.conv.weight.set_value(weight)
+        qat_net.conv.weight[...] = Parameter(weight)
-        qat_net.conv.bias.set_value(bias)
+        qat_net.conv.bias[...] = Parameter(bias)
    else:
-        normal_net.weight.set_value(fake_quant(weight, weight_scale))
+        normal_net.weight[...] = fake_quant_weight(weight, weight_scale)
-        normal_net.bias.set_value(fake_quant(bias, inp_scale * weight_scale))
+        normal_net.bias[...] = fake_quant_bias(bias, inp_scale * weight_scale)
-        qat_net.weight.set_value(weight)
+        qat_net.weight[...] = Parameter(weight)
-        qat_net.bias.set_value(bias)
+        qat_net.bias[...] = Parameter(bias)
    qat_from_float = getattr(QAT, module).from_float_module(normal_net)
    qat_from_float.eval()
@@ -246,9 +257,9 @@ def test_conv(module):
    normal = normal_net(x)
    qat_without_fakequant = qat_from_float(x)
-    fake_quant_normal = fake_quant(normal_net(x), act_scale)
+    fake_quant_normal = fake_quant_act(normal_net(x), act_scale)
    qat = qat_net(x)
    q = q_net(x_int8).numpy() * act_scale
-    np.testing.assert_allclose(qat_without_fakequant, normal, atol=1e-6)
+    np.testing.assert_allclose(qat_without_fakequant, normal, atol=1e-5)
-    np.testing.assert_allclose(qat, fake_quant_normal)
+    np.testing.assert_allclose(qat, fake_quant_normal, atol=act_scale)
-    np.testing.assert_allclose(q, fake_quant_normal.numpy())
+    np.testing.assert_allclose(q, fake_quant_normal.numpy(), atol=act_scale)
--- a/imperative/python/test/unit/quantization/test_quantize.py
+++ b/imperative/python/test/unit/quantization/test_quantize.py
@@ -8,9 +8,8 @@
 import numpy as np
 import pytest
-from megengine import functional
+from megengine import Parameter, Tensor
 from megengine import module as Float
-from megengine import tensor
 from megengine.module import qat as QAT
 from megengine.module import quantized as Q
 from megengine.quantization import (
@@ -40,7 +39,7 @@ class Net(Float.Module):
        self.quant = Float.QuantStub()
        self.linear = Float.Linear(3, 3)
        self.dequant = Float.DequantStub()
-        self.linear.bias.set_value(np.random.rand(3))
+        self.linear.bias[...] = Parameter(np.random.rand(3))
    def forward(self, x):
        x = self.quant(x)
@@ -55,7 +54,7 @@ class QATNet(Float.Module):
        self.quant = QAT.QuantStub()
        self.linear = QAT.Linear(3, 3)
        self.dequant = QAT.DequantStub()
-        self.linear.bias.set_value(np.random.rand(3))
+        self.linear.bias[...] = Parameter(np.random.rand(3))
    def forward(self, x):
        x = self.quant(x)
@@ -90,12 +89,12 @@ def init_qat_net():
    propagate_qconfig(net, min_max_fakequant_qconfig)
    min_val = np.random.randint(-127, 0, size=(3,))
    max_val = np.random.randint(1, 127, size=(3,))
-    net.quant.act_observer.min_val.set_value(min_val[0])
+    net.quant.act_observer.min_val[...] = Parameter(min_val[0])
-    net.quant.act_observer.max_val.set_value(max_val[0])
+    net.quant.act_observer.max_val[...] = Parameter(max_val[0])
-    net.linear.weight_observer.min_val.set_value(min_val[1])
+    net.linear.weight_observer.min_val[...] = Parameter(min_val[1])
-    net.linear.weight_observer.max_val.set_value(max_val[1])
+    net.linear.weight_observer.max_val[...] = Parameter(max_val[1])
-    net.linear.act_observer.min_val.set_value(min_val[2])
+    net.linear.act_observer.min_val[...] = Parameter(min_val[2])
-    net.linear.act_observer.max_val.set_value(max_val[2])
+    net.linear.act_observer.max_val[...] = Parameter(max_val[2])
    return net
@@ -144,7 +143,7 @@ def init_observer(module, data):
 def test_enable_and_disable_all():
-    x = tensor(np.random.randint(1, 10, size=(3, 3)).astype(np.float32))
+    x = Tensor(np.random.randint(1, 10, size=(3, 3)).astype(np.float32))
    net = Net()
    y1 = net(x).numpy()
    net = quantize_qat(net, min_max_fakequant_qconfig)
@@ -180,7 +179,7 @@ def test_quantize():
 def test_apply_easy_quant():
    qat_net = init_qat_net()
-    data = tensor(np.random.rand(2, 3, 3, 3), dtype=np.float32)
+    data = Tensor(np.random.rand(2, 3, 3, 3), dtype=np.float32)
    eq_net = reset_qconfig(qat_net, passive_qconfig, inplace=False)
    apply_easy_quant(eq_net, data, 0.9, 1.1, 10)
    assert isinstance(eq_net.quant.act_observer, PassiveObserver)