Unverified commit bb02b103 authored by Chang Xu, committed by GitHub

Fix Bugs (#1792)

Parent 73e15291
...
@@ -54,6 +54,7 @@ class LayerWiseQuantError(nn.Layer):
         if type(cur_layer) == LayerWiseQuantError:
             print(cur_name, cur_layer.losses.mean())
         '''
+        super(LayerWiseQuantError, self).__init__()
         self.layer = layer
         self.weight = layer.weight
         self.weight_bits = weight_bits
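Note on this hunk: `LayerWiseQuantError` subclasses `paddle.nn.Layer`, and skipping the parent constructor leaves the layer's internal sub-layer/parameter registries uninitialized, so the very first attribute assignment in `__init__` fails. A minimal sketch of the failure mode (class names here are illustrative, not from the patch):

```python
import paddle.nn as nn

class Broken(nn.Layer):
    def __init__(self, layer):
        # Missing super().__init__(): nn.Layer's internal dicts that
        # track sub-layers and parameters are never created, so the
        # assignment below raises at construction time.
        self.layer = layer

class Fixed(nn.Layer):
    def __init__(self, layer):
        super(Fixed, self).__init__()
        self.layer = layer  # now registered as a sub-layer
```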
...
@@ -62,14 +63,13 @@ class LayerWiseQuantError(nn.Layer):
         self.act_method = act_quant_method
         self.loss_function = loss_function
         self.losses = []
+        self.loss = None

     def forward(self, input):
         act = input[0] if type(input) == tuple else input
         origin_out = paddle.matmul(act, self.weight)
         bnt = (1 << (self.weight_bits - 1)) - 1
-        quant_scale = compute_scales(
-            self.weight.cast('float32'),
-            method=self.weight_method).cast(self.weight.dtype)
+        quant_scale = compute_scales(self.weight, method=self.weight_method)
         quant_weight = paddle.clip(
             paddle.round(self.weight / quant_scale * bnt), -bnt - 1, bnt)
         quant_dequant_weight = quant_weight / bnt * quant_scale
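The `cast('float32')` round trip is dropped here because `compute_scales` becomes dtype-aware in a later hunk of this commit: the weight is passed in its native dtype and the returned scale matches it. For orientation, a hedged sketch of the symmetric fake-quant round trip this `forward` performs, with illustrative values and a stand-in for `compute_scales`:

```python
import paddle

weight_bits = 8
bnt = (1 << (weight_bits - 1)) - 1            # 127: max signed 8-bit value
weight = paddle.to_tensor([[0.5, -1.0], [0.25, 0.75]])
quant_scale = paddle.max(paddle.abs(weight))  # stand-in for compute_scales
# Quantize: map onto the integer grid, round, clip to [-128, 127].
quant_weight = paddle.clip(
    paddle.round(weight / quant_scale * bnt), -bnt - 1, bnt)
# Dequantize back to floats; the gap to `weight` is the quantization error.
quant_dequant_weight = quant_weight / bnt * quant_scale
```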
...
@@ -80,6 +80,7 @@ class LayerWiseQuantError(nn.Layer):
             paddle.round(act / quant_scale * bnt), -bnt - 1, bnt)
         quant_dequant_act = quant_act / bnt * quant_scale
         quant_out = paddle.matmul(quant_dequant_act, quant_dequant_weight)
-        loss = self.loss_function(origin_out, quant_out)
+        loss = self.loss_function(origin_out, quant_out).cast('float32')
         self.losses.append(loss)
+        self.loss = paddle.to_tensor(self.losses, dtype='float32').mean()
         return self.layer(input)
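With these additions, each calibration batch appends a float32 per-batch loss and `self.loss` always holds the running mean, so callers can read one scalar per layer instead of reducing `losses` themselves. A hedged usage sketch; `model` and the step that wraps target layers with `LayerWiseQuantError` are assumptions, not part of the patch:

```python
# After wrapping target layers and running calibration batches through
# `model`, read the averaged quantization error per wrapped layer:
for name, sublayer in model.named_sublayers():
    if type(sublayer) == LayerWiseQuantError:
        print(name, sublayer.loss)  # mean quant error across all batches
```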
...
@@ -48,8 +48,10 @@ def compute_scales(x, method='abs_max'):
     elif method == 'abs_max_channel_wise':
         reduce_axis = tuple([i for i in range(len(x.shape)) if i != 1])
         quant_scale = paddle.max(paddle.abs(x), axis=reduce_axis)
-        quant_scale = paddle.where(quant_scale == np.float32(0.0),
-                                   np.float32(1e-8), quant_scale)
+        quant_scale = paddle.where(quant_scale == paddle.to_tensor(
+            0, dtype=x.dtype),
+                                   paddle.to_tensor(1e-8, dtype=x.dtype),
+                                   quant_scale)
     return quant_scale
...
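The old guard compared against NumPy float32 scalars, which implicitly pinned `compute_scales` to float32 inputs; building both comparands with `paddle.to_tensor(..., dtype=x.dtype)` makes the zero-scale guard follow the input's dtype, which is what lets the caller in `LayerWiseQuantError.forward` drop its casts. A hedged sketch of what the guard prevents, with illustrative values:

```python
import paddle

# One channel is all zeros, so its max-abs scale would be 0 and a later
# division like `weight / quant_scale` would blow up.
x = paddle.to_tensor([[0.0, 2.0], [0.0, -4.0]])
reduce_axis = tuple(i for i in range(len(x.shape)) if i != 1)
quant_scale = paddle.max(paddle.abs(x), axis=reduce_axis)   # [0., 4.]
quant_scale = paddle.where(
    quant_scale == paddle.to_tensor(0, dtype=x.dtype),
    paddle.to_tensor(1e-8, dtype=x.dtype), quant_scale)     # [1e-8, 4.]
```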
...
@@ -26,7 +26,7 @@ class ShiftSmoothHelpLayer(nn.Layer):
         super(ShiftSmoothHelpLayer, self).__init__()
         self.weight = layer.weight
         shift_shape = self.weight.shape[0]
-        if hasattr(layer, "bias") or layer.bias is None:
+        if not hasattr(layer, "bias") or layer.bias is None:
             self.bias = paddle.create_parameter(
                 shape=[self.weight.shape[1]],
                 dtype=self.weight.dtype,
...
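The original condition was inverted: `hasattr(layer, "bias")` is true exactly when the layer does have a bias attribute, so the stand-in zero bias was created in the wrong case, and when the attribute was genuinely missing the second operand raised `AttributeError`. The fix also relies on short-circuit evaluation: `not hasattr(...)` is checked first, so `layer.bias` is only read when it exists. A hedged truth-table sketch (`needs_stub_bias` is a hypothetical helper, not in the patch):

```python
# Condition                 | attr set to param | attr set to None | no attr
# hasattr(...) or ...       | True (wrong)      | True             | raises
# not hasattr(...) or ...   | False             | True             | True
def needs_stub_bias(layer):
    return not hasattr(layer, "bias") or layer.bias is None
```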