Commit 3021f600 authored by SunAhong1993

add caffe op part1

Parent 7cab088d
@@ -60,11 +60,14 @@ class CaffeResolver(object):
class CaffeGraphNode(GraphNode):
def __init__(self, layer, layer_name=None):
if layer_name is None:
super(CaffeGraphNode, self).__init__(layer,
layer.name.replace('/', '_'))
else:
super(CaffeGraphNode, self).__init__(layer,
layer_name.replace('/', '_'))
self.layer_type = layer.type
self.fluid_code = FluidCode()
self.data = None
def set_params(self, params):
self.data = params
@@ -110,7 +110,7 @@ def get_strided_kernel_output_shape(params, input_shape, round_func):
round_func)
has_c_o = hasattr(params, 'num_output')
c = params.num_output if has_c_o else input_shape[1]
return [[input_shape[0], c, o_h, o_w]]
@@ -169,6 +169,7 @@ def shape_softmax(layer, input_shape):
def shape_input(layer, input_shape):
return [list(layer.input_param.shape[0].dim)]
def shape_concat(layer, input_shape):
params = layer.concat_param
axis = params.axis
@@ -178,4 +179,54 @@ def shape_concat(layer, input_shape):
output_shape = shape
else:
output_shape[axis] += shape[axis]
return [output_shape]
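# Example: concatenating blobs of shape [1, 2, 16, 16] and [1, 3, 16, 16]
# on axis=1 yields [[1, 5, 16, 16]].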
def shape_slice(layer, input_shape):
inshape = input_shape[0]
params = layer.slice_param
axis = params.axis
count = inshape[axis]
points = list(params.slice_point)
points = [0] + points + [count]
output_shape = []
for i in range(len(points) - 1):
# Copy the shape so each output gets its own list (aliasing inshape
# would make every appended shape share the last computed size).
shape = list(inshape)
shape[axis] = points[i + 1] - points[i]
output_shape.append(shape)
return output_shape
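# A minimal sanity check with hypothetical values; SimpleNamespace stands in
# for the only fields of Caffe's LayerParameter that shape_slice reads:
# from types import SimpleNamespace
# fake_layer = SimpleNamespace(slice_param=SimpleNamespace(axis=1, slice_point=[2, 5]))
# shape_slice(fake_layer, [[1, 8, 32, 32]])
# -> [[1, 2, 32, 32], [1, 3, 32, 32], [1, 3, 32, 32]]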
def shape_prelu(layer, input_shape):
return input_shape
def shape_sigmoid(layer, input_shape):
return input_shape
def shape_absval(layer, input_shape):
return input_shape
def shape_accuracy(layer, input_shape):
return [[1]]
def shape_tanh(layer, input_shape):
return input_shape
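# Eltwise requires all inputs to share a shape, so the first input's shape is returned.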
def shape_eltwise(layer, input_shape):
return [input_shape[0]]
def shape_batchnorm(layer, input_shape):
return input_shape
def shape_scale(layer, input_shape):
return input_shape
@@ -106,11 +106,17 @@ class CaffeOpMapper(OpMapper):
raise ValueError('Unable to determine kernel parameter!')
return default
def get_kernel_parameters(self, kind, params):
assert kind in ['Convolution', 'Pooling', 'Deconvolution']
k_h = self.get_kernel_value(params.kernel_h,
params.kernel_size,
0,
default=1)
k_w = self.get_kernel_value(params.kernel_w,
params.kernel_size,
1,
default=1)
s_h = self.get_kernel_value(params.stride_h,
params.stride,
0,
@@ -144,6 +150,12 @@ class CaffeOpMapper(OpMapper):
return c_o, kernel, stride, pad, dilation, group
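# Nodes with an `index` attribute expose one output of a multi-output layer;
# the generated code references them as "<layer_name>[<index>]".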
def get_input_name(self, node):
if hasattr(node, "index"):
return node.layer_name + "[{}]".format(node.index)
else:
return node.layer_name
def Input(self, node):
shape = list(node.layer.input_param.shape[0].dim)[1:]
dtype = 'float32'
@@ -159,6 +171,8 @@ class CaffeOpMapper(OpMapper):
def Convolution(self, node):
data = node.data
assert data is not None, 'The parameters of {} (type: {}) are not set. Load the model with the Caffe Python package so the default values are filled in.'.format(
node.layer_name, node.layer_type)
data = self.adjust_parameters(node, data)
self.weights[node.layer_name + '_weights'] = data[0]
if len(data) == 2:
@@ -187,6 +201,8 @@ class CaffeOpMapper(OpMapper):
def Deconvolution(self, node):
data = node.data
assert data is not None, 'The parameters of {} (type: {}) are not set. Load the model with the Caffe Python package so the default values are filled in.'.format(
node.layer_name, node.layer_type)
data = self.adjust_parameters(node, data)
self.weights[node.layer_name + '_weights'] = data[0]
if len(data) == 2:
@@ -216,13 +232,10 @@ class CaffeOpMapper(OpMapper):
def Pooling(self, node):
params = node.layer.pooling_param
shape = node.input_shape[0]
global_pool = getattr(params, 'global_pooling', False)
channel, kernel, stride, pad, dilation, group = self.get_kernel_parameters(
node.layer_type, params)
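# Caffe PoolingParameter.PoolMethod: MAX = 0, AVE = 1 (STOCHASTIC = 2 is not handled).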
if params.pool == 0:
pool_type = 'max'
else:
@@ -237,6 +250,7 @@ class CaffeOpMapper(OpMapper):
'ceil_mode': True,
'pool_type': string(pool_type),
'exclusive': True,
'global_pooling': global_pool,
'name': string(node.layer_name)
}
node.fluid_code.add_layer("pool2d",
@@ -279,6 +293,8 @@ class CaffeOpMapper(OpMapper):
def InnerProduct(self, node):
data = node.data
assert data is not None, 'The parameters of {} (type: {}) are not set. Load the model with the Caffe Python package so the default values are filled in.'.format(
node.layer_name, node.layer_type)
data = self.adjust_parameters(node, data)
# Reshape the parameters to Paddle's ordering
transpose_order = (1, 0)
@@ -361,47 +377,308 @@ class CaffeOpMapper(OpMapper):
params = node.layer.slice_param
axis = params.axis
points = list(params.slice_point)
maxint32 = 2147483647
points = [0] + points
points.append(maxint32)
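# INT32_MAX as the final end index makes the last slice run to the end of
# the axis, so the tensor's actual extent along `axis` is not needed here.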
node.fluid_code.add_note('{} = []'.format(node.layer_name))
for i in range(len(points) - 1):
attr = {
'axes': [axis],
'starts': [points[i]],
'ends': [points[i + 1]],
'name': string(node.layer_name + '_' + str(i))
}
node.fluid_code.add_layer("slice",
inputs=input,
output=string(node.layer_name + '_' + str(i)),
param_attr=attr)
node.fluid_code.add_note('{}.append({})'.format(
node.layer_name, node.layer_name + '_' + str(i)))
def Concat(self, node):
assert len(
node.inputs) > 1, 'A Concat node must have more than one input.'
inputs = []
for i in range(len(node.inputs)):
input = self.graph.get_bottom_node(node, idx=i, copy=True)
inputs.append(input)
params = node.layer.concat_param
axis = params.axis
attr = {'axis': axis, 'name': string(node.layer_name)}
node.fluid_code.add_layer("concat",
inputs=inputs,
output=node,
param_attr=attr)
def PReLU(self, node):
assert len(
node.inputs) == 1, 'The count of PReLU node\'s input is not 1.'
input = self.graph.get_bottom_node(node, idx=0, copy=True)
params = node.layer.prelu_param
mode_bool = params.channel_shared
if mode_bool:
mode = 'all'
else:
mode = 'channel'
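# channel_shared means one alpha for the whole blob ('all' in Paddle);
# otherwise there is one alpha per channel ('channel').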
data = node.data
assert data is not None, 'The parameters of {} (type: {}) are not set. Load the model with the Caffe Python package so the default values are filled in.'.format(
node.layer_name, node.layer_type)
self.weights[node.layer_name + '_weights'] = data[0]
attr = {
'mode': mode,
'param_attr': string(node.layer_name + '_weights'),
'name': string(node.layer_name)
}
node.fluid_code.add_layer("prelu",
inputs=input,
output=node,
param_attr=attr)
def Sigmoid(self, node):
assert len(
node.inputs) == 1, 'The count of Sigmoid node\'s input is not 1.'
input = self.graph.get_bottom_node(node, idx=0, copy=True)
attr = {'name': string(node.layer_name)}
node.fluid_code.add_layer("sigmoid",
inputs=input,
output=node,
param_attr=attr)
def AbsVal(self, node):
assert len(
node.inputs) == 1, 'The count of AbsVal node\'s input is not 1.'
input = self.graph.get_bottom_node(node, idx=0, copy=True)
attr = {'name': string(node.layer_name)}
# fluid has no `absval` op; `abs` is the matching elementwise op.
node.fluid_code.add_layer("abs",
inputs=input,
output=node,
param_attr=attr)
def Accuracy(self, node):
assert len(
node.inputs) == 2, 'The count of Accuracy node\'s input is not 2.'
inputs = [None, None]
i = 0
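# The input whose second dimension is 1 is the label; the other is the prediction.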
for shape in node.input_shape:
if shape[1] == 1:
inputs[1] = self.graph.get_bottom_node(node, idx=i, copy=True)
else:
inputs[0] = self.graph.get_bottom_node(node, idx=i, copy=True)
i += 1
params = node.layer.accuracy_param
top_k = params.top_k
axis = params.axis
ignore_label = params.ignore_label
# TODO(syf)
assert axis == 1, 'PaddlePaddle does not support Accuracy with axis != 1.'
assert not ignore_label >= 0, 'PaddlePaddle does not support Accuracy with an ignore label.'
attr = {'k': top_k}
node.fluid_code.add_layer("accuracy",
inputs=inputs,
output=node,
param_attr=attr)
def TanH(self, node):
assert len(
node.inputs) == 1, 'The count of TanH node\'s input is not 1.'
input = self.graph.get_bottom_node(node, idx=0, copy=True)
attr = {'name': string(node.layer_name)}
node.fluid_code.add_layer("tanh",
inputs=input,
output=node,
param_attr=attr)
def Eltwise(self, node):
assert len(
node.inputs) == 2, 'The count of Eltwise node\'s input is not 2.'
params = node.layer.eltwise_param
mode = params.operation
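# Caffe EltwiseParameter.EltwiseOp: PROD = 0, SUM = 1 (optionally weighted by coeff), MAX = 2.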
inputs = []
inputs.append(self.graph.get_bottom_node(node, idx=0, copy=True))
inputs.append(self.graph.get_bottom_node(node, idx=1, copy=True))
if mode == 0:
attr = {'act': None, 'name': string(node.layer_name)}
node.fluid_code.add_layer("elementwise_mul",
inputs=inputs,
output=node,
param_attr=attr)
elif mode == 1:
if hasattr(params, 'coeff') and len(params.coeff) == 2:
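# Weighted SUM: materialize each coefficient as a 1-element constant tensor,
# multiply it into the corresponding input, then add the two products.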
coeff = params.coeff
input1_name = self.get_input_name(inputs[0])
attr = {
'shape': [1],
'value': coeff[0],
'dtype': '{}.dtype'.format(input1_name)
}
node.fluid_code.add_layer("fill_constant",
inputs=None,
output=node.layer_name + '_const1',
param_attr=attr)
attr = {'act': None, 'name': string(node.layer_name + '_mul1')}
node.fluid_code.add_layer("elementwise_mul",
inputs=input1_name + ', ' +
node.layer_name + '_const1',
output=node.layer_name + '_mul1',
param_attr=attr)
input2_name = self.get_input_name(inputs[1])
attr = {
'shape': [1],
'value': coeff[1],
'dtype': '{}.dtype'.format(input2_name)
}
node.fluid_code.add_layer("fill_constant",
inputs=None,
output=node.layer_name + '_const2',
param_attr=attr)
attr = {'act': None, 'name': string(node.layer_name + '_mul2')}
node.fluid_code.add_layer("elementwise_mul",
inputs=input2_name + ', ' +
node.layer_name + '_const2',
output=node.layer_name + '_mul2',
param_attr=attr)
attr = {'act': None, 'name': string(node.layer_name)}
node.fluid_code.add_layer("elementwise_add",
inputs='{}_mul1, {}_mul2'.format(
node.layer_name, node.layer_name),
output=node,
param_attr=attr)
else:
attr = {'act': None, 'name': string(node.layer_name)}
node.fluid_code.add_layer("elementwise_add",
inputs=inputs,
output=node,
param_attr=attr)
else:
attr = {'act': None, 'name': string(node.layer_name)}
node.fluid_code.add_layer("elementwise_max",
inputs=inputs,
output=node,
param_attr=attr)
def BatchNorm(self, node):
assert len(node.inputs) == 1 and len(
node.outputs
) == 1, 'The count of BatchNorm node\'s input and output is not 1.'
input = self.graph.get_bottom_node(node, idx=0, copy=True)
params = node.layer.batch_norm_param
if hasattr(params, 'eps'):
eps = params.eps
else:
eps = 1e-5
assert len(node.data) == 3
node.data = [np.squeeze(i) for i in node.data]
mean, variance, scale = node.data
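# Caffe's BatchNorm stores a moving-average factor as its third blob; the
# saved mean/variance must be divided by it (zero means the stats are unscaled).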
# Prescale the stats
scaling_factor = 1.0 / scale if scale != 0 else 0
mean *= scaling_factor
variance *= scaling_factor
self.weights[node.layer_name + '_mean'] = mean
self.weights[node.layer_name + '_variance'] = variance
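# If the next layer is a Scale, fold its learned scale/offset into this
# batch_norm as param_attr/bias_attr instead of emitting a separate op.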
if self.graph.get_node(node.outputs[0]).layer_type == 'Scale':
data = self.graph.get_node(node.outputs[0]).data
self.weights[node.layer_name + '_scale'] = np.squeeze(data[0])
self.weights[node.layer_name + '_offset'] = np.squeeze(data[1])
attr = {
'is_test': True,
'param_attr': string(node.layer_name + '_scale'),
'bias_attr': string(node.layer_name + '_offset'),
'moving_mean_name': string(node.layer_name + '_mean'),
'moving_variance_name': string(node.layer_name + '_variance'),
'epsilon': eps,
'name': string(node.layer_name)
}
else:
attr = {
'is_test': True,
'param_attr': None,
'bias_attr': None,
'moving_mean_name': string(node.layer_name + '_mean'),
'moving_variance_name': string(node.layer_name + '_variance'),
'epsilon': eps,
'name': string(node.layer_name)
}
node.fluid_code.add_layer("batch_norm",
inputs=input,
output=node,
param_attr=attr)
def Scale(self, node):
assert len(
node.outputs) == 1, 'The count of Scale node\'s output is not 1.'
if len(node.inputs) == 1 and self.graph.get_node(
node.inputs[0]).layer_type == 'BatchNorm':
return
else:
self.weights[node.layer_name + '_scale'] = np.squeeze(node.data[0])
self.weights[node.layer_name + '_offset'] = np.squeeze(node.data[1])
params = node.layer.scale_param
axis = params.axis
num_axes = params.num_axes
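# In Caffe's ScaleParameter, axis is the first axis the scale applies to and
# num_axes is how many axes it spans; only the single-axis case is handled.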
assert num_axes == 1, "The Scale layer does not support num_axes == %d yet." % (
num_axes)
inputs = []
if len(node.inputs) == 2:
# For two-tensor input, reset axis to 1; this may be wrong for some unknown cases.
axis = 1
bias_shape = node.input_shape[0][axis:axis + num_axes]
input0 = self.graph.get_bottom_node(node, idx=0, copy=True)
input1 = self.graph.get_bottom_node(node, idx=1, copy=True)
inputs.append(input0)
inputs.append(input1)
attr = {'axis': axis, 'name': string(node.layer_name + '_mul')}
node.fluid_code.add_layer("elementwise_mul",
inputs=inputs,
output=node.layer_name + '_mul',
param_attr=attr)
else:
bias_shape = node.input_shape[0][axis:axis + num_axes]
input0 = self.graph.get_bottom_node(node, idx=0, copy=True)
input0_name = self.get_input_name(input0)
attr = {
'dtype': '{}.dtype'.format(input0_name),
'shape': bias_shape,
'name': string(node.layer_name + '_cparam1'),
'attr': string(node.layer_name + '_scale'),
'is_bias': True,
'default_initializer': 'Constant(value=1.0)'
}
node.fluid_code.add_layer("create_parameter",
inputs=None,
output=node,
param_attr=attr)
inputs.append(input0)
inputs.append(node)
attr = {'axis': axis, 'name': string(node.layer_name + '_mul')}
node.fluid_code.add_layer("elementwise_mul",
inputs=inputs,
output=node.layer_name + '_mul',
param_attr=attr)
scale_shape = bias_shape
input0_name = self.get_input_name(input0)
attr = {
'dtype': '{}.dtype'.format(input0_name),
'shape': scale_shape,
'name': string(node.layer_name + '_cparam2'),
'attr': string(node.layer_name + '_offset'),
'is_bias': True,
'default_initializer': 'Constant(value=1.0)'
}
node.fluid_code.add_layer("create_parameter",
inputs=None,
output=node.layer_name + '_offset_param',
param_attr=attr)
attr = {'axis': axis, 'name': string(node.layer_name + '_add')}
node.fluid_code.add_layer("elementwise_add",
inputs='{}_mul, {}_offset_param'.format(
node.layer_name, node.layer_name),
output=node,
param_attr=attr)