Commit 6cf56035 authored by dangqingqing

resolve conflicts

...@@ -308,6 +308,12 @@ repeat_layer
     :members: repeat_layer
     :noindex:
 
+seq_reshape_layer
+-----------------
+.. automodule:: paddle.trainer_config_helpers.layers
+    :members: seq_reshape_layer
+    :noindex:
+
 Math Layers
 ===========
......
...@@ -20,9 +20,12 @@ limitations under the License. */
 namespace paddle {
 
 /**
- * A layer for reshaping the sequence
- * Input: a sequence
- * Output: a sequence
+ * A layer for reshaping the sequence. Assume the input sequence has
+ * T instances and the dimension of each instance is M; if the layer's
+ * reshape_dim is N, then the output sequence has T*M/N instances,
+ * each of dimension N.
+ *
+ * Note that T*M/N must be an integer.
  */
 class SequenceReshapeLayer : public Layer {
......
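For intuition, here is a minimal NumPy sketch of the shape arithmetic described in the comment above. It is illustrative only and not part of this commit; the layer itself operates on PaddlePaddle sequence arguments rather than NumPy arrays, and the variable names are made up for the example.

```python
import numpy as np

# One input sequence: T instances, each of dimension M.
T, M, N = 4, 6, 8                      # T*M = 24 is divisible by N = 8
seq = np.random.rand(T, M)

# The reshape is only defined when T*M/N is an integer.
assert (T * M) % N == 0, "T*M/N must be an integer"

# Reinterpret the same T*M values as T*M/N instances of dimension N.
reshaped = seq.reshape(T * M // N, N)
print(reshaped.shape)                  # (3, 8)
```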
...@@ -37,6 +37,7 @@ __all__ = [
     "dotmul_projection",
     "dotmul_operator",
     "repeat_layer",
+    "seq_reshape_layer",
     "table_projection",
     "mixed_layer",
     "data_layer",
...@@ -125,6 +126,7 @@ class LayerType(object):
     GRUMEMORY = "gated_recurrent"
     SEQUENCE_LAST_INSTANCE = "seqlastins"
     SEQUENCE_FIRST_INSTANCE = "seqfirstins"
+    SEQUENCE_RESHAPE = "seqreshape"
     POOLING_MAX = "max"
     POOLING_AVG = 'average'
     FC_LAYER = "fc"
...@@ -1450,6 +1452,61 @@ def repeat_layer(input, num_repeats, name=None, layer_attr=None):
         parents=[input])
+
+
+@wrap_name_default("seqreshape")
+@wrap_act_default(act=IdentityActivation())
+@wrap_bias_attr_default(has_bias=False)
+@layer_support()
+def seq_reshape_layer(input,
+                      reshape_size,
+                      act=None,
+                      name=None,
+                      layer_attr=None,
+                      bias_attr=None):
+    """
+    A layer for reshaping the sequence. Assume the input sequence has T
+    instances and the dimension of each instance is M; if reshape_size is N,
+    then the output sequence has T*M/N instances, each of dimension N.
+
+    Note that T*M/N must be an integer.
+
+    The example usage is:
+
+    .. code-block:: python
+
+       reshape = seq_reshape_layer(input=layer, reshape_size=4)
+
+    :param input: Input layer.
+    :type input: LayerOutput
+    :param reshape_size: the dimension of each instance in the reshaped sequence.
+    :type reshape_size: int
+    :param name: Layer name.
+    :type name: basestring
+    :param act: Activation type.
+    :type act: BaseActivation
+    :param layer_attr: extra layer attributes.
+    :type layer_attr: ExtraLayerAttribute
+    :param bias_attr: The bias attribute. If False, or anything that is not a
+                      ParameterAttribute, is passed, no bias is added; if None,
+                      a default bias is used.
+    :type bias_attr: ParameterAttribute or None or bool
+    :return: LayerOutput object.
+    :rtype: LayerOutput
+    """
+    Layer(
+        inputs=[input.name],
+        name=name,
+        size=reshape_size,
+        type=LayerType.SEQUENCE_RESHAPE,
+        bias=ParamAttr.to_bias(bias_attr),
+        **ExtraAttr.to_kwargs(layer_attr))
+    return LayerOutput(
+        name=name,
+        size=reshape_size,
+        layer_type=LayerType.SEQUENCE_RESHAPE,
+        parents=[input])
 
 @wrap_name_default()
 @layer_support()
 def interpolation_layer(input, weight, name=None, layer_attr=None):
...@@ -2604,6 +2661,10 @@ def seq_concat_layer(a, b, act=None, name=None, layer_attr=None,
     :type act: BaseActivation
     :param layer_attr: Extra Layer Attribute.
     :type layer_attr: ExtraLayerAttribute
+    :param bias_attr: The bias attribute. If False, or anything that is not a
+                      ParameterAttribute, is passed, no bias is added; if None,
+                      a default bias is used.
+    :type bias_attr: ParameterAttribute or None or bool
     :return: LayerOutput object.
     :rtype: LayerOutput
     """
......
...@@ -5,6 +5,6 @@ last_first_seq test_expand_layer test_ntm_layers test_hsigmoid
 img_layers img_trans_layers util_layers simple_rnn_layers unused_layers test_cost_layers
 test_rnn_group shared_fc shared_lstm shared_gru test_cost_layers_with_weight
 test_spp_layer test_bilinear_interp test_maxout test_bi_grumemory math_ops
-test_seq_concat)
+test_seq_concat_reshape)
 
 export whole_configs=(test_split_datasource)
...@@ -23,17 +23,29 @@ layers {
     input_layer_name: "data2"
   }
 }
+layers {
+  name: "__seqreshape_0__"
+  type: "seqreshape"
+  size: 5
+  active_type: "linear"
+  inputs {
+    input_layer_name: "data1"
+  }
+}
 input_layer_names: "data1"
 input_layer_names: "data2"
 output_layer_names: "__seqconcat_0__"
+output_layer_names: "__seqreshape_0__"
 sub_models {
   name: "root"
   layer_names: "data1"
   layer_names: "data2"
   layer_names: "__seqconcat_0__"
+  layer_names: "__seqreshape_0__"
   input_layer_names: "data1"
   input_layer_names: "data2"
   output_layer_names: "__seqconcat_0__"
+  output_layer_names: "__seqreshape_0__"
   is_recurrent_layer_group: false
 }
...@@ -3,7 +3,10 @@ from paddle.trainer_config_helpers import *
 settings(batch_size=1000, learning_rate=1e-5)
 
 din1 = data_layer(name='data1', size=30)
 din2 = data_layer(name='data2', size=30)
 
-outputs(seq_concat_layer(a=din1, b=din2))
+opts = []
+opts.append(seq_concat_layer(a=din1, b=din2))
+opts.append(seq_reshape_layer(input=din1, reshape_size=5))
+outputs(opts)
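As a sanity check on the test config above (an illustration, not part of the commit): data1 has size 30 and reshape_size is 5, so each input instance of dimension 30 is re-read as 6 instances of dimension 5, which is why the generated protobuf earlier in this diff reports size: 5 for __seqreshape_0__.

```python
# Hypothetical arithmetic check for the test config above (not commit code).
input_dim, reshape_size = 30, 5          # from data1 and seq_reshape_layer
assert input_dim % reshape_size == 0     # T*M/N must be an integer
print(input_dim // reshape_size)         # 6 output instances per input instance
```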
...@@ -21,15 +21,8 @@ import data_type
 import py_paddle.swig_paddle as api
 
 __all__ = [
-    'optimizer',
-    'layer',
-    'activation',
-    'parameters',
-    'init',
-    'trainer',
-    'event',
-    'data_type',
-    'data_feeder',
+    'optimizer', 'layer', 'activation', 'parameters', 'init', 'trainer',
+    'event', 'data_type', 'data_feeder'
 ]
......
...@@ -66,12 +66,14 @@ Also, the creation of a protobuf message is hidden in the invocation of
 paddle.v2.parameters.create, no longer exposed to users.
 """
+import collections
+
 import paddle.trainer_config_helpers as conf_helps
-from . import data_type as v2_data
 from paddle.trainer_config_helpers.config_parser_utils import \
     parse_network_config as __parse__
 from paddle.trainer_config_helpers.default_decorators import wrap_name_default
-import collections
+
+import data_type
 
 __all__ = [
     'parse_network', 'data', 'fc', 'max_id', 'classification_cost',
...@@ -166,7 +168,7 @@ So we also need to implement some special LayerV2.
 class DataLayerV2(Layer):
     def __init__(self, name, type, **kwargs):
-        assert isinstance(type, v2_data.InputType)
+        assert isinstance(type, data_type.InputType)
         self.type = type
         self.__method_name__ = 'data_layer'
...@@ -198,8 +200,8 @@ cross_entropy_cost = __convert_to_v2__(
     parent_names=['input', 'label'])
 
 if __name__ == '__main__':
-    pixel = data(name='pixel', type=v2_data.dense_vector(784))
-    label = data(name='label', type=v2_data.integer_value(10))
+    pixel = data(name='pixel', type=data_type.dense_vector(784))
+    label = data(name='label', type=data_type.integer_value(10))
     hidden = fc(input=pixel, size=100, act=conf_helps.SigmoidActivation())
     inference = fc(input=hidden, size=10, act=conf_helps.SoftmaxActivation())
     maxid = max_id(input=inference)
......