Merge pull request #1762 from reyoung/feature/refine_nce_layer

Refine NCE Layer

Merge pull request #1762 from reyoung/feature/refine_nce_layer
Refine NCE Layer
4b1b599a · Yu Yang · GitHub · 7e6def58 · 7adad0c9 · 4b1b599a
显示空白变更内容
内联并排

Showing with 18 addition and 6 deletion

python/paddle/trainer_config_helpers/layers.py python/paddle/trainer_config_helpers/layers.py +18 -6

未找到文件。
--- a/python/paddle/trainer_config_helpers/layers.py
+++ b/python/paddle/trainer_config_helpers/layers.py
@@ -18,7 +18,7 @@ import inspect
 from paddle.trainer.config_parser import *
 from .activations import LinearActivation, SigmoidActivation, TanhActivation, \
-    ReluActivation, IdentityActivation, SoftmaxActivation
+    ReluActivation, IdentityActivation, SoftmaxActivation, BaseActivation
 from .evaluators import *
 from .poolings import MaxPooling, AvgPooling, BasePoolingType
 from .attrs import *
@@ -2253,7 +2253,8 @@ def img_pool_layer(input,
        pool_type.name = 'avg'
    type_name = pool_type.name + '-projection' \
-      if (isinstance(pool_type, AvgPooling) or isinstance(pool_type, MaxPooling)) \
+        if (
+    isinstance(pool_type, AvgPooling) or isinstance(pool_type, MaxPooling)) \
        else pool_type.name
    pool_size_y = pool_size if pool_size_y is None else pool_size_y
@@ -4807,12 +4808,14 @@ def crf_decoding_layer(input,
    return LayerOutput(name, LayerType.CRF_DECODING_LAYER, parents, size=1)
+@wrap_act_default(act=SigmoidActivation())
 @wrap_bias_attr_default(has_bias=True)
 @wrap_name_default()
 @layer_support()
 def nce_layer(input,
              label,
              num_classes,
+              act=None,
              weight=None,
              num_neg_samples=10,
              neg_distribution=None,
@@ -4841,6 +4844,8 @@ def nce_layer(input,
    :type weight: LayerOutput
    :param num_classes: number of classes.
    :type num_classes: int
+    :param act: Activation, default is Sigmoid.
+    :type act: BaseActivation
    :param num_neg_samples: number of negative samples. Default is 10.
    :type num_neg_samples: int
    :param neg_distribution: The distribution for generating the random negative labels.
@@ -4863,6 +4868,8 @@ def nce_layer(input,
        assert isinstance(neg_distribution, collections.Sequence)
        assert len(neg_distribution) == num_classes
        assert sum(neg_distribution) == 1
+    if not isinstance(act, BaseActivation):
+        raise TypeError()
    ipts_for_layer = []
    parents = []
@@ -4884,12 +4891,17 @@ def nce_layer(input,
        type=LayerType.NCE_LAYER,
        num_classes=num_classes,
        neg_sampling_dist=neg_distribution,
+        active_type=act.name,
        num_neg_samples=num_neg_samples,
        inputs=ipts_for_layer,
        bias=ParamAttr.to_bias(bias_attr),
        **ExtraLayerAttribute.to_kwargs(layer_attr))
    return LayerOutput(
-        name, LayerType.NCE_LAYER, parents=parents, size=l.config.size)
+        name,
+        LayerType.NCE_LAYER,
+        parents=parents,
+        size=l.config.size,
+        activation=act)
 """