提交 e2fd06c3 编写于 作者: C caoying03

refine name of the input parameter.

上级 ac69f773
...@@ -5879,19 +5879,19 @@ def prelu_layer(input, ...@@ -5879,19 +5879,19 @@ def prelu_layer(input,
size=l.config.size) size=l.config.size)
@layer_support(ERROR_CLIPPING, DROPOUT)
@wrap_name_default() @wrap_name_default()
@layer_support(ERROR_CLIPPING, DROPOUT)
@wrap_act_default(act=LinearActivation()) @wrap_act_default(act=LinearActivation())
def gated_unit_layer(input, def gated_unit_layer(input,
size, size,
act=None, act=None,
name=None, name=None,
gate_attr=None, gate_attr=None,
gate_bias_attr=True,
gate_param_attr=None, gate_param_attr=None,
gate_bias_attr=True,
inproj_attr=None,
inproj_param_attr=None, inproj_param_attr=None,
inproj_bias_attr=True, inproj_bias_attr=True,
inproj_layer_attr=None,
layer_attr=None): layer_attr=None):
""" """
The gated unit layer implements a simple gating mechanism over the input. The gated unit layer implements a simple gating mechanism over the input.
...@@ -5923,18 +5923,18 @@ def gated_unit_layer(input, ...@@ -5923,18 +5923,18 @@ def gated_unit_layer(input,
clipping threshold, dropout and so on. See ExtraLayerAttribute for clipping threshold, dropout and so on. See ExtraLayerAttribute for
more details. more details.
:type gate_attr: ExtraLayerAttribute|None :type gate_attr: ExtraLayerAttribute|None
:param gate_bias_attr: Attributes to tune the learnable bias of the gate.
:type gate_bias_attr: ParameterAttribute|None
:param gate_param_attr: Attributes to tune the learnable projected matrix :param gate_param_attr: Attributes to tune the learnable projected matrix
parameter of the gate. parameter of the gate.
:type gate_param_attr: ParameterAttribute|None :type gate_param_attr: ParameterAttribute|None
:param gate_bias_attr: Attributes to tune the learnable bias of the gate.
:type gate_bias_attr: ParameterAttribute|None
:param inproj_attr: Attributes to tune the projected input, for
example, error clipping threshold, dropout and so on. See
ExtraLayerAttribute for more details.
:type inproj_attr: ExtraLayerAttribute|None
:param inproj_param_attr: Attributes to tune the learnable parameter of :param inproj_param_attr: Attributes to tune the learnable parameter of
the projection of input. the projection of input.
:type inproj_param_attr: ParameterAttribute|None :type inproj_param_attr: ParameterAttribute|None
:param inproj_layer_attr: Attributes to tune the projected input, for
example, error clipping threshold, dropout and so on. See
ExtraLayerAttribute for more details.
:type inproj_layer_attr: ExtraLayerAttribute|None
:param inproj_bias_attr: Attributes to tune the learnable bias of :param inproj_bias_attr: Attributes to tune the learnable bias of
projection of the input. projection of the input.
:type inproj_bias_attr: ParameterAttribute|None :type inproj_bias_attr: ParameterAttribute|None
...@@ -5954,8 +5954,8 @@ def gated_unit_layer(input, ...@@ -5954,8 +5954,8 @@ def gated_unit_layer(input,
name="%s_input_proj" % name, name="%s_input_proj" % name,
size=size, size=size,
act=act, act=act,
layer_attr=inproj_attr,
param_attr=inproj_param_attr, param_attr=inproj_param_attr,
layer_attr=inproj_layer_attr,
bias_attr=inproj_bias_attr) bias_attr=inproj_bias_attr)
gate = fc_layer( gate = fc_layer(
...@@ -5963,8 +5963,8 @@ def gated_unit_layer(input, ...@@ -5963,8 +5963,8 @@ def gated_unit_layer(input,
name="%s_gate" % name, name="%s_gate" % name,
act=SigmoidActivation(), act=SigmoidActivation(),
input=input, input=input,
param_attr=gate_param_attr,
layer_attr=gate_attr, layer_attr=gate_attr,
param_attr=gate_param_attr,
bias_attr=gate_bias_attr) bias_attr=gate_bias_attr)
return mixed_layer( return mixed_layer(
name="%s_gated_act" % name, name="%s_gated_act" % name,
......
...@@ -5,11 +5,11 @@ glu = gated_unit_layer( ...@@ -5,11 +5,11 @@ glu = gated_unit_layer(
size=512, size=512,
input=data, input=data,
act=TanhActivation(), act=TanhActivation(),
gate_param_attr=ParamAttr(initial_std=1e-4),
gate_attr=ExtraLayerAttribute(error_clipping_threshold=100.0), gate_attr=ExtraLayerAttribute(error_clipping_threshold=100.0),
gate_param_attr=ParamAttr(initial_std=1e-4),
gate_bias_attr=ParamAttr(initial_std=1), gate_bias_attr=ParamAttr(initial_std=1),
inproj_attr=ExtraLayerAttribute(error_clipping_threshold=100.0),
inproj_param_attr=ParamAttr(initial_std=1e-4), inproj_param_attr=ParamAttr(initial_std=1e-4),
inproj_layer_attr=ExtraLayerAttribute(error_clipping_threshold=100.0),
inproj_bias_attr=ParamAttr(initial_std=1), inproj_bias_attr=ParamAttr(initial_std=1),
layer_attr=ExtraLayerAttribute(error_clipping_threshold=100.0)) layer_attr=ExtraLayerAttribute(error_clipping_threshold=100.0))
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册