test_gated_unit_layer.protostr 2.2 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106
type: "nn"
layers {
  name: "input"
  type: "data"
  size: 256
  active_type: ""
}
layers {
  name: "__gated_unit_layer_0___input_proj"
  type: "fc"
  size: 512
  active_type: "tanh"
  inputs {
    input_layer_name: "input"
    input_parameter_name: "___gated_unit_layer_0___input_proj.w0"
  }
  bias_parameter_name: "___gated_unit_layer_0___input_proj.wbias"
  error_clipping_threshold: 100.0
}
layers {
  name: "__gated_unit_layer_0___gate"
  type: "fc"
  size: 512
  active_type: "sigmoid"
  inputs {
    input_layer_name: "input"
    input_parameter_name: "___gated_unit_layer_0___gate.w0"
  }
  bias_parameter_name: "___gated_unit_layer_0___gate.wbias"
  error_clipping_threshold: 100.0
}
layers {
  name: "__gated_unit_layer_0___gated_act"
  type: "mixed"
  size: 512
  active_type: ""
  inputs {
    input_layer_name: "__gated_unit_layer_0___input_proj"
  }
  inputs {
    input_layer_name: "__gated_unit_layer_0___gate"
  }
  error_clipping_threshold: 100.0
  operator_confs {
    type: "dot_mul"
    input_indices: 0
    input_indices: 1
    input_sizes: 512
    input_sizes: 512
    output_size: 512
    dotmul_scale: 1
  }
}
parameters {
  name: "___gated_unit_layer_0___input_proj.w0"
  size: 131072
  initial_mean: 0.0
  initial_std: 0.0001
  dims: 256
  dims: 512
  initial_strategy: 0
  initial_smart: false
}
parameters {
  name: "___gated_unit_layer_0___input_proj.wbias"
  size: 512
  initial_mean: 0.0
  initial_std: 1
  dims: 1
  dims: 512
  initial_strategy: 0
  initial_smart: false
}
parameters {
  name: "___gated_unit_layer_0___gate.w0"
  size: 131072
  initial_mean: 0.0
  initial_std: 0.0001
  dims: 256
  dims: 512
  initial_strategy: 0
  initial_smart: false
}
parameters {
  name: "___gated_unit_layer_0___gate.wbias"
  size: 512
  initial_mean: 0.0
  initial_std: 1
  dims: 1
  dims: 512
  initial_strategy: 0
  initial_smart: false
}
input_layer_names: "input"
output_layer_names: "__gated_unit_layer_0___gated_act"
sub_models {
  name: "root"
  layer_names: "input"
  layer_names: "__gated_unit_layer_0___input_proj"
  layer_names: "__gated_unit_layer_0___gate"
  layer_names: "__gated_unit_layer_0___gated_act"
  input_layer_names: "input"
  output_layer_names: "__gated_unit_layer_0___gated_act"
  is_recurrent_layer_group: false
}