Commit ec70ff45 authored by guosheng

Fix the inference batch_size in Transformer.

Parent f3c247d3
@@ -22,8 +22,7 @@ class TrainTaskConfig(object):
 class InferTaskConfig(object):
     use_gpu = False
     # the number of examples in one run for sequence generation.
-    # currently the batch size can only be set to 1.
-    batch_size = 1
+    batch_size = 10
     # the parameters for beam search.
     beam_size = 5
@@ -84,8 +84,11 @@ def translate_batch(exe, src_words, encoder, enc_in_names, enc_out_names,
         [-1e9]).astype("float32")
     # This is used to remove attention on the paddings of source sequences.
     trg_src_attn_bias = np.tile(
-        src_slf_attn_bias[:, :, ::src_max_length, :],
-        [beam_size, 1, trg_max_len, 1])
+        src_slf_attn_bias[:, :, ::src_max_length, :][:, np.newaxis],
+        [1, beam_size, 1, trg_max_len, 1]).reshape([
+            -1, src_slf_attn_bias.shape[1], trg_max_len,
+            src_slf_attn_bias.shape[-1]
+        ])
     trg_data_shape = np.array(
         [batch_size * beam_size, trg_max_len, d_model], dtype="int32")
     enc_output = np.tile(
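
Note on the fix: the decoder inputs are laid out with the beam_size candidates of each source sentence stored contiguously (see trg_data_shape, whose leading dimension is batch_size * beam_size). The old np.tile with [beam_size, 1, trg_max_len, 1] repeats the whole batch along axis 0, producing a beam-major order that coincides with the expected instance-major order only when batch_size is 1, which is presumably why the config previously capped batch_size at 1. Inserting a beam axis per sentence before tiling and flattening afterwards yields the instance-major order. A minimal NumPy sketch of the two tilings; all dimensions below are made up for illustration and do not come from the commit:

import numpy as np

# Hypothetical small dimensions so the row ordering is easy to see.
batch_size, n_head, src_max_len, trg_max_len, beam_size = 2, 1, 3, 2, 2

# Give each source sentence a distinct bias value to make the order visible.
src_slf_attn_bias = np.arange(batch_size, dtype="float32").reshape(
    [batch_size, 1, 1, 1]) * np.ones(
        [batch_size, n_head, src_max_len, src_max_len], dtype="float32")

# Keep only the first attention row per sentence: [batch, n_head, 1, src_len].
first_row = src_slf_attn_bias[:, :, ::src_max_len, :]

# Old tiling: repeats the whole batch along axis 0 (beam-major order).
old = np.tile(first_row, [beam_size, 1, trg_max_len, 1])

# New tiling: insert a beam axis per sentence, tile, then flatten back,
# so each sentence's beam candidates end up contiguous (instance-major).
new = np.tile(first_row[:, np.newaxis],
              [1, beam_size, 1, trg_max_len, 1]).reshape(
                  [-1, n_head, trg_max_len, src_max_len])

print(old[:, 0, 0, 0])  # [0. 1. 0. 1.] -- sentences interleaved across beams
print(new[:, 0, 0, 0])  # [0. 0. 1. 1.] -- beams grouped per sentence

With batch_size == 1 both orderings produce identical arrays, which matches the config change above: the restriction to a single sentence per inference run is no longer needed.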