From caca568746f790efcc5739f028de04036b7c9f1e Mon Sep 17 00:00:00 2001 From: Kaipeng Deng Date: Tue, 8 Nov 2022 15:31:34 +0800 Subject: [PATCH] add fuse_multi_transformer passes to fp16. test=develop (#47676) --- paddle/fluid/inference/api/paddle_pass_builder.cc | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/paddle/fluid/inference/api/paddle_pass_builder.cc b/paddle/fluid/inference/api/paddle_pass_builder.cc index ae7b81e9c3..4c6ab76dba 100755 --- a/paddle/fluid/inference/api/paddle_pass_builder.cc +++ b/paddle/fluid/inference/api/paddle_pass_builder.cc @@ -170,6 +170,12 @@ const std::vector<std::string> kGpuLowerPrecisionPasses{ "conv_elementwise_add2_act_fuse_pass", "conv_elementwise_add_fuse_pass", "multihead_matmul_fuse_pass_v2", + "fused_multi_transformer_encoder_pass", + "fused_multi_transformer_decoder_pass", + "fused_multi_transformer_encoder_fuse_qkv_pass", + "fused_multi_transformer_decoder_fuse_qkv_pass", + "multi_devices_fused_multi_transformer_encoder_fuse_qkv_pass", + "multi_devices_fused_multi_transformer_decoder_fuse_qkv_pass", "gpu_cpu_map_matmul_v2_to_mul_pass", "gpu_cpu_map_matmul_v2_to_matmul_pass", "fc_fuse_pass", -- GitLab