From 34f67a88a625ea3d5aeea470a75d287e2e54d4cc Mon Sep 17 00:00:00 2001
From: Kaipeng Deng
Date: Tue, 8 Nov 2022 20:31:18 +0800
Subject: [PATCH] add fuse_multi_transformer passes to fp16. test=develop (#47733)

---
 paddle/fluid/inference/api/paddle_pass_builder.cc | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/paddle/fluid/inference/api/paddle_pass_builder.cc b/paddle/fluid/inference/api/paddle_pass_builder.cc
index 770cf4577b1..28fd91e3ba3 100755
--- a/paddle/fluid/inference/api/paddle_pass_builder.cc
+++ b/paddle/fluid/inference/api/paddle_pass_builder.cc
@@ -163,6 +163,12 @@ const std::vector<std::string> kGpuLowerPrecisionPasses{
     "conv_elementwise_add2_act_fuse_pass",
     "conv_elementwise_add_fuse_pass",
     "multihead_matmul_fuse_pass_v2",
+    "fused_multi_transformer_encoder_pass",
+    "fused_multi_transformer_decoder_pass",
+    "fused_multi_transformer_encoder_fuse_qkv_pass",
+    "fused_multi_transformer_decoder_fuse_qkv_pass",
+    "multi_devices_fused_multi_transformer_encoder_fuse_qkv_pass",
+    "multi_devices_fused_multi_transformer_decoder_fuse_qkv_pass",
     "gpu_cpu_map_matmul_v2_to_mul_pass",
     "gpu_cpu_map_matmul_v2_to_matmul_pass",
     "fc_fuse_pass",
-- 
GitLab