// Patch summary for paddle/fluid/operators/conv_mkldnn_op.cc (unified git diff, two hunks).
//
// Hunk 1 (-147,14 +147,15), ConvMKLDNNHandler::AcquireBiasMemoryFromPrimitive:
//   * Adds a new parameter `bool is_persistent = false`, placed after `pipeline`
//     and before `is_INT8`.
//   * Forwards `is_persistent` to this->AcquireMemory(...) in the argument slot
//     that previously received the hard-coded literal `false`; the remaining
//     arguments (is_INT8, scale_data, mask) are passed through unchanged.
//
// Hunk 2 (-547,7 +548,7), inside ConvMKLDNNOpKernel:
//   * The call that supplies is_INT8 / scale_bias_data / mask_reorder now also
//     passes `is_test` as the new `is_persistent` argument.
//   * The call in the following `else` branch is unchanged context: it passes only
//     (user_bias_memory_p, pipeline), so `is_persistent` takes its default (false).
//
// NOTE(review): the new parameter is inserted in front of `is_INT8`, so any other
// caller that passes `is_INT8` positionally would now bind that value to
// `is_persistent`. Only the two call sites above are visible here -- confirm there
// are no others.
// NOTE(review): the else-branch call does not forward `is_test`; whether that is
// intentional cannot be determined from this patch -- confirm with the author.
// NOTE(review): this text has lost its line breaks, and template argument lists
// appear to be missing (e.g. bare `std::shared_ptr`, `std::vector`, `data()`),
// presumably from extraction. Treat it as a record of the change, not as an
// applicable patch.
diff --git a/paddle/fluid/operators/conv_mkldnn_op.cc b/paddle/fluid/operators/conv_mkldnn_op.cc index 31d45c08bff497d111d6b87cd7f75f7a057aba03..ca7275d044e6f77a54e14b3fa7d01a01c8c1dfb3 100644 --- a/paddle/fluid/operators/conv_mkldnn_op.cc +++ b/paddle/fluid/operators/conv_mkldnn_op.cc @@ -147,14 +147,15 @@ class ConvMKLDNNHandler : public platform::MKLDNNHandler { std::shared_ptr AcquireBiasMemoryFromPrimitive( const std::shared_ptr user_bias_memory_p, std::vector& pipeline, + bool is_persistent = false, bool is_INT8 = false, std::vector scale_data = {1.0f}, int mask = 0) { // NOLINT auto user_bias_pd = user_bias_memory_p->get_primitive_desc(); auto bias_pd = conv_pd_->bias_primitive_desc(); return this->AcquireMemory(bias_pd, user_bias_pd, user_bias_memory_p, - "@bias_mem_p", pipeline, - false, is_INT8, scale_data, mask); + "@bias_mem_p", pipeline, is_persistent, + is_INT8, scale_data, mask); } std::shared_ptr AcquireConvolution( @@ -547,7 +548,7 @@ class ConvMKLDNNOpKernel : public paddle::framework::OpKernel { scale_bias_data[i] = (*scale_in->data()) * (*(scale_weights->data() + i)); } bias_memory_p = - handler.AcquireBiasMemoryFromPrimitive(user_bias_memory_p, pipeline, is_INT8, scale_bias_data, mask_reorder); + handler.AcquireBiasMemoryFromPrimitive(user_bias_memory_p, pipeline, is_test, is_INT8, scale_bias_data, mask_reorder); } else{ bias_memory_p = handler.AcquireBiasMemoryFromPrimitive(user_bias_memory_p, pipeline);