From d61d6d7500afde2d0d07f3d88756634014130a77 Mon Sep 17 00:00:00 2001 From: zhupengyang Date: Mon, 7 Sep 2020 19:55:29 +0800 Subject: [PATCH] add .part to speed up compile (#27044) (#27099) --- .../operators/reduce_ops/logsumexp_op.cu | 6 ----- .../operators/reduce_ops/logsumexp_op.part.cu | 22 +++++++++++++++++++ 2 files changed, 22 insertions(+), 6 deletions(-) create mode 100644 paddle/fluid/operators/reduce_ops/logsumexp_op.part.cu diff --git a/paddle/fluid/operators/reduce_ops/logsumexp_op.cu b/paddle/fluid/operators/reduce_ops/logsumexp_op.cu index c25e5d01b27..c9ad1075c0c 100644 --- a/paddle/fluid/operators/reduce_ops/logsumexp_op.cu +++ b/paddle/fluid/operators/reduce_ops/logsumexp_op.cu @@ -12,7 +12,6 @@ // See the License for the specific language governing permissions and // limitations under the License. -#include "paddle/fluid/operators/reduce_ops/cub_reduce.h" #include "paddle/fluid/operators/reduce_ops/logsumexp_op.h" REGISTER_OP_CUDA_KERNEL(logsumexp, @@ -20,8 +19,3 @@ REGISTER_OP_CUDA_KERNEL(logsumexp, float, ops::LogsumexpFunctor>, ops::ReduceKernel); -REGISTER_OP_CUDA_KERNEL( - logsumexp_grad, ops::ReduceGradKernel, - ops::ReduceGradKernel); diff --git a/paddle/fluid/operators/reduce_ops/logsumexp_op.part.cu b/paddle/fluid/operators/reduce_ops/logsumexp_op.part.cu new file mode 100644 index 00000000000..d6ad4863092 --- /dev/null +++ b/paddle/fluid/operators/reduce_ops/logsumexp_op.part.cu @@ -0,0 +1,22 @@ +// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved. +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +// .part used to speed up nvcc compile +#include "paddle/fluid/operators/reduce_ops/logsumexp_op.h" + +REGISTER_OP_CUDA_KERNEL( + logsumexp_grad, ops::ReduceGradKernel, + ops::ReduceGradKernel); -- GitLab