// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #pragma once #include "paddle/fluid/platform/transform.h" #include "paddle/pten/api/ext/dispatch.h" #include "paddle/pten/core/dense_tensor.h" #include "paddle/pten/kernels/cast_kernel.h" #include "paddle/pten/kernels/hybird/eigen/reduce.h" namespace pten { namespace general { template void Reduce(const DeviceContext& dev_ctx, const DenseTensor& x, bool reduce_all, const std::vector& dims, bool keep_dim, DataType out_dtype, DenseTensor* out) { // If the dims has full dim, set the reduce_all is True const int& input_dim_size = x.dims().size(); std::set dims_set(dims.begin(), dims.end()); bool full_dim = true; for (int i = 0; i < input_dim_size; ++i) { if (dims_set.find(i) == dims_set.end() && dims_set.find(i - input_dim_size) == dims_set.end()) { full_dim = false; break; } } reduce_all = (reduce_all || full_dim); // no need to cast dtype if (out_dtype == pten::DataType::UNDEFINED || out_dtype == x.dtype()) { if (out_dtype == pten::DataType::UNDEFINED) { out_dtype = x.dtype(); } // do reduce sum PD_VISIT_ALL_TYPES( out_dtype, "ReduceKernelImpl", ([&] { pten::eigen::ReduceKernelImpl( dev_ctx, x, out, dims, keep_dim, reduce_all); })); } else { pten::DenseTensor tmp_tensor = pten::DenseTensor( pten::make_intrusive(x.place()), pten::DenseTensorMeta(out_dtype, x.dims(), x.layout())); // cast x tensor to out_dtype pten::Cast(dev_ctx, x, out_dtype, &tmp_tensor); // do reduce sum PD_VISIT_ALL_TYPES( out_dtype, "ReduceKernelImpl", ([&] { pten::eigen::ReduceKernelImpl( dev_ctx, tmp_tensor, out, dims, keep_dim, reduce_all); })); } } } // namespace general } // namespace pten