// Copyright (c) 2022 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #include "paddle/phi/kernels/deformable_conv_kernel.h" #include "paddle/phi/backends/xpu/enforce_xpu.h" #include "paddle/phi/core/kernel_registry.h" namespace phi { template void DeformableConvKernel(const Context& dev_ctx, const DenseTensor& x, const DenseTensor& offset, const DenseTensor& filter, const paddle::optional& mask, const std::vector& strides, const std::vector& paddings, const std::vector& dilations, int deformable_groups, int groups, int im2col_step, DenseTensor* out) { dev_ctx.template Alloc(out); PADDLE_ENFORCE_EQ( deformable_groups == 1, true, errors::InvalidArgument( ("XPU only support deformable_groups == 1 in deformable_conv op."))); PADDLE_ENFORCE_EQ( groups == 1, true, errors::InvalidArgument( ("XPU only support groups == 1 in deformable_conv op."))); PADDLE_ENFORCE_EQ(filter.dims()[2] <= 8 && filter.dims()[3] <= 8, true, errors::InvalidArgument( "Filter high and weight should less than 8 on xpu " "in deformable_conv op.")); const int batch_size = static_cast(x.dims()[0]); std::vector output_shape_vec(phi::vectorize(out->dims())); const T* input_ptr = x.data(); const T* filter_ptr = filter.data(); const float* offset_ptr = offset.data(); const float* mask_ptr = mask->data(); T* output_prt = out->data(); // set zeros for d_table_data const int zero = 0; int r = xpu::constant(dev_ctx.x_context(), output_prt, out->numel(), zero); PADDLE_ENFORCE_XDNN_SUCCESS(r, "constant"); int input_dim = x.numel() / x.dims()[0]; int input_offset_dim = offset.numel() / offset.dims()[0]; int input_mask_dim = mask->numel() / mask->dims()[0]; int output_dim = output_shape_vec[1] * output_shape_vec[2] * output_shape_vec[3]; std::vector ksize{static_cast(filter.dims()[2]), static_cast(filter.dims()[3])}; int n = im2col_step; int c = x.dims()[1]; int h = x.dims()[2]; int w = x.dims()[3]; int f = filter.dims()[0]; for (int i = 0; i < batch_size / im2col_step; ++i) { int r = xpu::deformable_conv( dev_ctx.x_context(), input_ptr + i * im2col_step * input_dim, filter_ptr, offset_ptr + i * im2col_step * input_offset_dim, mask_ptr + i * im2col_step * input_mask_dim, output_prt + i * im2col_step * output_dim, n, c, h, w, f, ksize, strides, paddings, dilations, groups, deformable_groups, nullptr, nullptr, nullptr, true); PADDLE_ENFORCE_XDNN_SUCCESS(r, "deformable_conv"); } } } // namespace phi PD_REGISTER_KERNEL( deformable_conv, XPU, ALL_LAYOUT, phi::DeformableConvKernel, float) {}