pool2d: support fp16 on XPU and update the pool2d unit test, test=kunlun (#40841)

4d198acb · zhangyikun02 · GitHub · d1c1d731 · 4d198acb · 4d198acb
Showing 2 changed files with 227 additions and 229 deletions

paddle/fluid/operators/pool_op_xpu.cc +28 -18

python/paddle/fluid/tests/unittests/xpu/test_pool2d_op_xpu.py +199 -211

未找到文件。
--- a/paddle/fluid/operators/pool_op_xpu.cc
+++ b/paddle/fluid/operators/pool_op_xpu.cc
@@ -37,6 +37,8 @@ xpu::Pooling_t XPUPoolingType(const std::string& pooltype, bool exclusive,
 template <typename DeviceContext, typename T>
 class PoolXPUKernel : public framework::OpKernel<T> {
+  using XPUType = typename XPUTypeTrait<T>::Type;
 public:
  void Compute(const framework::ExecutionContext& context) const override {
    const Tensor* in_x = context.Input<Tensor>("X");
@@ -68,17 +70,19 @@ class PoolXPUKernel : public framework::OpKernel<T> {
    const int c = in_x->dims()[1];
    const int in_h = in_x->dims()[2];
    const int in_w = in_x->dims()[3];
-    const float* input = in_x->data<float>();
+    auto input = reinterpret_cast<const XPUType*>(in_x->data<T>());
    out->mutable_data<T>(context.GetPlace());
-    float* output = out->data<float>();
+    auto output = reinterpret_cast<XPUType*>(out->data<T>());
    auto& dev_ctx = context.template device_context<DeviceContext>();
    int r = xpu::Error_t::SUCCESS;
    if (pooling_type == "max") {
-      r = xpu::max_pool2d(dev_ctx.x_context(), input, output, index_data, n, c,
+      r = xpu::max_pool2d<XPUType>(dev_ctx.x_context(), input, output,
-                          in_h, in_w, ksize, strides, paddings, true);
+                                   index_data, n, c, in_h, in_w, ksize, strides,
+                                   paddings, true);
    } else if (pooling_type == "avg") {
-      r = xpu::avg_pool2d(dev_ctx.x_context(), input, output, n, c, in_h, in_w,
+      r = xpu::avg_pool2d<XPUType>(dev_ctx.x_context(), input, output, n, c,
-                          ksize, strides, paddings, !exclusive, true);
+                                   in_h, in_w, ksize, strides, paddings,
+                                   !exclusive, true);
    } else {
      PADDLE_THROW(platform::errors::InvalidArgument(
          "Unsupported pooling type for kunlun ", pooling_type));
@@ -92,6 +96,8 @@ class PoolXPUKernel : public framework::OpKernel<T> {
 template <typename DeviceContext, typename T>
 class PoolGradXPUKernel : public framework::OpKernel<T> {
+  using XPUType = typename XPUTypeTrait<T>::Type;
 public:
  void Compute(const framework::ExecutionContext& context) const override {
    const Tensor* in_x = context.Input<Tensor>("X");
@@ -130,21 +136,21 @@ class PoolGradXPUKernel : public framework::OpKernel<T> {
    const int c = in_x->dims()[1];
    const int in_h = in_x->dims()[2];
    const int in_w = in_x->dims()[3];
-    const float* input = in_x->data<float>();
+    auto input = reinterpret_cast<const XPUType*>(in_x->data<T>());
-    const float* output = out->data<float>();
+    auto output = reinterpret_cast<const XPUType*>(out->data<T>());
-    const float* output_grad = out_grad->data<float>();
+    auto output_grad = reinterpret_cast<const XPUType*>(out_grad->data<T>());
    in_x_grad->mutable_data<T>(context.GetPlace());
-    float* input_grad = in_x_grad->data<float>();
+    auto input_grad = reinterpret_cast<XPUType*>(in_x_grad->data<T>());
    auto& dev_ctx = context.template device_context<DeviceContext>();
    int r = xpu::Error_t::SUCCESS;
    if (pooling_type == "max") {
-      r = xpu::max_pool2d_grad(dev_ctx.x_context(), input, output, index_data,
+      r = xpu::max_pool2d_grad<XPUType>(
-                               output_grad, input_grad, n, c, in_h, in_w, ksize,
+          dev_ctx.x_context(), input, output, index_data, output_grad,
-                               strides, paddings, true);
+          input_grad, n, c, in_h, in_w, ksize, strides, paddings, true);
    } else if (pooling_type == "avg") {
-      r = xpu::avg_pool2d_grad(dev_ctx.x_context(), input, output, output_grad,
+      r = xpu::avg_pool2d_grad<XPUType>(
-                               input_grad, n, c, in_h, in_w, ksize, strides,
+          dev_ctx.x_context(), input, output, output_grad, input_grad, n, c,
-                               paddings, !exclusive, true);
+          in_h, in_w, ksize, strides, paddings, !exclusive, true);
    } else {
      PADDLE_THROW(platform::errors::InvalidArgument(
          "Unsupported pooling type for kunlun ", pooling_type));
@@ -161,9 +167,13 @@ class PoolGradXPUKernel : public framework::OpKernel<T> {
 namespace ops = paddle::operators;
 REGISTER_OP_XPU_KERNEL(
-    pool2d, ops::PoolXPUKernel<paddle::platform::XPUDeviceContext, float>);
+    pool2d, ops::PoolXPUKernel<paddle::platform::XPUDeviceContext, float>,
+    ops::PoolXPUKernel<paddle::platform::XPUDeviceContext,
+                       paddle::platform::float16>);
 REGISTER_OP_XPU_KERNEL(
    pool2d_grad,
-    ops::PoolGradXPUKernel<paddle::platform::XPUDeviceContext, float>);
+    ops::PoolGradXPUKernel<paddle::platform::XPUDeviceContext, float>,
+    ops::PoolGradXPUKernel<paddle::platform::XPUDeviceContext,
+                           paddle::platform::float16>);
 #endif
--- a/python/paddle/fluid/tests/unittests/xpu/test_pool2d_op_xpu.py
+++ b/python/paddle/fluid/tests/unittests/xpu/test_pool2d_op_xpu.py
@@ -25,6 +25,7 @@ from op_test_xpu import XPUOpTest
 import paddle.fluid as fluid
 from paddle.fluid import Program, program_guard
 from test_pool2d_op import adaptive_start_index, adaptive_end_index
+from xpu.get_test_cover_info import create_test_class, get_xpu_op_support_types, XPUOpTestWrapper
 import paddle
 paddle.enable_static()
@@ -246,229 +247,216 @@ def pool2D_forward_naive(x,
    return out
-class TestPool2D_Op(XPUOpTest):
+class XPUTestPool2D_Op(XPUOpTestWrapper):
-    def setUp(self):
+    def __init__(self):
-        self.op_type = "pool2d"
+        self.op_name = 'pool2d'
-        self.use_cudnn = False
+        self.use_dynamic_create_class = False
-        self.init_kernel_type()
-        self.use_mkldnn = False
+    class TestPool2D_Op(XPUOpTest):
-        self.init_data_type()
+        def setUp(self):
-        self.init_test_case()
+            self.op_type = "pool2d"
-        self.padding_algorithm = "EXPLICIT"
+            self.dtype = self.in_type
-        self.init_paddings()
+            self.place = paddle.XPUPlace(0)
-        self.init_global_pool()
+            self.use_cudnn = False
-        self.init_kernel_type()
+            self.init_kernel_type()
-        self.init_pool_type()
+            self.use_mkldnn = False
-        self.init_ceil_mode()
+            self.init_test_case()
-        self.init_exclusive()
+            self.padding_algorithm = "EXPLICIT"
-        self.init_adaptive()
+            self.init_paddings()
-        self.init_data_format()
+            self.init_global_pool()
-        self.init_shape()
+            self.init_kernel_type()
+            self.init_pool_type()
-        input = np.random.random(self.shape).astype(self.dtype)
+            self.init_ceil_mode()
-        output = pool2D_forward_naive(
+            self.init_exclusive()
-            input, self.ksize, self.strides, self.paddings, self.global_pool,
+            self.init_adaptive()
-            self.ceil_mode, self.exclusive, self.adaptive, self.data_format,
+            self.init_data_format()
-            self.pool_type, self.padding_algorithm).astype(self.dtype)
+            self.init_shape()
-        self.inputs = {'X': XPUOpTest.np_dtype_to_fluid_dtype(input)}
+            input = np.random.random(self.shape).astype(self.dtype)
-        self.attrs = {
+            output = pool2D_forward_naive(
-            'strides': self.strides,
+                input, self.ksize, self.strides, self.paddings,
-            'paddings': self.paddings,
+                self.global_pool, self.ceil_mode, self.exclusive, self.adaptive,
-            'ksize': self.ksize,
+                self.data_format, self.pool_type,
-            'pooling_type': self.pool_type,
+                self.padding_algorithm).astype(self.dtype)
-            'global_pooling': self.global_pool,
+            self.inputs = {'X': XPUOpTest.np_dtype_to_fluid_dtype(input)}
-            'use_cudnn': self.use_cudnn,
-            'use_mkldnn': self.use_mkldnn,
+            self.attrs = {
-            'ceil_mode': self.ceil_mode,
+                'strides': self.strides,
-            'data_format': self.data_format,
+                'paddings': self.paddings,
-            'exclusive': self.exclusive,
+                'ksize': self.ksize,
-            'adaptive': self.adaptive,
+                'pooling_type': self.pool_type,
-            "padding_algorithm": self.padding_algorithm,
+                'global_pooling': self.global_pool,
-        }
+                'use_cudnn': self.use_cudnn,
+                'use_mkldnn': self.use_mkldnn,
+                'ceil_mode': self.ceil_mode,
+                'data_format': self.data_format,
+                'exclusive': self.exclusive,
+                'adaptive': self.adaptive,
+                "padding_algorithm": self.padding_algorithm,
+            }
+            self.outputs = {'Out': output}
+        def test_check_output(self):
+            self.check_output_with_place(self.place)
+        def test_check_grad(self):
+            self.check_grad_with_place(self.place, set(['X']), 'Out')
+        def init_data_format(self):
+            self.data_format = "NCHW"
+        def init_shape(self):
+            self.shape = [2, 3, 5, 5]
+        def init_test_case(self):
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+        def init_paddings(self):
+            self.paddings = [0, 0]
+            self.padding_algorithm = "EXPLICIT"
+        def init_kernel_type(self):
+            self.use_cudnn = False
+        def init_pool_type(self):
+            self.pool_type = "avg"
+            self.pool2D_forward_naive = avg_pool2D_forward_naive
+        def init_global_pool(self):
+            self.global_pool = True
+        def init_ceil_mode(self):
+            self.ceil_mode = False
+        def init_exclusive(self):
+            self.exclusive = True
+        def init_adaptive(self):
+            self.adaptive = False
+    class TestCase1(TestPool2D_Op):
+        def init_test_case(self):
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+        def init_paddings(self):
+            self.paddings = [0, 0]
+        def init_pool_type(self):
+            self.pool_type = "avg"
+            self.pool2D_forward_naive = avg_pool2D_forward_naive
+        def init_global_pool(self):
+            self.global_pool = False
+        def init_shape(self):
+            self.shape = [2, 3, 7, 7]
+    class TestCase2(TestPool2D_Op):
+        def init_test_case(self):
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+        def init_paddings(self):
+            self.paddings = [1, 1]
+        def init_pool_type(self):
+            self.pool_type = "avg"
+            self.pool2D_forward_naive = avg_pool2D_forward_naive
+        def init_global_pool(self):
+            self.global_pool = False
+        def init_shape(self):
+            self.shape = [2, 3, 7, 7]
+    class TestCase3(TestPool2D_Op):
+        def init_pool_type(self):
+            self.pool_type = "max"
+            self.pool2D_forward_naive = max_pool2D_forward_naive
+    class TestCase4(TestCase1):
+        def init_pool_type(self):
+            self.pool_type = "max"
+            self.pool2D_forward_naive = max_pool2D_forward_naive
+    class TestCase5(TestCase2):
+        def init_pool_type(self):
+            self.pool_type = "max"
+            self.pool2D_forward_naive = max_pool2D_forward_naive
-        self.outputs = {'Out': output}
+    class TestPool2D_AsyPadding(TestPool2D_Op):
+        def init_test_case(self):
-    def has_xpu(self):
+            self.ksize = [3, 3]
-        return core.is_compiled_with_xpu()
+            self.strides = [1, 1]
+            self.paddings = [1, 0, 1, 2]
-    def test_check_output(self):
+        def init_shape(self):
-        if self.has_xpu():
+            self.shape = [2, 3, 5, 5]
-            place = core.XPUPlace(0)
-            self.check_output_with_place(place)
-        return
-    def test_check_grad(self):
+    class TestCase1_AsyPadding(TestCase1):
-        if self.has_xpu():
+        def init_test_case(self):
-            place = core.XPUPlace(0)
+            self.ksize = [3, 3]
-            self.check_grad_with_place(place, set(['X']), 'Out')
+            self.strides = [1, 1]
-        return
+            self.paddings = [1, 0, 1, 0]
-    def init_data_format(self):
+        def init_shape(self):
-        self.data_format = "NCHW"
+            self.shape = [2, 3, 7, 7]
-    def init_shape(self):
+    class TestCase2_AsyPadding(TestCase2):
-        self.shape = [2, 3, 5, 5]
+        def init_test_case(self):
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+            self.paddings = [1, 2, 1, 2]
-    def init_test_case(self):
+        def init_shape(self):
-        self.ksize = [3, 3]
+            self.shape = [2, 3, 7, 7]
-        self.strides = [1, 1]
-    def init_paddings(self):
+    class TestCase3_AsyPadding(TestCase3):
-        self.paddings = [0, 0]
+        def init_test_case(self):
-        self.padding_algorithm = "EXPLICIT"
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+            self.paddings = [1, 0, 1, 2]
-    def init_kernel_type(self):
+        def init_shape(self):
-        self.use_cudnn = False
+            self.shape = [2, 3, 5, 5]
-    def init_data_type(self):
+    class TestCase4_AsyPadding(TestCase4):
-        self.dtype = np.float32
+        def init_test_case(self):
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+            self.paddings = [1, 0, 1, 0]
-    def init_pool_type(self):
+        def init_shape(self):
-        self.pool_type = "avg"
+            self.shape = [2, 3, 7, 7]
-        self.pool2D_forward_naive = avg_pool2D_forward_naive
-    def init_global_pool(self):
+    class TestCase5_AsyPadding(TestCase5):
-        self.global_pool = True
+        def init_test_case(self):
+            self.ksize = [3, 3]
-    def init_ceil_mode(self):
+            self.strides = [1, 1]
-        self.ceil_mode = False
+            self.paddings = [2, 2, 1, 2]
-    def init_exclusive(self):
+        def init_shape(self):
-        self.exclusive = True
+            self.shape = [2, 3, 7, 7]
-    def init_adaptive(self):
-        self.adaptive = False
-class TestCase1(TestPool2D_Op):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-    def init_paddings(self):
-        self.paddings = [0, 0]
-    def init_pool_type(self):
-        self.pool_type = "avg"
-        self.pool2D_forward_naive = avg_pool2D_forward_naive
-    def init_global_pool(self):
-        self.global_pool = False
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
-class TestCase2(TestPool2D_Op):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-    def init_paddings(self):
-        self.paddings = [1, 1]
-    def init_pool_type(self):
-        self.pool_type = "avg"
-        self.pool2D_forward_naive = avg_pool2D_forward_naive
-    def init_global_pool(self):
-        self.global_pool = False
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
-class TestCase3(TestPool2D_Op):
-    def init_pool_type(self):
-        self.pool_type = "max"
-        self.pool2D_forward_naive = max_pool2D_forward_naive
-class TestCase4(TestCase1):
-    def init_pool_type(self):
-        self.pool_type = "max"
-        self.pool2D_forward_naive = max_pool2D_forward_naive
-class TestCase5(TestCase2):
-    def init_pool_type(self):
-        self.pool_type = "max"
-        self.pool2D_forward_naive = max_pool2D_forward_naive
-class TestPool2D_AsyPadding(TestPool2D_Op):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [1, 0, 1, 2]
-    def init_shape(self):
-        self.shape = [2, 3, 5, 5]
-class TestCase1_AsyPadding(TestCase1):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [1, 0, 1, 0]
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
-class TestCase2_AsyPadding(TestCase2):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [1, 2, 1, 2]
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
-class TestCase3_AsyPadding(TestCase3):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [1, 0, 1, 2]
-    def init_shape(self):
-        self.shape = [2, 3, 5, 5]
-class TestCase4_AsyPadding(TestCase4):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [1, 0, 1, 0]
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
-class TestCase5_AsyPadding((TestCase5)):
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [2, 2, 1, 2]
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
-class TestAvgInclude_AsyPadding(TestCase2):
-    def init_exclusive(self):
-        self.exclusive = False
-    def init_test_case(self):
-        self.ksize = [3, 3]
-        self.strides = [1, 1]
-        self.paddings = [1, 2, 1, 2]
-    def init_shape(self):
-        self.shape = [2, 3, 7, 7]
+    class TestAvgInclude_AsyPadding(TestCase2):
+        def init_exclusive(self):
+            self.exclusive = False
+        def init_test_case(self):
+            self.ksize = [3, 3]
+            self.strides = [1, 1]
+            self.paddings = [1, 2, 1, 2]
+        def init_shape(self):
+            self.shape = [2, 3, 7, 7]
+support_types = get_xpu_op_support_types('pool2d')
+for stype in support_types:
+    create_test_class(globals(), XPUTestPool2D_Op, stype)
 if __name__ == '__main__':
    unittest.main()