From fb2a9cdf83a8fa7e026032011b361ef08d0570a2 Mon Sep 17 00:00:00 2001 From: chengduo <30176695+chengduoZH@users.noreply.github.com> Date: Fri, 27 Sep 2019 15:47:14 +0800 Subject: [PATCH] Add fp16 support for pad and split (#19881) * make pad and split support fp16 test=develop --- paddle/fluid/operators/math/padding.h | 2 +- paddle/fluid/operators/pad_op.cu | 9 +++- paddle/fluid/operators/pad_op.h | 6 +-- paddle/fluid/operators/split_op.cc | 11 ++-- paddle/fluid/operators/split_op.cu.cc | 10 ++-- .../fluid/tests/unittests/test_concat_op.py | 53 +++++++++++++------ .../fluid/tests/unittests/test_pad_op.py | 27 +++++++++- .../fluid/tests/unittests/test_split_op.py | 24 ++++++++- 8 files changed, 110 insertions(+), 32 deletions(-) diff --git a/paddle/fluid/operators/math/padding.h b/paddle/fluid/operators/math/padding.h index 3ae25eae98..8bacb5def4 100644 --- a/paddle/fluid/operators/math/padding.h +++ b/paddle/fluid/operators/math/padding.h @@ -58,7 +58,7 @@ void PadGradFunction(const framework::ExecutionContext& context, auto src_tensor = EigenTensor::From(src); auto& place = *context.template device_context().eigen_device(); - d_out_tensor.device(place) = src_tensor.pad(paddings, 0); + d_out_tensor.device(place) = src_tensor.pad(paddings, static_cast(0)); } template diff --git a/paddle/fluid/operators/pad_op.cu b/paddle/fluid/operators/pad_op.cu index 95098a8dca..e07c99b12b 100644 --- a/paddle/fluid/operators/pad_op.cu +++ b/paddle/fluid/operators/pad_op.cu @@ -14,7 +14,12 @@ limitations under the License. */ #include "paddle/fluid/operators/pad_op.h" namespace ops = paddle::operators; +namespace plat = paddle::platform; REGISTER_OP_CUDA_KERNEL( - pad, ops::PadKernel); + pad, ops::PadKernel, + ops::PadKernel, + ops::PadKernel); REGISTER_OP_CUDA_KERNEL( - pad_grad, ops::PadGradKernel); + pad_grad, ops::PadGradKernel, + ops::PadGradKernel, + ops::PadGradKernel); diff --git a/paddle/fluid/operators/pad_op.h b/paddle/fluid/operators/pad_op.h index 32698dac49..d494c954e1 100644 --- a/paddle/fluid/operators/pad_op.h +++ b/paddle/fluid/operators/pad_op.h @@ -30,14 +30,14 @@ class PadKernel : public framework::OpKernel { public: void Compute(const framework::ExecutionContext& context) const override { auto pads = context.Attr>("paddings"); - T pad_value = context.Attr("pad_value"); + float pad_value = context.Attr("pad_value"); auto* x = context.Input("X"); auto* out = context.Output("Out"); out->mutable_data(context.GetPlace()); int rank = x->dims().size(); - math::PaddingFunctor(rank, context, pads, pad_value, *x, - out); + math::PaddingFunctor(rank, context, pads, + static_cast(pad_value), *x, out); } }; diff --git a/paddle/fluid/operators/split_op.cc b/paddle/fluid/operators/split_op.cc index a43bad8781..f224c807bd 100644 --- a/paddle/fluid/operators/split_op.cc +++ b/paddle/fluid/operators/split_op.cc @@ -119,10 +119,11 @@ Example: } // namespace paddle namespace ops = paddle::operators; - +namespace plat = paddle::platform; REGISTER_OPERATOR(split, ops::SplitOp, ops::SplitOpMaker, ops::SplitGradMaker); REGISTER_OP_CPU_KERNEL( - split, ops::SplitOpKernel, - ops::SplitOpKernel, - ops::SplitOpKernel, - ops::SplitOpKernel); + split, ops::SplitOpKernel, + ops::SplitOpKernel, + ops::SplitOpKernel, + ops::SplitOpKernel, + ops::SplitOpKernel); diff --git a/paddle/fluid/operators/split_op.cu.cc b/paddle/fluid/operators/split_op.cu.cc index 18e0904681..bbdac686a2 100644 --- a/paddle/fluid/operators/split_op.cu.cc +++ b/paddle/fluid/operators/split_op.cu.cc @@ -14,8 +14,10 @@ limitations under the License. */ #include "paddle/fluid/operators/split_op.h" namespace ops = paddle::operators; +namespace plat = paddle::platform; REGISTER_OP_CUDA_KERNEL( - split, ops::SplitOpKernel, - ops::SplitOpKernel, - ops::SplitOpKernel, - ops::SplitOpKernel); + split, ops::SplitOpKernel, + ops::SplitOpKernel, + ops::SplitOpKernel, + ops::SplitOpKernel, + ops::SplitOpKernel); diff --git a/python/paddle/fluid/tests/unittests/test_concat_op.py b/python/paddle/fluid/tests/unittests/test_concat_op.py index b5d1115723..3ba2002a66 100644 --- a/python/paddle/fluid/tests/unittests/test_concat_op.py +++ b/python/paddle/fluid/tests/unittests/test_concat_op.py @@ -22,6 +22,7 @@ from op_test import OpTest class TestConcatOp(OpTest): def setUp(self): self.op_type = "concat" + self.dtype = self.get_dtype() self.init_test_data() self.inputs = {'X': [('x0', self.x0), ('x1', self.x1), ('x2', self.x2)]} self.attrs = {'axis': self.axis} @@ -36,6 +37,9 @@ class TestConcatOp(OpTest): (self.x0, self.x1, self.x2), axis=self.actual_axis) } + def get_dtype(self): + return "float32" + def test_check_output(self): self.check_output() @@ -45,25 +49,25 @@ class TestConcatOp(OpTest): self.check_grad(['x2'], 'Out') def init_test_data(self): - self.x0 = np.random.random((2, 1, 4, 5)).astype('float32') - self.x1 = np.random.random((2, 2, 4, 5)).astype('float32') - self.x2 = np.random.random((2, 3, 4, 5)).astype('float32') + self.x0 = np.random.random((2, 1, 4, 5)).astype(self.dtype) + self.x1 = np.random.random((2, 2, 4, 5)).astype(self.dtype) + self.x2 = np.random.random((2, 3, 4, 5)).astype(self.dtype) self.axis = 1 class TestConcatOp2(TestConcatOp): def init_test_data(self): - self.x0 = np.random.random((2, 3, 4, 5)).astype('float32') - self.x1 = np.random.random((2, 3, 4, 5)).astype('float32') - self.x2 = np.random.random((2, 3, 4, 5)).astype('float32') + self.x0 = np.random.random((2, 3, 4, 5)).astype(self.dtype) + self.x1 = np.random.random((2, 3, 4, 5)).astype(self.dtype) + self.x2 = np.random.random((2, 3, 4, 5)).astype(self.dtype) self.axis = 1 class TestConcatOp3(TestConcatOp): def init_test_data(self): - self.x0 = np.random.random((1, 256, 170, 256)).astype('float32') - self.x1 = np.random.random((1, 128, 170, 256)).astype('float32') - self.x2 = np.random.random((1, 128, 170, 256)).astype('float32') + self.x0 = np.random.random((1, 256, 170, 256)).astype(self.dtype) + self.x1 = np.random.random((1, 128, 170, 256)).astype(self.dtype) + self.x2 = np.random.random((1, 128, 170, 256)).astype(self.dtype) self.axis = 1 def test_check_grad(self): @@ -72,9 +76,9 @@ class TestConcatOp3(TestConcatOp): class TestConcatOp4(TestConcatOp): def init_test_data(self): - self.x0 = np.random.random((2, 3, 4, 5)).astype('float32') - self.x1 = np.random.random((2, 3, 4, 5)).astype('float32') - self.x2 = np.random.random((0, 3, 4, 5)).astype('float32') + self.x0 = np.random.random((2, 3, 4, 5)).astype(self.dtype) + self.x1 = np.random.random((2, 3, 4, 5)).astype(self.dtype) + self.x2 = np.random.random((0, 3, 4, 5)).astype(self.dtype) self.axis = 0 def test_check_grad(self): @@ -83,11 +87,30 @@ class TestConcatOp4(TestConcatOp): class TestConcatOp5(TestConcatOp): def init_test_data(self): - self.x0 = np.random.random((2, 1, 4, 5)).astype('float32') - self.x1 = np.random.random((2, 2, 4, 5)).astype('float32') - self.x2 = np.random.random((2, 3, 4, 5)).astype('float32') + self.x0 = np.random.random((2, 1, 4, 5)).astype(self.dtype) + self.x1 = np.random.random((2, 2, 4, 5)).astype(self.dtype) + self.x2 = np.random.random((2, 3, 4, 5)).astype(self.dtype) self.axis = -3 +#----------------Concat Fp16---------------- + + +def create_test_fp16(parent): + class TestConcatFp16(parent): + def get_dtype(self): + return np.float16 + + cls_name = "{0}_{1}".format(parent.__name__, "Fp16") + TestConcatFp16.__name__ = cls_name + globals()[cls_name] = TestConcatFp16 + + +create_test_fp16(TestConcatOp) +create_test_fp16(TestConcatOp2) +create_test_fp16(TestConcatOp3) +create_test_fp16(TestConcatOp4) +create_test_fp16(TestConcatOp5) + if __name__ == '__main__': unittest.main() diff --git a/python/paddle/fluid/tests/unittests/test_pad_op.py b/python/paddle/fluid/tests/unittests/test_pad_op.py index 58e56ca1a4..e2afa19091 100644 --- a/python/paddle/fluid/tests/unittests/test_pad_op.py +++ b/python/paddle/fluid/tests/unittests/test_pad_op.py @@ -22,8 +22,9 @@ from op_test import OpTest class TestPadOp(OpTest): def setUp(self): self.initTestCase() + self.dtype = self.get_dtype() self.op_type = "pad" - self.inputs = {'X': np.random.random(self.shape).astype("float32"), } + self.inputs = {'X': np.random.random(self.shape).astype(self.dtype), } self.attrs = {} self.attrs['paddings'] = np.array(self.paddings).flatten() self.attrs['pad_value'] = self.pad_value @@ -34,6 +35,9 @@ class TestPadOp(OpTest): constant_values=self.pad_value) } + def get_dtype(self): + return np.float32 + def test_check_output(self): self.check_output() @@ -67,5 +71,26 @@ class TestCase3(TestPadOp): self.pad_value = 0.9 +#----------------Pad Fp16---------------- + + +def create_test_fp16(parent): + class TestPadFp16(parent): + def get_dtype(self): + return np.float16 + + def test_check_grad_normal(self): + self.check_grad(['X'], 'Out', max_relative_error=0.3) + + cls_name = "{0}_{1}".format(parent.__name__, "Fp16") + TestPadFp16.__name__ = cls_name + globals()[cls_name] = TestPadFp16 + + +create_test_fp16(TestPadOp) +create_test_fp16(TestCase1) +create_test_fp16(TestCase2) +create_test_fp16(TestCase3) + if __name__ == '__main__': unittest.main() diff --git a/python/paddle/fluid/tests/unittests/test_split_op.py b/python/paddle/fluid/tests/unittests/test_split_op.py index 3c5dd782f8..0374edb9a2 100644 --- a/python/paddle/fluid/tests/unittests/test_split_op.py +++ b/python/paddle/fluid/tests/unittests/test_split_op.py @@ -22,14 +22,18 @@ from op_test import OpTest class TestSplitOp(OpTest): def setUp(self): self._set_op_type() + self.dtype = self.get_dtype() axis = 1 - x = np.random.random((4, 5, 6)).astype('float32') + x = np.random.random((4, 5, 6)).astype(self.dtype) out = np.split(x, [2, 3], axis) self.inputs = {'X': x} self.attrs = {'axis': axis, 'sections': [2, 1, 2]} self.outputs = {'Out': [('out%d' % i, out[i]) \ for i in range(len(out))]} + def get_dtype(self): + return "float32" + def _set_op_type(self): self.op_type = "split" @@ -45,5 +49,23 @@ class TestSplitByrefOp(OpTest): self.op_type = "split_byref" +#----------------Split Fp16---------------- + + +def create_test_fp16(parent): + class TestSplitFp16(parent): + def get_dtype(self): + return np.float16 + + def test_check_grad(self): + pass + + cls_name = "{0}_{1}".format(parent.__name__, "Fp16") + TestSplitFp16.__name__ = cls_name + globals()[cls_name] = TestSplitFp16 + + +create_test_fp16(TestSplitOp) + if __name__ == '__main__': unittest.main() -- GitLab