未验证 提交 1a7f2de3 编写于 作者: Y ykkk2333 提交者: GitHub

add adaptive pool and softmax with cross entropy supports different axis, * test = kunlun (#44428)

* add xpu pnorm op and fix pool op, *test=kunlun

* add adaptive pool, and softmax with cross entropy supports different axis, *test=kunlun
上级 5414694b
...@@ -102,6 +102,7 @@ class P_NormXPUKernel : public framework::OpKernel<T> { ...@@ -102,6 +102,7 @@ class P_NormXPUKernel : public framework::OpKernel<T> {
XPUType* zeros = RAII_GUARD.alloc_l3_or_gm<XPUType>(1); XPUType* zeros = RAII_GUARD.alloc_l3_or_gm<XPUType>(1);
PADDLE_ENFORCE_XDNN_NOT_NULL(zeros); PADDLE_ENFORCE_XDNN_NOT_NULL(zeros);
r = xpu::constant(dev_ctx.x_context(), zeros, 1, 0.0f); r = xpu::constant(dev_ctx.x_context(), zeros, 1, 0.0f);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "constant");
std::vector<int> zeros_dim(1, 1); std::vector<int> zeros_dim(1, 1);
bool* tmp2_x = RAII_GUARD.alloc_l3_or_gm<bool>(m * t * n); bool* tmp2_x = RAII_GUARD.alloc_l3_or_gm<bool>(m * t * n);
......
...@@ -60,11 +60,7 @@ class PoolXPUKernel : public framework::OpKernel<T> { ...@@ -60,11 +60,7 @@ class PoolXPUKernel : public framework::OpKernel<T> {
2, 2,
platform::errors::InvalidArgument( platform::errors::InvalidArgument(
"The Pool2d XPU OP only support 2 dimension pooling!")); "The Pool2d XPU OP only support 2 dimension pooling!"));
PADDLE_ENFORCE_EQ(!adaptive || (ksize[0] * ksize[1] == 1),
true,
platform::errors::InvalidArgument(
"The Pool2d XPU OP does not support (adaptive == "
"true && output_size != 1)"));
int* index_data = nullptr; int* index_data = nullptr;
bool global_pooling = context.Attr<bool>("global_pooling") || bool global_pooling = context.Attr<bool>("global_pooling") ||
(adaptive && (ksize[0] * ksize[1] == 1)); (adaptive && (ksize[0] * ksize[1] == 1));
...@@ -80,6 +76,9 @@ class PoolXPUKernel : public framework::OpKernel<T> { ...@@ -80,6 +76,9 @@ class PoolXPUKernel : public framework::OpKernel<T> {
const int in_h = in_x->dims()[2]; const int in_h = in_x->dims()[2];
const int in_w = in_x->dims()[3]; const int in_w = in_x->dims()[3];
const int out_h = out->dims()[2];
const int out_w = out->dims()[3];
framework::DDim data_dims; framework::DDim data_dims;
data_dims = phi::slice_ddim(in_x->dims(), 2, in_x->dims().size()); data_dims = phi::slice_ddim(in_x->dims(), 2, in_x->dims().size());
...@@ -90,9 +89,13 @@ class PoolXPUKernel : public framework::OpKernel<T> { ...@@ -90,9 +89,13 @@ class PoolXPUKernel : public framework::OpKernel<T> {
data_dims, data_dims,
strides, strides,
ksize); ksize);
if (ceil_mode) { if (ceil_mode) {
paddings[1] += (strides[0] - 1); int in_h_ceil = (out_h - 1) * strides[0] + ksize[0] - 2 * paddings[0];
paddings[3] += (strides[1] - 1); int in_w_ceil = (out_w - 1) * strides[1] + ksize[1] - 2 * paddings[2];
paddings[1] += (in_h_ceil - in_h);
paddings[3] += (in_w_ceil - in_w);
} }
auto input = reinterpret_cast<const XPUType*>(in_x->data<T>()); auto input = reinterpret_cast<const XPUType*>(in_x->data<T>());
...@@ -100,35 +103,65 @@ class PoolXPUKernel : public framework::OpKernel<T> { ...@@ -100,35 +103,65 @@ class PoolXPUKernel : public framework::OpKernel<T> {
auto output = reinterpret_cast<XPUType*>(out->data<T>()); auto output = reinterpret_cast<XPUType*>(out->data<T>());
auto& dev_ctx = context.template device_context<DeviceContext>(); auto& dev_ctx = context.template device_context<DeviceContext>();
int r = xpu::Error_t::SUCCESS; int r = xpu::Error_t::SUCCESS;
if (pooling_type == "max") { if (!adaptive) {
r = xpu::max_pool2d<XPUType>(dev_ctx.x_context(), if (pooling_type == "max") {
input, r = xpu::max_pool2d<XPUType>(dev_ctx.x_context(),
output, input,
index_data, output,
n, index_data,
c, n,
in_h, c,
in_w, in_h,
ksize, in_w,
strides, ksize,
paddings, strides,
true); paddings,
} else if (pooling_type == "avg") { true);
r = xpu::avg_pool2d<XPUType>(dev_ctx.x_context(), } else if (pooling_type == "avg") {
input, r = xpu::avg_pool2d<XPUType>(dev_ctx.x_context(),
output, input,
n, output,
c, n,
in_h, c,
in_w, in_h,
ksize, in_w,
strides, ksize,
paddings, strides,
!exclusive, paddings,
true); !exclusive,
true);
} else {
PADDLE_THROW(platform::errors::InvalidArgument(
"Unsupported pooling type for kunlun ", pooling_type));
}
} else { } else {
PADDLE_THROW(platform::errors::InvalidArgument( if (pooling_type == "max") {
"Unsupported pooling type for kunlun ", pooling_type)); r = xpu::adaptive_max_pool2d<XPUType>(dev_ctx.x_context(),
input,
output,
index_data,
n,
c,
in_h,
in_w,
out_h,
out_w,
true);
} else if (pooling_type == "avg") {
r = xpu::adaptive_avg_pool2d<XPUType>(dev_ctx.x_context(),
input,
output,
n,
c,
in_h,
in_w,
out_h,
out_w,
true);
} else {
PADDLE_THROW(platform::errors::InvalidArgument(
"Unsupported pooling type for kunlun ", pooling_type));
}
} }
PADDLE_ENFORCE_EQ(r, PADDLE_ENFORCE_EQ(r,
xpu::Error_t::SUCCESS, xpu::Error_t::SUCCESS,
...@@ -167,11 +200,6 @@ class PoolGradXPUKernel : public framework::OpKernel<T> { ...@@ -167,11 +200,6 @@ class PoolGradXPUKernel : public framework::OpKernel<T> {
"dimension pooling!, but received " "dimension pooling!, but received "
"%d-dimension pool kernel size", "%d-dimension pool kernel size",
ksize.size())); ksize.size()));
PADDLE_ENFORCE_EQ(!adaptive || (ksize[0] * ksize[1] == 1),
true,
platform::errors::InvalidArgument(
"The Pool2d XPU OP does not support (adaptive == "
"true && output_size != 1)"));
bool global_pooling = context.Attr<bool>("global_pooling") || bool global_pooling = context.Attr<bool>("global_pooling") ||
(adaptive && (ksize[0] * ksize[1] == 1)); (adaptive && (ksize[0] * ksize[1] == 1));
if (global_pooling) { if (global_pooling) {
...@@ -188,6 +216,16 @@ class PoolGradXPUKernel : public framework::OpKernel<T> { ...@@ -188,6 +216,16 @@ class PoolGradXPUKernel : public framework::OpKernel<T> {
const int in_h = in_x->dims()[2]; const int in_h = in_x->dims()[2];
const int in_w = in_x->dims()[3]; const int in_w = in_x->dims()[3];
const int out_h = out->dims()[2];
const int out_w = out->dims()[3];
PADDLE_ENFORCE_EQ(!adaptive || (ksize[0] * ksize[1] == 1) ||
(in_h % out_h == 0 && in_w % out_w == 0),
true,
platform::errors::InvalidArgument(
"The Pool2d XPU OP does not support (adaptive == "
"true && output_size != 1)"));
framework::DDim data_dims; framework::DDim data_dims;
data_dims = phi::slice_ddim(in_x->dims(), 2, in_x->dims().size()); data_dims = phi::slice_ddim(in_x->dims(), 2, in_x->dims().size());
...@@ -199,8 +237,11 @@ class PoolGradXPUKernel : public framework::OpKernel<T> { ...@@ -199,8 +237,11 @@ class PoolGradXPUKernel : public framework::OpKernel<T> {
strides, strides,
ksize); ksize);
if (ceil_mode) { if (ceil_mode) {
paddings[1] += (strides[0] - 1); int in_h_ceil = (out_h - 1) * strides[0] + ksize[0] - 2 * paddings[0];
paddings[3] += (strides[1] - 1); int in_w_ceil = (out_w - 1) * strides[1] + ksize[1] - 2 * paddings[2];
paddings[1] += (in_h_ceil - in_h);
paddings[3] += (in_w_ceil - in_w);
} }
auto input = reinterpret_cast<const XPUType*>(in_x->data<T>()); auto input = reinterpret_cast<const XPUType*>(in_x->data<T>());
...@@ -210,6 +251,14 @@ class PoolGradXPUKernel : public framework::OpKernel<T> { ...@@ -210,6 +251,14 @@ class PoolGradXPUKernel : public framework::OpKernel<T> {
auto input_grad = reinterpret_cast<XPUType*>(in_x_grad->data<T>()); auto input_grad = reinterpret_cast<XPUType*>(in_x_grad->data<T>());
auto& dev_ctx = context.template device_context<DeviceContext>(); auto& dev_ctx = context.template device_context<DeviceContext>();
int r = xpu::Error_t::SUCCESS; int r = xpu::Error_t::SUCCESS;
if (adaptive && in_h % out_h == 0 && in_w % out_w == 0) {
strides = {in_h / out_h, in_w / out_w};
int kh = in_h - (out_h - 1) * strides[0];
int kw = in_w - (out_w - 1) * strides[1];
ksize = {kh, kw};
paddings = {0, 0, 0, 0};
}
if (pooling_type == "max") { if (pooling_type == "max") {
r = xpu::max_pool2d_grad<XPUType>(dev_ctx.x_context(), r = xpu::max_pool2d_grad<XPUType>(dev_ctx.x_context(),
input, input,
......
...@@ -45,10 +45,6 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> { ...@@ -45,10 +45,6 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> {
Tensor* loss = context.Output<Tensor>("Loss"); Tensor* loss = context.Output<Tensor>("Loss");
const int rank = logits->dims().size(); const int rank = logits->dims().size();
const int axis = phi::funcs::CanonicalAxis(context.Attr<int>("axis"), rank); const int axis = phi::funcs::CanonicalAxis(context.Attr<int>("axis"), rank);
PADDLE_ENFORCE_EQ(
axis,
rank - 1,
platform::errors::InvalidArgument("axis should == rank - 1"));
softmax->mutable_data<T>(context.GetPlace()); softmax->mutable_data<T>(context.GetPlace());
loss->mutable_data<T>(context.GetPlace()); loss->mutable_data<T>(context.GetPlace());
const int n = phi::funcs::SizeToAxis(axis, logits->dims()); const int n = phi::funcs::SizeToAxis(axis, logits->dims());
...@@ -56,17 +52,20 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> { ...@@ -56,17 +52,20 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> {
std::vector<int> logits_dims = phi::vectorize<int>(logits->dims()); std::vector<int> logits_dims = phi::vectorize<int>(logits->dims());
const bool soft_label = context.Attr<bool>("soft_label"); const bool soft_label = context.Attr<bool>("soft_label");
int t = logits_dims[axis];
auto logits_data = reinterpret_cast<const XPUType*>(logits->data<T>()); auto logits_data = reinterpret_cast<const XPUType*>(logits->data<T>());
auto softmax_data = reinterpret_cast<XPUType*>(softmax->data<T>()); auto softmax_data = reinterpret_cast<XPUType*>(softmax->data<T>());
auto loss_data = reinterpret_cast<XPUType*>(loss->data<T>()); auto loss_data = reinterpret_cast<XPUType*>(loss->data<T>());
// softmax // softmax
auto& dev_ctx = auto& dev_ctx =
context.template device_context<platform::XPUDeviceContext>(); context.template device_context<platform::XPUDeviceContext>();
int r = XPU_SUCCESS; int r = XPU_SUCCESS;
xpu::ctx_guard RAII_GUARD(dev_ctx.x_context());
if (platform::get_xpu_version(context.GetPlace().GetDeviceId()) == if (platform::get_xpu_version(context.GetPlace().GetDeviceId()) ==
phi::backends::xpu::XPUVersion::XPU2 && phi::backends::xpu::XPUVersion::XPU2 &&
soft_label) { soft_label && axis == rank - 1) {
auto labels_data = reinterpret_cast<const XPUType*>(labels->data<T>()); auto labels_data = reinterpret_cast<const XPUType*>(labels->data<T>());
r = xpu::soft_softmax_with_cross_entropy<XPUType>(dev_ctx.x_context(), r = xpu::soft_softmax_with_cross_entropy<XPUType>(dev_ctx.x_context(),
logits_data, logits_data,
...@@ -79,7 +78,6 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> { ...@@ -79,7 +78,6 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> {
return; return;
} }
xpu::ctx_guard RAII_GUARD(dev_ctx.x_context());
int len = logits->numel(); int len = logits->numel();
T* clip_logits = RAII_GUARD.alloc_l3_or_gm<T>(len); T* clip_logits = RAII_GUARD.alloc_l3_or_gm<T>(len);
PADDLE_ENFORCE_XDNN_NOT_NULL(clip_logits); PADDLE_ENFORCE_XDNN_NOT_NULL(clip_logits);
...@@ -105,10 +103,38 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> { ...@@ -105,10 +103,38 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> {
PADDLE_ENFORCE_XDNN_SUCCESS(r, "softmax"); PADDLE_ENFORCE_XDNN_SUCCESS(r, "softmax");
// cross_entropy // cross_entropy
if (axis != rank - 1) {
XPUType* trans_softmax = RAII_GUARD.alloc_l3_or_gm<XPUType>(n * d);
PADDLE_ENFORCE_XDNN_NOT_NULL(trans_softmax);
r = xpu::transpose(dev_ctx.x_context(),
softmax_data,
trans_softmax,
{n, t, d / t},
{0, 2, 1});
PADDLE_ENFORCE_XDNN_SUCCESS(r, "transpose");
softmax_data = trans_softmax;
}
if (soft_label) { if (soft_label) {
auto labels_data = reinterpret_cast<const XPUType*>(labels->data<T>()); auto labels_data = reinterpret_cast<const XPUType*>(labels->data<T>());
r = xpu::soft_cross_entropy<XPUType>( if (axis != rank - 1) {
dev_ctx.x_context(), softmax_data, labels_data, loss_data, n, d); XPUType* trans_label = RAII_GUARD.alloc_l3_or_gm<XPUType>(n * d);
PADDLE_ENFORCE_XDNN_NOT_NULL(trans_label);
r = xpu::transpose(dev_ctx.x_context(),
labels_data,
trans_label,
{n, t, d / t},
{0, 2, 1});
PADDLE_ENFORCE_XDNN_SUCCESS(r, "transpose");
labels_data = trans_label;
}
r = xpu::soft_cross_entropy<XPUType>(dev_ctx.x_context(),
softmax_data,
labels_data,
loss_data,
axis == rank - 1 ? n : n * d / t,
axis == rank - 1 ? d : t);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "soft_cross_entropy"); PADDLE_ENFORCE_XDNN_SUCCESS(r, "soft_cross_entropy");
} else { } else {
auto ignore_index = context.Attr<int>("ignore_index"); auto ignore_index = context.Attr<int>("ignore_index");
...@@ -127,8 +153,8 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> { ...@@ -127,8 +153,8 @@ class SoftmaxWithCrossEntropyXPUKernel : public framework::OpKernel<T> {
labels_int32.data<int32_t>(), labels_int32.data<int32_t>(),
loss_data, loss_data,
nullptr, nullptr,
n, axis == rank - 1 ? n : n * d / t,
d, axis == rank - 1 ? d : t,
ignore_index); ignore_index);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "hard_cross_entropy"); PADDLE_ENFORCE_XDNN_SUCCESS(r, "hard_cross_entropy");
} }
...@@ -157,10 +183,6 @@ class SoftmaxWithCrossEntropyGradXPUKernel : public framework::OpKernel<T> { ...@@ -157,10 +183,6 @@ class SoftmaxWithCrossEntropyGradXPUKernel : public framework::OpKernel<T> {
const int rank = logit_grad->dims().size(); const int rank = logit_grad->dims().size();
const int axis = phi::funcs::CanonicalAxis(context.Attr<int>("axis"), rank); const int axis = phi::funcs::CanonicalAxis(context.Attr<int>("axis"), rank);
PADDLE_ENFORCE_EQ(
axis,
rank - 1,
platform::errors::InvalidArgument("axis should == rank - 1"));
const int n = phi::funcs::SizeToAxis(axis, logit_grad->dims()); const int n = phi::funcs::SizeToAxis(axis, logit_grad->dims());
const int d = phi::funcs::SizeFromAxis(axis, logit_grad->dims()); const int d = phi::funcs::SizeFromAxis(axis, logit_grad->dims());
...@@ -168,40 +190,107 @@ class SoftmaxWithCrossEntropyGradXPUKernel : public framework::OpKernel<T> { ...@@ -168,40 +190,107 @@ class SoftmaxWithCrossEntropyGradXPUKernel : public framework::OpKernel<T> {
context.template device_context<platform::XPUDeviceContext>(); context.template device_context<platform::XPUDeviceContext>();
int r = XPU_SUCCESS; int r = XPU_SUCCESS;
if (soft_label) { if (axis == rank - 1) {
r = xpu::soft_softmax_with_cross_entropy_grad<XPUType>( if (soft_label) {
dev_ctx.x_context(), r = xpu::soft_softmax_with_cross_entropy_grad<XPUType>(
reinterpret_cast<const XPUType*>(out_grad->data<T>()), dev_ctx.x_context(),
reinterpret_cast<const XPUType*>(labels->data<T>()), reinterpret_cast<const XPUType*>(out_grad->data<T>()),
reinterpret_cast<const XPUType*>(softmax->data<T>()), reinterpret_cast<const XPUType*>(labels->data<T>()),
reinterpret_cast<XPUType*>(logit_grad->data<T>()), reinterpret_cast<const XPUType*>(softmax->data<T>()),
use_softmax, reinterpret_cast<XPUType*>(logit_grad->data<T>()),
n, use_softmax,
d); n,
PADDLE_ENFORCE_XDNN_SUCCESS(r, "soft_softmax_with_cross_entropy_grad"); d);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "soft_softmax_with_cross_entropy_grad");
} else {
xpu::ctx_guard RAII_GUARD(dev_ctx.x_context());
int* labels_int_ptr_l3 =
RAII_GUARD.alloc_l3_or_gm<int32_t>(labels->numel());
PADDLE_ENFORCE_XDNN_NOT_NULL(labels_int_ptr_l3);
r = xpu::cast_v2<int64_t, int32_t>(dev_ctx.x_context(),
labels->data<int64_t>(),
labels_int_ptr_l3,
labels->numel());
PADDLE_ENFORCE_XDNN_SUCCESS(r, "cast_v2");
r = xpu::hard_softmax_with_cross_entropy_grad<XPUType, int>(
dev_ctx.x_context(),
reinterpret_cast<const XPUType*>(out_grad->data<T>()),
labels_int_ptr_l3,
reinterpret_cast<const XPUType*>(softmax->data<T>()),
reinterpret_cast<XPUType*>(logit_grad->data<T>()),
ignore_index,
use_softmax,
n,
d);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "hard_softmax_with_cross_entropy_grad");
}
} else { } else {
int t = logit_grad->dims()[axis];
xpu::ctx_guard RAII_GUARD(dev_ctx.x_context()); xpu::ctx_guard RAII_GUARD(dev_ctx.x_context());
int* labels_int_ptr_l3 = int len = softmax->numel();
RAII_GUARD.alloc_l3_or_gm<int32_t>(labels->numel()); XPUType* trans_logit = RAII_GUARD.alloc_l3_or_gm<XPUType>(len);
PADDLE_ENFORCE_XDNN_NOT_NULL(labels_int_ptr_l3); PADDLE_ENFORCE_XDNN_NOT_NULL(trans_logit);
r = xpu::cast_v2<int64_t, int32_t>(dev_ctx.x_context(), XPUType* trans_softmax = RAII_GUARD.alloc_l3_or_gm<XPUType>(len);
labels->data<int64_t>(), PADDLE_ENFORCE_XDNN_NOT_NULL(trans_softmax);
labels_int_ptr_l3, r = xpu::transpose(dev_ctx.x_context(),
labels->numel()); reinterpret_cast<const XPUType*>(softmax->data<T>()),
PADDLE_ENFORCE_XDNN_SUCCESS(r, "cast_v2"); trans_softmax,
{n, t, d / t},
{0, 2, 1});
PADDLE_ENFORCE_XDNN_SUCCESS(r, "transpose");
if (soft_label) {
XPUType* trans_labels = RAII_GUARD.alloc_l3_or_gm<XPUType>(len);
PADDLE_ENFORCE_XDNN_NOT_NULL(trans_labels);
r = xpu::transpose(dev_ctx.x_context(),
reinterpret_cast<const XPUType*>(labels->data<T>()),
trans_labels,
{n, t, d / t},
{0, 2, 1});
PADDLE_ENFORCE_XDNN_SUCCESS(r, "transpose");
r = xpu::soft_softmax_with_cross_entropy_grad<XPUType>(
dev_ctx.x_context(),
reinterpret_cast<const XPUType*>(out_grad->data<T>()),
trans_labels,
trans_softmax,
trans_logit,
use_softmax,
n * d / t,
t);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "soft_softmax_with_cross_entropy_grad");
} else {
int* labels_int_ptr_l3 =
RAII_GUARD.alloc_l3_or_gm<int32_t>(labels->numel());
PADDLE_ENFORCE_XDNN_NOT_NULL(labels_int_ptr_l3);
r = xpu::cast_v2<int64_t, int32_t>(dev_ctx.x_context(),
labels->data<int64_t>(),
labels_int_ptr_l3,
labels->numel());
PADDLE_ENFORCE_XDNN_SUCCESS(r, "clip_v2");
r = xpu::hard_softmax_with_cross_entropy_grad<XPUType, int>(
dev_ctx.x_context(),
reinterpret_cast<const XPUType*>(out_grad->data<T>()),
labels_int_ptr_l3,
trans_softmax,
trans_logit,
ignore_index,
use_softmax,
n * d / t,
t);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "hard_softmax_with_cross_entropy_grad");
}
r = xpu::hard_softmax_with_cross_entropy_grad<XPUType, int>( r = xpu::transpose<XPUType>(
dev_ctx.x_context(), dev_ctx.x_context(),
reinterpret_cast<const XPUType*>(out_grad->data<T>()), trans_logit,
labels_int_ptr_l3,
reinterpret_cast<const XPUType*>(softmax->data<T>()),
reinterpret_cast<XPUType*>(logit_grad->data<T>()), reinterpret_cast<XPUType*>(logit_grad->data<T>()),
ignore_index, {n, d / t, t},
use_softmax, {0, 2, 1});
n, PADDLE_ENFORCE_XDNN_SUCCESS(r, "transpose");
d);
PADDLE_ENFORCE_XDNN_SUCCESS(r, "hard_softmax_with_cross_entropy_grad");
} }
} }
}; };
......
...@@ -541,6 +541,50 @@ class XPUTestPool2D_Op(XPUOpTestWrapper): ...@@ -541,6 +541,50 @@ class XPUTestPool2D_Op(XPUOpTestWrapper):
def init_ceil_mode(self): def init_ceil_mode(self):
self.ceil_mode = True self.ceil_mode = True
class TestCaseAdaptiveAvg(TestPool2D_Op):
def init_test_case(self):
self.ksize = [2, 2]
self.strides = [2, 2]
def init_paddings(self):
self.paddings = [0, 0]
def init_pool_type(self):
self.pool_type = "avg"
self.pool2D_forward_naive = avg_pool2D_forward_naive
def init_global_pool(self):
self.global_pool = False
def init_shape(self):
self.shape = [2, 4, 8, 8]
def init_adaptive_mode(self):
self.adaptive = True
class TestCaseAdaptiveMax(TestPool2D_Op):
def init_test_case(self):
self.ksize = [2, 2]
self.strides = [2, 2]
def init_paddings(self):
self.paddings = [0, 0]
def init_pool_type(self):
self.pool_type = "max"
self.pool2D_forward_naive = max_pool2D_forward_naive
def init_global_pool(self):
self.global_pool = False
def init_shape(self):
self.shape = [2, 4, 8, 8]
def init_adaptive_mode(self):
self.adaptive = True
support_types = get_xpu_op_support_types('pool2d') support_types = get_xpu_op_support_types('pool2d')
for stype in support_types: for stype in support_types:
......
...@@ -62,16 +62,21 @@ class XPUTestSoftmaxWithCrossEntropyOp(XPUOpTestWrapper): ...@@ -62,16 +62,21 @@ class XPUTestSoftmaxWithCrossEntropyOp(XPUOpTestWrapper):
for numeric_stable_mode in [True, False]: for numeric_stable_mode in [True, False]:
for shape in shapes: for shape in shapes:
for logits_type in [0, 1, 2]: for logits_type in [0, 1, 2]:
class_name = 'XPUTestSoftmaxWithCrossEntropy_' + \ for axis in range(len(shape)):
str(soft_label) + "_" + \ if (not numeric_stable_mode):
str(numeric_stable_mode) + "_" + \ axis = -1
str(shape) + "_" + \ class_name = 'XPUTestSoftmaxWithCrossEntropy_' + \
str(logits_type) str(soft_label) + "_" + \
attr_dict = {'soft_label': soft_label, \ str(numeric_stable_mode) + "_" + \
'numeric_stable_mode': numeric_stable_mode, \ str(shape) + "_" + \
'shape': shape, \ str(logits_type) + "_" + \
'logits_type': logits_type} str(axis)
classes.append([class_name, attr_dict]) attr_dict = {'soft_label': soft_label, \
'numeric_stable_mode': numeric_stable_mode, \
'shape': shape, \
'logits_type': logits_type,
'axis': axis}
classes.append([class_name, attr_dict])
return base_class, classes return base_class, classes
class TestSoftmaxWithCrossEntropyOp(XPUOpTest): class TestSoftmaxWithCrossEntropyOp(XPUOpTest):
...@@ -83,7 +88,6 @@ class XPUTestSoftmaxWithCrossEntropyOp(XPUOpTestWrapper): ...@@ -83,7 +88,6 @@ class XPUTestSoftmaxWithCrossEntropyOp(XPUOpTestWrapper):
self.op_type = "softmax_with_cross_entropy" self.op_type = "softmax_with_cross_entropy"
self.use_xpu = True self.use_xpu = True
self.dtype = np.float32 self.dtype = np.float32
self.axis = -1
self.ignore_index = -1 self.ignore_index = -1
if not hasattr(self, 'shape'): if not hasattr(self, 'shape'):
...@@ -91,6 +95,7 @@ class XPUTestSoftmaxWithCrossEntropyOp(XPUOpTestWrapper): ...@@ -91,6 +95,7 @@ class XPUTestSoftmaxWithCrossEntropyOp(XPUOpTestWrapper):
self.numeric_stable_mode = True self.numeric_stable_mode = True
self.logits_type = 0 self.logits_type = 0
self.soft_label = True self.soft_label = True
self.axis = -1
logits = getattr( logits = getattr(
self, "logits", self, "logits",
np.random.uniform(0.1, 1.0, self.shape).astype(self.dtype)) np.random.uniform(0.1, 1.0, self.shape).astype(self.dtype))
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册