未验证 提交 5f31737b 编写于 作者: X xiaoting 提交者: GitHub

fix interpolate launch error (#35577)

* fix interpolate launch error, test=develop

* fix area mode for interp, test=develop
上级 e641c638
...@@ -1035,9 +1035,9 @@ static void Interpolate1DCUDAFwd(const framework::ExecutionContext& ctx, ...@@ -1035,9 +1035,9 @@ static void Interpolate1DCUDAFwd(const framework::ExecutionContext& ctx,
: static_cast<float>(new_scale_w); : static_cast<float>(new_scale_w);
} }
int in_cw = c * in_w; int64_t in_cw = c * in_w;
int out_cw = c * out_w; int64_t out_cw = c * out_w;
int pixelNum = n * out_cw; auto pixelNum = n * out_cw;
platform::GpuLaunchConfig config = platform::GpuLaunchConfig config =
platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum); platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum);
...@@ -1169,12 +1169,12 @@ static void Interpolate2DCUDAFwd(const framework::ExecutionContext& ctx, ...@@ -1169,12 +1169,12 @@ static void Interpolate2DCUDAFwd(const framework::ExecutionContext& ctx,
: static_cast<float>(new_scale_w); : static_cast<float>(new_scale_w);
} }
int in_hw = in_h * in_w; int64_t in_hw = in_h * in_w;
int out_hw = out_h * out_w; int64_t out_hw = out_h * out_w;
int in_chw = c * in_hw; int64_t in_chw = c * in_hw;
int out_chw = c * out_hw; int64_t out_chw = c * out_hw;
int pixelNum = n * out_chw; auto pixelNum = n * out_chw;
platform::GpuLaunchConfig config = platform::GpuLaunchConfig config =
platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum); platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum);
...@@ -1355,12 +1355,12 @@ static void Interpolate3DCUDAFwd(const framework::ExecutionContext& ctx, ...@@ -1355,12 +1355,12 @@ static void Interpolate3DCUDAFwd(const framework::ExecutionContext& ctx,
: static_cast<float>(new_scale_w); : static_cast<float>(new_scale_w);
} }
int in_dhw = in_d * in_h * in_w; int64_t in_dhw = in_d * in_h * in_w;
int out_dhw = out_d * out_h * out_w; int64_t out_dhw = out_d * out_h * out_w;
int in_cdhw = c * in_dhw; int64_t in_cdhw = c * in_dhw;
int out_cdhw = c * out_dhw; int64_t out_cdhw = c * out_dhw;
int pixelNum = n * out_cdhw; auto pixelNum = n * out_cdhw;
platform::GpuLaunchConfig config = platform::GpuLaunchConfig config =
platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum); platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum);
...@@ -1456,9 +1456,9 @@ static void Interpolate1DCUDABwd(const framework::ExecutionContext& ctx, ...@@ -1456,9 +1456,9 @@ static void Interpolate1DCUDABwd(const framework::ExecutionContext& ctx,
ratio_w = (align_corners) ? static_cast<float>(in_w - 1) / (out_w - 1) ratio_w = (align_corners) ? static_cast<float>(in_w - 1) / (out_w - 1)
: static_cast<float>(new_scale_w); : static_cast<float>(new_scale_w);
} }
int in_cw = c * in_w; int64_t in_cw = c * in_w;
int out_cw = c * out_w; int64_t out_cw = c * out_w;
int pixelNum = n * out_cw; auto pixelNum = n * out_cw;
platform::GpuLaunchConfig config = platform::GpuLaunchConfig config =
platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum); platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum);
...@@ -1587,11 +1587,11 @@ static void Interpolate2DCUDABwd(const framework::ExecutionContext& ctx, ...@@ -1587,11 +1587,11 @@ static void Interpolate2DCUDABwd(const framework::ExecutionContext& ctx,
: static_cast<float>(new_scale_w); : static_cast<float>(new_scale_w);
} }
int in_hw = in_h * in_w; int64_t in_hw = in_h * in_w;
int out_hw = out_h * out_w; int64_t out_hw = out_h * out_w;
int in_chw = c * in_hw; int64_t in_chw = c * in_hw;
int out_chw = c * out_hw; int64_t out_chw = c * out_hw;
int pixelNum = n * out_chw; auto pixelNum = n * out_chw;
platform::GpuLaunchConfig config = platform::GpuLaunchConfig config =
platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum); platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum);
...@@ -1773,12 +1773,12 @@ static void Interpolate3DCUDABwd(const framework::ExecutionContext& ctx, ...@@ -1773,12 +1773,12 @@ static void Interpolate3DCUDABwd(const framework::ExecutionContext& ctx,
: static_cast<float>(new_scale_w); : static_cast<float>(new_scale_w);
} }
int in_dhw = in_d * in_h * in_w; int64_t in_dhw = in_d * in_h * in_w;
int out_dhw = out_d * out_h * out_w; int64_t out_dhw = out_d * out_h * out_w;
int in_cdhw = c * in_dhw; int64_t in_cdhw = c * in_dhw;
int out_cdhw = c * out_dhw; int64_t out_cdhw = c * out_dhw;
int pixelNum = n * out_cdhw; auto pixelNum = n * out_cdhw;
platform::GpuLaunchConfig config = platform::GpuLaunchConfig config =
platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum); platform::GetGpuLaunchConfig1D(ctx.cuda_device_context(), pixelNum);
......
...@@ -295,12 +295,15 @@ def interpolate(x, ...@@ -295,12 +295,15 @@ def interpolate(x,
"align_corners option can only be set with the interpolating modes: linear | bilinear | bicubic | trilinear" "align_corners option can only be set with the interpolating modes: linear | bilinear | bicubic | trilinear"
) )
if resample == 'AREA' and len(x.shape) == 3: if resample == 'AREA':
if isinstance(size, list) or isinstance(size, tuple):
if len(size) == 0:
raise ValueError("output size can not be empty")
if len(x.shape) == 3:
return paddle.nn.functional.adaptive_avg_pool1d(x, size) return paddle.nn.functional.adaptive_avg_pool1d(x, size)
elif len(x.shape) == 4:
if resample == 'AREA' and len(x.shape) == 4:
return paddle.nn.functional.adaptive_avg_pool2d(x, size) return paddle.nn.functional.adaptive_avg_pool2d(x, size)
if resample == 'AREA' and len(x.shape) == 5: elif len(x.shape) == 5:
return paddle.nn.functional.adaptive_avg_pool3d(x, size) return paddle.nn.functional.adaptive_avg_pool3d(x, size)
helper = LayerHelper('{}_interp_v2'.format(resample_type), **locals()) helper = LayerHelper('{}_interp_v2'.format(resample_type), **locals())
...@@ -342,14 +345,13 @@ def interpolate(x, ...@@ -342,14 +345,13 @@ def interpolate(x,
out_shape = size out_shape = size
scale = scale_factor scale = scale_factor
if out_shape is not None and scale is not None: if out_shape is not None and scale is not None:
raise ValueError("Only one of size or scale_factor should be defined.") raise ValueError("Only one of size or scale_factor should be defined.")
if out_shape is not None: if out_shape is not None:
if isinstance(out_shape, Variable) and not in_dygraph_mode(): if isinstance(out_shape, Variable) and not in_dygraph_mode():
out_shape.stop_gradient = True out_shape.stop_gradient = True
inputs['OutSize'] = out_shape inputs['OutSize'] = out_shape
else: else:
if in_dygraph_mode(): if in_dygraph_mode():
if isinstance(out_shape, Variable): if isinstance(out_shape, Variable):
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册