提交 0fa0cbe0 编写于 作者: J Jiaying Zhao 提交者: GitHub

Merge pull request #1128 from smilejames/opencl

fix compilation problem
@@ -47,7 +47,7 @@ void DepthwiseConvKernel<GPU_CL, float>::Compute(
  int nh = default_work_size[2];
  auto input = param.Input()->GetCLImage();
  auto filter = param.Filter()->GetCLImage();
- auto output = param.Output();
+ auto output = param.Output()->GetCLImage();
  int stride = param.Strides()[0];
  int offset = param.Offset();
  int input_c = param.Input()->CBlock();
......
@@ -58,7 +58,7 @@ void FetchKernel<GPU_CL, float>::Compute(const FetchParam<GPU_CL> &param) {
  clEnqueueNDRangeKernel(this->cl_helper_.CLCommandQueue(), kernel, 3, NULL,
  default_work_size.data(), NULL, 0, NULL, NULL);
- memcpy(out->data(), out_cl_tensor.Data(), out->memory_size());
+ memcpy(out->data<float>(), out_cl_tensor.Data<float>(), out->memory_size());
  }
  template class FetchKernel<GPU_CL, float>;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册