未验证 提交 4fa3c452 编写于 作者: J Jiaying Zhao 提交者: GitHub

Merge pull request #1128 from smilejames/opencl

fix compilation problem
......@@ -47,7 +47,7 @@ void DepthwiseConvKernel<GPU_CL, float>::Compute(
int nh = default_work_size[2];
auto input = param.Input()->GetCLImage();
auto filter = param.Filter()->GetCLImage();
-auto output = param.Output();
+auto output = param.Output()->GetCLImage();
int stride = param.Strides()[0];
int offset = param.Offset();
int input_c = param.Input()->CBlock();
......
......@@ -58,7 +58,7 @@ void FetchKernel<GPU_CL, float>::Compute(const FetchParam<GPU_CL> &param) {
clEnqueueNDRangeKernel(this->cl_helper_.CLCommandQueue(), kernel, 3, NULL,
default_work_size.data(), NULL, 0, NULL, NULL);
-memcpy(out->data(), out_cl_tensor.Data(), out->memory_size());
+memcpy(out->data<float>(), out_cl_tensor.Data<float>(), out->memory_size());
}
template class FetchKernel<GPU_CL, float>;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册