提交 6f0491bf 编写于 作者: H Huie 提交者: Yanzhan Yang

Fix GetGPUTime (#1950)

* 1. Add density_prior_box for GPU.
2. Add flatten2 for GPU.
3. Add concat support for 4 inputs on GPU.
4. Fix pool.
5. Fix transpose2.
test=develop

* 1. Fix GetGPUTime.
test=develop
上级 4b1a4ca0
......@@ -451,6 +451,8 @@ double PaddleMobile<GPU_CL, float>::GetPredictTime() {
int input_height = 224;
int output_width = 224;
int output_height = 224;
int has_group = 0;
int filter_channel = 3;
status = clSetKernelArg(kernel, 0, sizeof(int), &c_block);
CL_CHECK_ERRORS(status);
status = clSetKernelArg(kernel, 1, sizeof(int), &w);
......@@ -479,6 +481,10 @@ double PaddleMobile<GPU_CL, float>::GetPredictTime() {
CL_CHECK_ERRORS(status);
status = clSetKernelArg(kernel, 13, sizeof(int), &output_height);
CL_CHECK_ERRORS(status);
status = clSetKernelArg(kernel, 14, sizeof(int), &filter_channel);
CL_CHECK_ERRORS(status);
status = clSetKernelArg(kernel, 15, sizeof(int), &has_group);
CL_CHECK_ERRORS(status);
// cl_event out_event = param.Output()->GetClEvent();
// cl_event wait_event = param.Input()->GetClEvent();
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册