diff --git a/modules/core/src/opencl/convert.cl b/modules/core/src/opencl/convert.cl index e0e7bd83a8fa070355267d2edc2236a4a334d9d6..e869d6d74359dc57ea702bf1ae5bdd9f099510c0 100644 --- a/modules/core/src/opencl/convert.cl +++ b/modules/core/src/opencl/convert.cl @@ -53,7 +53,10 @@ __kernel void convertTo(__global const uchar * srcptr, int src_step, int src_offset, __global uchar * dstptr, int dst_step, int dst_offset, int dst_rows, int dst_cols, - WT alpha, WT beta, int rowsPerWI) +#ifndef NO_SCALE + WT alpha, WT beta, +#endif + int rowsPerWI) { int x = get_global_id(0); int y0 = get_global_id(1) * rowsPerWI; @@ -68,7 +71,11 @@ __kernel void convertTo(__global const uchar * srcptr, int src_step, int src_off __global const srcT * src = (__global const srcT *)(srcptr + src_index); __global dstT * dst = (__global dstT *)(dstptr + dst_index); +#ifdef NO_SCALE + dst[0] = convertToDT(src[0]); +#else dst[0] = convertToDT(fma(convertToWT(src[0]), alpha, beta)); +#endif } } } diff --git a/modules/core/src/umatrix.cpp b/modules/core/src/umatrix.cpp index 48aa86635d0e8d6c60e168ce3eded73c9b19fb9f..9a991d7f301c18e31d94749bfca1e2fe7e5ed2e3 100644 --- a/modules/core/src/umatrix.cpp +++ b/modules/core/src/umatrix.cpp @@ -746,7 +746,7 @@ void UMat::convertTo(OutputArray _dst, int _type, double alpha, double beta) con ocl::typeToStr(sdepth), ocl::typeToStr(wdepth), ocl::typeToStr(ddepth), ocl::convertTypeStr(sdepth, wdepth, 1, cvt[0]), ocl::convertTypeStr(wdepth, ddepth, 1, cvt[1]), - doubleSupport ? " -D DOUBLE_SUPPORT" : "")); + doubleSupport ? " -D DOUBLE_SUPPORT" : "", noScale ? " -D NO_SCALE" : "")); if (!k.empty()) { UMat src = *this; @@ -757,7 +757,9 @@ void UMat::convertTo(OutputArray _dst, int _type, double alpha, double beta) con ocl::KernelArg srcarg = ocl::KernelArg::ReadOnlyNoSize(src), dstarg = ocl::KernelArg::WriteOnly(dst, cn); - if (wdepth == CV_32F) + if (noScale) + k.args(srcarg, dstarg, rowsPerWI); + else if (wdepth == CV_32F) k.args(srcarg, dstarg, alphaf, betaf, rowsPerWI); else k.args(srcarg, dstarg, alpha, beta, rowsPerWI);