cudaarithm.hpp 38.7 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42
/*M///////////////////////////////////////////////////////////////////////////////////////
//
//  IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
//
//  By downloading, copying, installing or using the software you agree to this license.
//  If you do not agree to this license, do not download, install,
//  copy or use the software.
//
//
//                           License Agreement
//                For Open Source Computer Vision Library
//
// Copyright (C) 2000-2008, Intel Corporation, all rights reserved.
// Copyright (C) 2009, Willow Garage Inc., all rights reserved.
// Third party copyrights are property of their respective owners.
//
// Redistribution and use in source and binary forms, with or without modification,
// are permitted provided that the following conditions are met:
//
//   * Redistribution's of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//
//   * Redistribution's in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//
//   * The name of the copyright holders may not be used to endorse or promote products
//     derived from this software without specific prior written permission.
//
// This software is provided by the copyright holders and contributors "as is" and
// any express or implied warranties, including, but not limited to, the implied
// warranties of merchantability and fitness for a particular purpose are disclaimed.
// In no event shall the Intel Corporation or contributors be liable for any direct,
// indirect, incidental, special, exemplary, or consequential damages
// (including, but not limited to, procurement of substitute goods or services;
// loss of use, data, or profits; or business interruption) however caused
// and on any theory of liability, whether in contract, strict liability,
// or tort (including negligence or otherwise) arising in any way out of
// the use of this software, even if advised of the possibility of such damage.
//
//M*/

43 44
#ifndef __OPENCV_CUDAARITHM_HPP__
#define __OPENCV_CUDAARITHM_HPP__
45 46

#ifndef __cplusplus
47
#  error cudaarithm.hpp header must be compiled as C++
48 49
#endif

50
#include "opencv2/core/cuda.hpp"
51

M
Maksim Shabunin 已提交
52 53 54 55 56 57 58 59 60 61 62 63 64
/**
  @addtogroup cuda
  @{
    @defgroup cudaarithm Operations on Matrices
    @{
        @defgroup cudaarithm_core Core Operations on Matrices
        @defgroup cudaarithm_elem Per-element Operations
        @defgroup cudaarithm_reduce Matrix Reductions
        @defgroup cudaarithm_arithm Arithm Operations on Matrices
    @}
  @}
 */

65
namespace cv { namespace cuda {
66

M
Maksim Shabunin 已提交
67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85
//! @addtogroup cudaarithm
//! @{

//! @addtogroup cudaarithm_elem
//! @{

/** @brief Computes a matrix-matrix or matrix-scalar sum.

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar. Matrix should have the same size and type as src1 .
@param dst Destination matrix that has the same size and number of channels as the input array(s).
The depth is defined by dtype or src1 depth.
@param mask Optional operation mask, 8-bit single channel array, that specifies elements of the
destination array to be changed.
@param dtype Optional depth of the output array.
@param stream Stream for the asynchronous version.

@sa add
 */
86
CV_EXPORTS void add(InputArray src1, InputArray src2, OutputArray dst, InputArray mask = noArray(), int dtype = -1, Stream& stream = Stream::Null());
87

M
Maksim Shabunin 已提交
88 89 90 91 92 93 94 95 96 97 98 99 100
/** @brief Computes a matrix-matrix or matrix-scalar difference.

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar. Matrix should have the same size and type as src1 .
@param dst Destination matrix that has the same size and number of channels as the input array(s).
The depth is defined by dtype or src1 depth.
@param mask Optional operation mask, 8-bit single channel array, that specifies elements of the
destination array to be changed.
@param dtype Optional depth of the output array.
@param stream Stream for the asynchronous version.

@sa subtract
 */
101
CV_EXPORTS void subtract(InputArray src1, InputArray src2, OutputArray dst, InputArray mask = noArray(), int dtype = -1, Stream& stream = Stream::Null());
102

M
Maksim Shabunin 已提交
103 104 105 106 107 108 109 110 111 112 113 114
/** @brief Computes a matrix-matrix or matrix-scalar per-element product.

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and number of channels as the input array(s).
The depth is defined by dtype or src1 depth.
@param scale Optional scale factor.
@param dtype Optional depth of the output array.
@param stream Stream for the asynchronous version.

@sa multiply
 */
115
CV_EXPORTS void multiply(InputArray src1, InputArray src2, OutputArray dst, double scale = 1, int dtype = -1, Stream& stream = Stream::Null());
116

M
Maksim Shabunin 已提交
117 118 119 120 121 122 123 124 125 126 127 128 129 130
/** @brief Computes a matrix-matrix or matrix-scalar division.

@param src1 First source matrix or a scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and number of channels as the input array(s).
The depth is defined by dtype or src1 depth.
@param scale Optional scale factor.
@param dtype Optional depth of the output array.
@param stream Stream for the asynchronous version.

This function, in contrast to divide, uses a round-down rounding mode.

@sa divide
 */
131 132
CV_EXPORTS void divide(InputArray src1, InputArray src2, OutputArray dst, double scale = 1, int dtype = -1, Stream& stream = Stream::Null());

133
//! computes element-wise weighted reciprocal of an array (dst = scale/src2)
134 135 136 137
static inline void divide(double src1, InputArray src2, OutputArray dst, int dtype = -1, Stream& stream = Stream::Null())
{
    divide(src1, src2, dst, 1.0, dtype, stream);
}
138

M
Maksim Shabunin 已提交
139 140 141 142 143 144 145 146 147
/** @brief Computes per-element absolute difference of two matrices (or of a matrix and scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param stream Stream for the asynchronous version.

@sa absdiff
 */
148 149
CV_EXPORTS void absdiff(InputArray src1, InputArray src2, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
150 151 152 153 154 155 156 157
/** @brief Computes an absolute value of each matrix element.

@param src Source matrix.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.

@sa abs
 */
158
CV_EXPORTS void abs(InputArray src, OutputArray dst, Stream& stream = Stream::Null());
159

M
Maksim Shabunin 已提交
160 161 162 163 164 165
/** @brief Computes a square value of each matrix element.

@param src Source matrix.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.
 */
166
CV_EXPORTS void sqr(InputArray src, OutputArray dst, Stream& stream = Stream::Null());
167

M
Maksim Shabunin 已提交
168 169 170 171 172 173 174 175
/** @brief Computes a square root of each matrix element.

@param src Source matrix.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.

@sa sqrt
 */
176
CV_EXPORTS void sqrt(InputArray src, OutputArray dst, Stream& stream = Stream::Null());
177

M
Maksim Shabunin 已提交
178 179 180 181 182 183 184 185
/** @brief Computes an exponent of each matrix element.

@param src Source matrix.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.

@sa exp
 */
186
CV_EXPORTS void exp(InputArray src, OutputArray dst, Stream& stream = Stream::Null());
187

M
Maksim Shabunin 已提交
188 189 190 191 192 193 194 195
/** @brief Computes a natural logarithm of absolute value of each matrix element.

@param src Source matrix.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.

@sa log
 */
196
CV_EXPORTS void log(InputArray src, OutputArray dst, Stream& stream = Stream::Null());
197

M
Maksim Shabunin 已提交
198 199 200 201 202 203 204 205 206 207 208 209 210
/** @brief Raises every matrix element to a power.

@param src Source matrix.
@param power Exponent of power.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.

The function pow raises every element of the input matrix to power :

\f[\texttt{dst} (I) =  \fork{\texttt{src}(I)^power}{if \texttt{power} is integer}{|\texttt{src}(I)|^power}{otherwise}\f]

@sa pow
 */
211 212
CV_EXPORTS void pow(InputArray src, double power, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
213 214 215 216 217 218
/** @brief Compares elements of two matrices (or of a matrix and scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param cmpop Flag specifying the relation between the elements to be checked:
219 220 221 222 223 224
-   **CMP_EQ:** a(.) == b(.)
-   **CMP_GT:** a(.) \< b(.)
-   **CMP_GE:** a(.) \<= b(.)
-   **CMP_LT:** a(.) \< b(.)
-   **CMP_LE:** a(.) \<= b(.)
-   **CMP_NE:** a(.) != b(.)
M
Maksim Shabunin 已提交
225 226 227 228
@param stream Stream for the asynchronous version.

@sa compare
 */
229 230
CV_EXPORTS void compare(InputArray src1, InputArray src2, OutputArray dst, int cmpop, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
231 232 233 234 235 236 237
/** @brief Performs a per-element bitwise inversion.

@param src Source matrix.
@param dst Destination matrix with the same size and type as src .
@param mask Optional operation mask. 8-bit single channel image.
@param stream Stream for the asynchronous version.
 */
238 239
CV_EXPORTS void bitwise_not(InputArray src, OutputArray dst, InputArray mask = noArray(), Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
240 241 242 243 244 245 246 247
/** @brief Performs a per-element bitwise disjunction of two matrices (or of matrix and scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param mask Optional operation mask. 8-bit single channel image.
@param stream Stream for the asynchronous version.
 */
248 249
CV_EXPORTS void bitwise_or(InputArray src1, InputArray src2, OutputArray dst, InputArray mask = noArray(), Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
250 251 252 253 254 255 256 257
/** @brief Performs a per-element bitwise conjunction of two matrices (or of matrix and scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param mask Optional operation mask. 8-bit single channel image.
@param stream Stream for the asynchronous version.
 */
258 259
CV_EXPORTS void bitwise_and(InputArray src1, InputArray src2, OutputArray dst, InputArray mask = noArray(), Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
260 261 262 263 264 265 266 267
/** @brief Performs a per-element bitwise exclusive or operation of two matrices (or of matrix and scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param mask Optional operation mask. 8-bit single channel image.
@param stream Stream for the asynchronous version.
 */
268 269
CV_EXPORTS void bitwise_xor(InputArray src1, InputArray src2, OutputArray dst, InputArray mask = noArray(), Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
270 271 272 273 274 275 276
/** @brief Performs pixel by pixel right shift of an image by a constant value.

@param src Source matrix. Supports 1, 3 and 4 channels images with integers elements.
@param val Constant values, one per channel.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.
 */
277 278
CV_EXPORTS void rshift(InputArray src, Scalar_<int> val, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
279 280
/** @brief Performs pixel by pixel right left of an image by a constant value.

281
@param src Source matrix. Supports 1, 3 and 4 channels images with CV_8U , CV_16U or CV_32S
M
Maksim Shabunin 已提交
282 283 284 285 286
depth.
@param val Constant values, one per channel.
@param dst Destination matrix with the same size and type as src .
@param stream Stream for the asynchronous version.
 */
287 288
CV_EXPORTS void lshift(InputArray src, Scalar_<int> val, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
289 290 291 292 293 294 295 296 297
/** @brief Computes the per-element minimum of two matrices (or a matrix and a scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param stream Stream for the asynchronous version.

@sa min
 */
298 299
CV_EXPORTS void min(InputArray src1, InputArray src2, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
300 301 302 303 304 305 306 307 308
/** @brief Computes the per-element maximum of two matrices (or a matrix and a scalar).

@param src1 First source matrix or scalar.
@param src2 Second source matrix or scalar.
@param dst Destination matrix that has the same size and type as the input array(s).
@param stream Stream for the asynchronous version.

@sa max
 */
309 310
CV_EXPORTS void max(InputArray src1, InputArray src2, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331
/** @brief Computes the weighted sum of two arrays.

@param src1 First source array.
@param alpha Weight for the first array elements.
@param src2 Second source array of the same size and channel number as src1 .
@param beta Weight for the second array elements.
@param dst Destination array that has the same size and number of channels as the input arrays.
@param gamma Scalar added to each sum.
@param dtype Optional depth of the destination array. When both input arrays have the same depth,
dtype can be set to -1, which will be equivalent to src1.depth().
@param stream Stream for the asynchronous version.

The function addWeighted calculates the weighted sum of two arrays as follows:

\f[\texttt{dst} (I)= \texttt{saturate} ( \texttt{src1} (I)* \texttt{alpha} +  \texttt{src2} (I)* \texttt{beta} +  \texttt{gamma} )\f]

where I is a multi-dimensional index of array elements. In case of multi-channel arrays, each
channel is processed independently.

@sa addWeighted
 */
332
CV_EXPORTS void addWeighted(InputArray src1, double alpha, InputArray src2, double beta, double gamma, OutputArray dst,
333 334 335
                            int dtype = -1, Stream& stream = Stream::Null());

//! adds scaled array to another one (dst = alpha*src1 + src2)
336
static inline void scaleAdd(InputArray src1, double alpha, InputArray src2, OutputArray dst, Stream& stream = Stream::Null())
337 338 339
{
    addWeighted(src1, alpha, src2, 1.0, 0.0, dst, -1, stream);
}
340

M
Maksim Shabunin 已提交
341 342 343 344 345
/** @brief Applies a fixed-level threshold to each array element.

@param src Source array (single-channel).
@param dst Destination array with the same size and type as src .
@param thresh Threshold value.
346 347
@param maxval Maximum value to use with THRESH_BINARY and THRESH_BINARY_INV threshold types.
@param type Threshold type. For details, see threshold . The THRESH_OTSU and THRESH_TRIANGLE
M
Maksim Shabunin 已提交
348 349 350 351 352
threshold types are not supported.
@param stream Stream for the asynchronous version.

@sa threshold
 */
353 354
CV_EXPORTS double threshold(InputArray src, OutputArray dst, double thresh, double maxval, int type, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
355 356
/** @brief Computes magnitudes of complex matrix elements.

357 358
@param xy Source complex matrix in the interleaved format ( CV_32FC2 ).
@param magnitude Destination matrix of float magnitudes ( CV_32FC1 ).
M
Maksim Shabunin 已提交
359 360 361 362
@param stream Stream for the asynchronous version.

@sa magnitude
 */
363 364
CV_EXPORTS void magnitude(InputArray xy, OutputArray magnitude, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
365 366
/** @brief Computes squared magnitudes of complex matrix elements.

367 368
@param xy Source complex matrix in the interleaved format ( CV_32FC2 ).
@param magnitude Destination matrix of float magnitude squares ( CV_32FC1 ).
M
Maksim Shabunin 已提交
369 370
@param stream Stream for the asynchronous version.
 */
371 372
CV_EXPORTS void magnitudeSqr(InputArray xy, OutputArray magnitude, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
373 374 375
/** @overload
 computes magnitude of each (x(i), y(i)) vector
 supports only floating-point source
376 377 378
@param x Source matrix containing real components ( CV_32FC1 ).
@param y Source matrix containing imaginary components ( CV_32FC1 ).
@param magnitude Destination matrix of float magnitudes ( CV_32FC1 ).
M
Maksim Shabunin 已提交
379 380
@param stream Stream for the asynchronous version.
 */
381 382
CV_EXPORTS void magnitude(InputArray x, InputArray y, OutputArray magnitude, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
383 384 385
/** @overload
 computes squared magnitude of each (x(i), y(i)) vector
 supports only floating-point source
386 387 388
@param x Source matrix containing real components ( CV_32FC1 ).
@param y Source matrix containing imaginary components ( CV_32FC1 ).
@param magnitude Destination matrix of float magnitude squares ( CV_32FC1 ).
M
Maksim Shabunin 已提交
389 390
@param stream Stream for the asynchronous version.
*/
391 392
CV_EXPORTS void magnitudeSqr(InputArray x, InputArray y, OutputArray magnitude, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
393 394
/** @brief Computes polar angles of complex matrix elements.

395 396 397
@param x Source matrix containing real components ( CV_32FC1 ).
@param y Source matrix containing imaginary components ( CV_32FC1 ).
@param angle Destination matrix of angles ( CV_32FC1 ).
M
Maksim Shabunin 已提交
398 399 400 401 402
@param angleInDegrees Flag for angles that must be evaluated in degrees.
@param stream Stream for the asynchronous version.

@sa phase
 */
403 404
CV_EXPORTS void phase(InputArray x, InputArray y, OutputArray angle, bool angleInDegrees = false, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
405 406
/** @brief Converts Cartesian coordinates into polar.

407 408 409 410
@param x Source matrix containing real components ( CV_32FC1 ).
@param y Source matrix containing imaginary components ( CV_32FC1 ).
@param magnitude Destination matrix of float magnitudes ( CV_32FC1 ).
@param angle Destination matrix of angles ( CV_32FC1 ).
M
Maksim Shabunin 已提交
411 412 413 414 415
@param angleInDegrees Flag for angles that must be evaluated in degrees.
@param stream Stream for the asynchronous version.

@sa cartToPolar
 */
416 417
CV_EXPORTS void cartToPolar(InputArray x, InputArray y, OutputArray magnitude, OutputArray angle, bool angleInDegrees = false, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
418 419
/** @brief Converts polar coordinates into Cartesian.

420 421 422 423
@param magnitude Source matrix containing magnitudes ( CV_32FC1 ).
@param angle Source matrix containing angles ( CV_32FC1 ).
@param x Destination matrix of real components ( CV_32FC1 ).
@param y Destination matrix of imaginary components ( CV_32FC1 ).
M
Maksim Shabunin 已提交
424 425 426
@param angleInDegrees Flag that indicates angles in degrees.
@param stream Stream for the asynchronous version.
 */
427 428
CV_EXPORTS void polarToCart(InputArray magnitude, InputArray angle, OutputArray x, OutputArray y, bool angleInDegrees = false, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
429 430 431 432 433 434 435 436 437 438 439 440 441 442
//! @} cudaarithm_elem

//! @addtogroup cudaarithm_core
//! @{

/** @brief Makes a multi-channel matrix out of several single-channel matrices.

@param src Array/vector of source matrices.
@param n Number of source matrices.
@param dst Destination matrix.
@param stream Stream for the asynchronous version.

@sa merge
 */
443
CV_EXPORTS void merge(const GpuMat* src, size_t n, OutputArray dst, Stream& stream = Stream::Null());
M
Maksim Shabunin 已提交
444
/** @overload */
445 446
CV_EXPORTS void merge(const std::vector<GpuMat>& src, OutputArray dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
447 448 449 450 451 452 453 454
/** @brief Copies each plane of a multi-channel matrix into an array.

@param src Source matrix.
@param dst Destination array/vector of single-channel matrices.
@param stream Stream for the asynchronous version.

@sa split
 */
455
CV_EXPORTS void split(InputArray src, GpuMat* dst, Stream& stream = Stream::Null());
M
Maksim Shabunin 已提交
456
/** @overload */
457 458
CV_EXPORTS void split(InputArray src, std::vector<GpuMat>& dst, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
459 460 461 462 463 464 465 466
/** @brief Transposes a matrix.

@param src1 Source matrix. 1-, 4-, 8-byte element sizes are supported for now.
@param dst Destination matrix.
@param stream Stream for the asynchronous version.

@sa transpose
 */
467
CV_EXPORTS void transpose(InputArray src1, OutputArray dst, Stream& stream = Stream::Null());
468

M
Maksim Shabunin 已提交
469 470
/** @brief Flips a 2D matrix around vertical, horizontal, or both axes.

471 472
@param src Source matrix. Supports 1, 3 and 4 channels images with CV_8U, CV_16U, CV_32S or
CV_32F depth.
M
Maksim Shabunin 已提交
473 474 475 476 477 478 479 480 481
@param dst Destination matrix.
@param flipCode Flip mode for the source:
-   0 Flips around x-axis.
-   \> 0 Flips around y-axis.
-   \< 0 Flips around both axes.
@param stream Stream for the asynchronous version.

@sa flip
 */
482 483
CV_EXPORTS void flip(InputArray src, OutputArray dst, int flipCode, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
484 485
/** @brief Base class for transform using lookup table.
 */
486 487 488
class CV_EXPORTS LookUpTable : public Algorithm
{
public:
M
Maksim Shabunin 已提交
489 490 491
    /** @brief Transforms the source matrix into the destination matrix using the given look-up table:
    dst(I) = lut(src(I)) .

492
    @param src Source matrix. CV_8UC1 and CV_8UC3 matrices are supported for now.
M
Maksim Shabunin 已提交
493 494 495
    @param dst Destination matrix.
    @param stream Stream for the asynchronous version.
     */
496 497 498
    virtual void transform(InputArray src, OutputArray dst, Stream& stream = Stream::Null()) = 0;
};

M
Maksim Shabunin 已提交
499 500
/** @brief Creates implementation for cuda::LookUpTable .

501
@param lut Look-up table of 256 elements. It is a continuous CV_8U matrix.
M
Maksim Shabunin 已提交
502
 */
503
CV_EXPORTS Ptr<LookUpTable> createLookUpTable(InputArray lut);
504

M
Maksim Shabunin 已提交
505 506
/** @brief Forms a border around an image.

507
@param src Source image. CV_8UC1 , CV_8UC4 , CV_32SC1 , and CV_32FC1 types are supported.
M
Maksim Shabunin 已提交
508 509 510 511 512 513 514
@param dst Destination image with the same type as src. The size is
Size(src.cols+left+right, src.rows+top+bottom) .
@param top
@param bottom
@param left
@param right Number of pixels in each direction from the source image rectangle to extrapolate.
For example: top=1, bottom=1, left=1, right=1 mean that 1 pixel-wide border needs to be built.
515 516
@param borderType Border type. See borderInterpolate for details. BORDER_REFLECT101 ,
BORDER_REPLICATE , BORDER_CONSTANT , BORDER_REFLECT and BORDER_WRAP are supported for now.
M
Maksim Shabunin 已提交
517 518 519
@param value Border value.
@param stream Stream for the asynchronous version.
 */
520 521 522
CV_EXPORTS void copyMakeBorder(InputArray src, OutputArray dst, int top, int bottom, int left, int right, int borderType,
                               Scalar value = Scalar(), Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
523 524 525 526 527 528 529 530
//! @} cudaarithm_core

//! @addtogroup cudaarithm_reduce
//! @{

/** @brief Returns the norm of a matrix (or difference of two matrices).

@param src1 Source matrix. Any matrices except 64F are supported.
531 532
@param normType Norm type. NORM_L1 , NORM_L2 , and NORM_INF are supported for now.
@param mask optional operation mask; it must have the same size as src1 and CV_8UC1 type.
M
Maksim Shabunin 已提交
533 534 535 536
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.

@sa norm
 */
537
CV_EXPORTS double norm(InputArray src1, int normType, InputArray mask, GpuMat& buf);
M
Maksim Shabunin 已提交
538 539 540
/** @overload
uses new buffer, no mask
*/
541 542 543 544 545
static inline double norm(InputArray src, int normType)
{
    GpuMat buf;
    return norm(src, normType, GpuMat(), buf);
}
M
Maksim Shabunin 已提交
546 547 548
/** @overload
no mask
*/
549 550 551 552
static inline double norm(InputArray src, int normType, GpuMat& buf)
{
    return norm(src, normType, GpuMat(), buf);
}
553

M
Maksim Shabunin 已提交
554 555 556 557
/** @brief Returns the difference of two matrices.

@param src1 Source matrix. Any matrices except 64F are supported.
@param src2 Second source matrix (if any) with the same size and type as src1.
558
@param normType Norm type. NORM_L1 , NORM_L2 , and NORM_INF are supported for now.
M
Maksim Shabunin 已提交
559 560 561 562
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.

@sa norm
 */
563
CV_EXPORTS double norm(InputArray src1, InputArray src2, GpuMat& buf, int normType=NORM_L2);
M
Maksim Shabunin 已提交
564 565 566
/** @overload
uses new buffer
*/
567 568 569 570 571
static inline double norm(InputArray src1, InputArray src2, int normType=NORM_L2)
{
    GpuMat buf;
    return norm(src1, src2, buf, normType);
}
572

M
Maksim Shabunin 已提交
573 574
/** @brief Returns the sum of matrix elements.

575 576
@param src Source image of any depth except for CV_64F .
@param mask optional operation mask; it must have the same size as src1 and CV_8UC1 type.
M
Maksim Shabunin 已提交
577 578 579 580
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.

@sa sum
 */
581
CV_EXPORTS Scalar sum(InputArray src, InputArray mask, GpuMat& buf);
M
Maksim Shabunin 已提交
582 583 584
/** @overload
uses new buffer, no mask
*/
585 586 587 588 589
static inline Scalar sum(InputArray src)
{
    GpuMat buf;
    return sum(src, GpuMat(), buf);
}
M
Maksim Shabunin 已提交
590 591 592
/** @overload
no mask
*/
593 594 595 596
static inline Scalar sum(InputArray src, GpuMat& buf)
{
    return sum(src, GpuMat(), buf);
}
597

M
Maksim Shabunin 已提交
598 599
/** @brief Returns the sum of absolute values for matrix elements.

600 601
@param src Source image of any depth except for CV_64F .
@param mask optional operation mask; it must have the same size as src1 and CV_8UC1 type.
M
Maksim Shabunin 已提交
602 603
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.
 */
604
CV_EXPORTS Scalar absSum(InputArray src, InputArray mask, GpuMat& buf);
M
Maksim Shabunin 已提交
605 606 607
/** @overload
uses new buffer, no mask
*/
608 609 610 611 612
static inline Scalar absSum(InputArray src)
{
    GpuMat buf;
    return absSum(src, GpuMat(), buf);
}
M
Maksim Shabunin 已提交
613 614 615
/** @overload
no mask
*/
616 617 618 619
static inline Scalar absSum(InputArray src, GpuMat& buf)
{
    return absSum(src, GpuMat(), buf);
}
620

M
Maksim Shabunin 已提交
621 622
/** @brief Returns the squared sum of matrix elements.

623 624
@param src Source image of any depth except for CV_64F .
@param mask optional operation mask; it must have the same size as src1 and CV_8UC1 type.
M
Maksim Shabunin 已提交
625 626
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.
 */
627
CV_EXPORTS Scalar sqrSum(InputArray src, InputArray mask, GpuMat& buf);
M
Maksim Shabunin 已提交
628 629 630
/** @overload
uses new buffer, no mask
*/
631 632 633 634 635
static inline Scalar sqrSum(InputArray src)
{
    GpuMat buf;
    return sqrSum(src, GpuMat(), buf);
}
M
Maksim Shabunin 已提交
636 637 638
/** @overload
no mask
*/
639 640 641 642
static inline Scalar sqrSum(InputArray src, GpuMat& buf)
{
    return sqrSum(src, GpuMat(), buf);
}
643

M
Maksim Shabunin 已提交
644 645 646 647 648 649 650 651
/** @brief Finds global minimum and maximum matrix elements and returns their values.

@param src Single-channel source image.
@param minVal Pointer to the returned minimum value. Use NULL if not required.
@param maxVal Pointer to the returned maximum value. Use NULL if not required.
@param mask Optional mask to select a sub-matrix.
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.

652
The function does not work with CV_64F images on GPUs with the compute capability \< 1.3.
M
Maksim Shabunin 已提交
653 654 655

@sa minMaxLoc
 */
656
CV_EXPORTS void minMax(InputArray src, double* minVal, double* maxVal, InputArray mask, GpuMat& buf);
M
Maksim Shabunin 已提交
657 658 659
/** @overload
uses new buffer
*/
660 661 662 663 664
static inline void minMax(InputArray src, double* minVal, double* maxVal=0, InputArray mask=noArray())
{
    GpuMat buf;
    minMax(src, minVal, maxVal, mask, buf);
}
665

M
Maksim Shabunin 已提交
666 667 668 669 670 671 672 673 674 675 676 677
/** @brief Finds global minimum and maximum matrix elements and returns their values with locations.

@param src Single-channel source image.
@param minVal Pointer to the returned minimum value. Use NULL if not required.
@param maxVal Pointer to the returned maximum value. Use NULL if not required.
@param minLoc Pointer to the returned minimum location. Use NULL if not required.
@param maxLoc Pointer to the returned maximum location. Use NULL if not required.
@param mask Optional mask to select a sub-matrix.
@param valbuf Optional values buffer to avoid extra memory allocations. It is resized
automatically.
@param locbuf Optional locations buffer to avoid extra memory allocations. It is resized
automatically.
678
The function does not work with CV_64F images on GPU with the compute capability \< 1.3.
M
Maksim Shabunin 已提交
679 680 681

@sa minMaxLoc
 */
682 683
CV_EXPORTS void minMaxLoc(InputArray src, double* minVal, double* maxVal, Point* minLoc, Point* maxLoc,
                          InputArray mask, GpuMat& valbuf, GpuMat& locbuf);
M
Maksim Shabunin 已提交
684 685 686
/** @overload
uses new buffer
*/
687 688 689 690 691 692
static inline void minMaxLoc(InputArray src, double* minVal, double* maxVal=0, Point* minLoc=0, Point* maxLoc=0,
                             InputArray mask=noArray())
{
    GpuMat valBuf, locBuf;
    minMaxLoc(src, minVal, maxVal, minLoc, maxLoc, mask, valBuf, locBuf);
}
693

M
Maksim Shabunin 已提交
694 695 696 697 698
/** @brief Counts non-zero matrix elements.

@param src Single-channel source image.
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.

699
The function does not work with CV_64F images on GPUs with the compute capability \< 1.3.
M
Maksim Shabunin 已提交
700 701 702

@sa countNonZero
 */
703
CV_EXPORTS int countNonZero(InputArray src, GpuMat& buf);
M
Maksim Shabunin 已提交
704 705 706
/** @overload
uses new buffer
*/
707 708 709 710 711
static inline int countNonZero(const GpuMat& src)
{
    GpuMat buf;
    return countNonZero(src, buf);
}
712

M
Maksim Shabunin 已提交
713 714 715 716 717 718 719
/** @brief Reduces a matrix to a vector.

@param mtx Source 2D matrix.
@param vec Destination vector. Its size and type is defined by dim and dtype parameters.
@param dim Dimension index along which the matrix is reduced. 0 means that the matrix is reduced
to a single row. 1 means that the matrix is reduced to a single column.
@param reduceOp Reduction operation that could be one of the following:
720 721 722
-   **CV_REDUCE_SUM** The output is the sum of all rows/columns of the matrix.
-   **CV_REDUCE_AVG** The output is the mean vector of all rows/columns of the matrix.
-   **CV_REDUCE_MAX** The output is the maximum (column/row-wise) of all rows/columns of the
M
Maksim Shabunin 已提交
723
matrix.
724
-   **CV_REDUCE_MIN** The output is the minimum (column/row-wise) of all rows/columns of the
M
Maksim Shabunin 已提交
725 726
matrix.
@param dtype When it is negative, the destination vector will have the same type as the source
727
matrix. Otherwise, its type will be CV_MAKE_TYPE(CV_MAT_DEPTH(dtype), mtx.channels()) .
M
Maksim Shabunin 已提交
728 729 730 731 732
@param stream Stream for the asynchronous version.

The function reduce reduces the matrix to a vector by treating the matrix rows/columns as a set of
1D vectors and performing the specified operation on the vectors until a single row/column is
obtained. For example, the function can be used to compute horizontal and vertical projections of a
733
raster image. In case of CV_REDUCE_SUM and CV_REDUCE_AVG , the output may have a larger element
M
Maksim Shabunin 已提交
734 735 736 737 738
bit-depth to preserve accuracy. And multi-channel arrays are also supported in these two reduction
modes.

@sa reduce
 */
739
CV_EXPORTS void reduce(InputArray mtx, OutputArray vec, int dim, int reduceOp, int dtype = -1, Stream& stream = Stream::Null());
740

M
Maksim Shabunin 已提交
741 742
/** @brief Computes a mean value and a standard deviation of matrix elements.

743
@param mtx Source matrix. CV_8UC1 matrices are supported for now.
M
Maksim Shabunin 已提交
744 745 746 747 748 749
@param mean Mean value.
@param stddev Standard deviation value.
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.

@sa meanStdDev
 */
750
CV_EXPORTS void meanStdDev(InputArray mtx, Scalar& mean, Scalar& stddev, GpuMat& buf);
M
Maksim Shabunin 已提交
751 752 753
/** @overload
uses new buffer
*/
754 755 756 757 758
static inline void meanStdDev(InputArray src, Scalar& mean, Scalar& stddev)
{
    GpuMat buf;
    meanStdDev(src, mean, stddev, buf);
}
759

M
Maksim Shabunin 已提交
760 761
/** @brief Computes a standard deviation of integral images.

762 763
@param src Source image. Only the CV_32SC1 type is supported.
@param sqr Squared source image. Only the CV_32FC1 type is supported.
M
Maksim Shabunin 已提交
764 765 766 767
@param dst Destination image with the same type and size as src .
@param rect Rectangular window.
@param stream Stream for the asynchronous version.
 */
768 769
CV_EXPORTS void rectStdDev(InputArray src, InputArray sqr, OutputArray dst, Rect rect, Stream& stream = Stream::Null());

M
Maksim Shabunin 已提交
770 771 772 773 774 775 776 777
/** @brief Normalizes the norm or value range of an array.

@param src Input array.
@param dst Output array of the same size as src .
@param alpha Norm value to normalize to or the lower range boundary in case of the range
normalization.
@param beta Upper range boundary in case of the range normalization; it is not used for the norm
normalization.
778
@param norm_type Normalization type ( NORM_MINMAX , NORM_L2 , NORM_L1 or NORM_INF ).
M
Maksim Shabunin 已提交
779
@param dtype When negative, the output array has the same type as src; otherwise, it has the same
780
number of channels as src and the depth =CV_MAT_DEPTH(dtype).
M
Maksim Shabunin 已提交
781
@param mask Optional operation mask.
782 783
@param norm_buf Optional buffer to avoid extra memory allocations. It is resized automatically.
@param cvt_buf Optional buffer to avoid extra memory allocations. It is resized automatically.
M
Maksim Shabunin 已提交
784 785 786

@sa normalize
 */
787 788
CV_EXPORTS void normalize(InputArray src, OutputArray dst, double alpha, double beta,
                          int norm_type, int dtype, InputArray mask, GpuMat& norm_buf, GpuMat& cvt_buf);
M
Maksim Shabunin 已提交
789 790 791
/** @overload
uses new buffers
*/
792 793 794 795 796 797 798
static inline void normalize(InputArray src, OutputArray dst, double alpha = 1, double beta = 0,
                             int norm_type = NORM_L2, int dtype = -1, InputArray mask = noArray())
{
    GpuMat norm_buf;
    GpuMat cvt_buf;
    normalize(src, dst, alpha, beta, norm_type, dtype, mask, norm_buf, cvt_buf);
}
799

M
Maksim Shabunin 已提交
800 801
/** @brief Computes an integral image.

802 803
@param src Source image. Only CV_8UC1 images are supported for now.
@param sum Integral image containing 32-bit unsigned integer values packed into CV_32SC1 .
M
Maksim Shabunin 已提交
804 805 806 807 808
@param buffer Optional buffer to avoid extra memory allocations. It is resized automatically.
@param stream Stream for the asynchronous version.

@sa integral
 */
809 810 811 812 813
CV_EXPORTS void integral(InputArray src, OutputArray sum, GpuMat& buffer, Stream& stream = Stream::Null());
static inline void integralBuffered(InputArray src, OutputArray sum, GpuMat& buffer, Stream& stream = Stream::Null())
{
    integral(src, sum, buffer, stream);
}
M
Maksim Shabunin 已提交
814 815 816
/** @overload
uses new buffer
*/
817 818 819 820 821
static inline void integral(InputArray src, OutputArray sum, Stream& stream = Stream::Null())
{
    GpuMat buffer;
    integral(src, sum, buffer, stream);
}
822

M
Maksim Shabunin 已提交
823 824
/** @brief Computes a squared integral image.

825
@param src Source image. Only CV_8UC1 images are supported for now.
M
Maksim Shabunin 已提交
826
@param sqsum Squared integral image containing 64-bit unsigned integer values packed into
827
CV_64FC1 .
M
Maksim Shabunin 已提交
828 829 830
@param buf Optional buffer to avoid extra memory allocations. It is resized automatically.
@param stream Stream for the asynchronous version.
 */
831
CV_EXPORTS void sqrIntegral(InputArray src, OutputArray sqsum, GpuMat& buf, Stream& stream = Stream::Null());
M
Maksim Shabunin 已提交
832 833 834
/** @overload
uses new buffer
*/
835 836 837 838 839 840
static inline void sqrIntegral(InputArray src, OutputArray sqsum, Stream& stream = Stream::Null())
{
    GpuMat buffer;
    sqrIntegral(src, sqsum, buffer, stream);
}

M
Maksim Shabunin 已提交
841 842 843 844 845 846 847
//! @} cudaarithm_reduce

//! @addtogroup cudaarithm_arithm
//! @{

/** @brief Performs generalized matrix multiplication.

848 849
@param src1 First multiplied input matrix that should have CV_32FC1 , CV_64FC1 , CV_32FC2 , or
CV_64FC2 type.
M
Maksim Shabunin 已提交
850 851 852 853 854 855 856
@param src2 Second multiplied input matrix of the same type as src1 .
@param alpha Weight of the matrix product.
@param src3 Third optional delta matrix added to the matrix product. It should have the same type
as src1 and src2 .
@param beta Weight of src3 .
@param dst Destination matrix. It has the proper size and the same type as input matrices.
@param flags Operation flags:
857 858 859
-   **GEMM_1_T** transpose src1
-   **GEMM_2_T** transpose src2
-   **GEMM_3_T** transpose src3
M
Maksim Shabunin 已提交
860 861 862
@param stream Stream for the asynchronous version.

The function performs generalized matrix multiplication similar to the gemm functions in BLAS level
863
3. For example, gemm(src1, src2, alpha, src3, beta, dst, GEMM_1_T + GEMM_3_T) corresponds to
M
Maksim Shabunin 已提交
864 865 866

\f[\texttt{dst} =  \texttt{alpha} \cdot \texttt{src1} ^T  \cdot \texttt{src2} +  \texttt{beta} \cdot \texttt{src3} ^T\f]

867
@note Transposition operation doesn't support CV_64FC2 input type.
M
Maksim Shabunin 已提交
868 869 870

@sa gemm
 */
871 872
CV_EXPORTS void gemm(InputArray src1, InputArray src2, double alpha,
                     InputArray src3, double beta, OutputArray dst, int flags = 0, Stream& stream = Stream::Null());
873

M
Maksim Shabunin 已提交
874 875 876 877 878 879 880 881 882 883
/** @brief Performs a per-element multiplication of two Fourier spectrums.

@param src1 First spectrum.
@param src2 Second spectrum with the same size and type as a .
@param dst Destination spectrum.
@param flags Mock parameter used for CPU/CUDA interfaces similarity.
@param conjB Optional flag to specify if the second spectrum needs to be conjugated before the
multiplication.
@param stream Stream for the asynchronous version.

884
Only full (not packed) CV_32FC2 complex spectrums in the interleaved format are supported for now.
M
Maksim Shabunin 已提交
885 886 887

@sa mulSpectrums
 */
888
CV_EXPORTS void mulSpectrums(InputArray src1, InputArray src2, OutputArray dst, int flags, bool conjB=false, Stream& stream = Stream::Null());
889

M
Maksim Shabunin 已提交
890 891 892 893 894 895 896 897 898 899 900
/** @brief Performs a per-element multiplication of two Fourier spectrums and scales the result.

@param src1 First spectrum.
@param src2 Second spectrum with the same size and type as a .
@param dst Destination spectrum.
@param flags Mock parameter used for CPU/CUDA interfaces similarity.
@param scale Scale constant.
@param conjB Optional flag to specify if the second spectrum needs to be conjugated before the
multiplication.
@param stream Stream for the asynchronous version.

901
Only full (not packed) CV_32FC2 complex spectrums in the interleaved format are supported for now.
M
Maksim Shabunin 已提交
902 903 904

@sa mulSpectrums
 */
905
CV_EXPORTS void mulAndScaleSpectrums(InputArray src1, InputArray src2, OutputArray dst, int flags, float scale, bool conjB=false, Stream& stream = Stream::Null());
906

M
Maksim Shabunin 已提交
907 908 909 910
/** @brief Performs a forward or inverse discrete Fourier transform (1D or 2D) of the floating point matrix.

@param src Source matrix (real or complex).
@param dst Destination matrix (real or complex).
911
@param dft_size Size of a discrete Fourier transform.
M
Maksim Shabunin 已提交
912
@param flags Optional flags:
913 914 915 916
-   **DFT_ROWS** transforms each individual row of the source matrix.
-   **DFT_SCALE** scales the result: divide it by the number of elements in the transform
(obtained from dft_size ).
-   **DFT_INVERSE** inverts DFT. Use for complex-complex cases (real-complex and complex-real
M
Maksim Shabunin 已提交
917
cases are always forward and inverse, respectively).
918
-   **DFT_REAL_OUTPUT** specifies the output as real. The source matrix is the result of
M
Maksim Shabunin 已提交
919 920 921 922 923 924 925 926 927 928
real-complex transform, so the destination matrix must be real.
@param stream Stream for the asynchronous version.

Use to handle real matrices ( CV32FC1 ) and complex matrices in the interleaved format ( CV32FC2 ).

The source matrix should be continuous, otherwise reallocation and data copying is performed. The
function chooses an operation mode depending on the flags, size, and channel count of the source
matrix:

-   If the source matrix is complex and the output is not specified as real, the destination
929
matrix is complex and has the dft_size size and CV_32FC2 type. The destination matrix
M
Maksim Shabunin 已提交
930 931 932
contains a full result of the DFT (forward or inverse).
-   If the source matrix is complex and the output is specified as real, the function assumes that
its input is the result of the forward transform (see the next item). The destination matrix
933 934 935 936
has the dft_size size and CV_32FC1 type. It contains the result of the inverse DFT.
-   If the source matrix is real (its type is CV_32FC1 ), forward DFT is performed. The result of
the DFT is packed into complex ( CV_32FC2 ) matrix. So, the width of the destination matrix
is dft_size.width / 2 + 1 . But if the source is a single column, the height is reduced
M
Maksim Shabunin 已提交
937 938 939 940
instead of the width.

@sa dft
 */
941
CV_EXPORTS void dft(InputArray src, OutputArray dst, Size dft_size, int flags=0, Stream& stream = Stream::Null());
942

M
Maksim Shabunin 已提交
943 944
/** @brief Base class for convolution (or cross-correlation) operator. :
 */
945 946 947
class CV_EXPORTS Convolution : public Algorithm
{
public:
M
Maksim Shabunin 已提交
948 949
    /** @brief Computes a convolution (or cross-correlation) of two images.

950
    @param image Source image. Only CV_32FC1 images are supported for now.
M
Maksim Shabunin 已提交
951 952 953 954 955 956 957
    @param templ Template image. The size is not greater than the image size. The type is the same as
    image .
    @param result Result image. If image is *W x H* and templ is *w x h*, then result must be *W-w+1 x
    H-h+1*.
    @param ccorr Flags to evaluate cross-correlation instead of convolution.
    @param stream Stream for the asynchronous version.
     */
958 959 960
    virtual void convolve(InputArray image, InputArray templ, OutputArray result, bool ccorr = false, Stream& stream = Stream::Null()) = 0;
};

M
Maksim Shabunin 已提交
961 962
/** @brief Creates implementation for cuda::Convolution .

963 964
@param user_block_size Block size. If you leave default value Size(0,0) then automatic
estimation of block size will be used (which is optimized for speed). By varying user_block_size
M
Maksim Shabunin 已提交
965 966
you can reduce memory requirements at the cost of speed.
 */
967
CV_EXPORTS Ptr<Convolution> createConvolution(Size user_block_size = Size());
968

M
Maksim Shabunin 已提交
969 970 971 972
//! @} cudaarithm_arithm

//! @} cudaarithm

973
}} // namespace cv { namespace cuda {
974

975
#endif /* __OPENCV_CUDAARITHM_HPP__ */