/*M/////////////////////////////////////////////////////////////////////////////////////// // // IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING. // // By downloading, copying, installing or using the software you agree to this license. // If you do not agree to this license, do not download, install, // copy or use the software. // // // License Agreement // For Open Source Computer Vision Library // // Copyright (C) 2008-2013, Itseez Inc., all rights reserved. // Third party copyrights are property of their respective owners. // // Redistribution and use in source and binary forms, with or without modification, // are permitted provided that the following conditions are met: // // * Redistribution's of source code must retain the above copyright notice, // this list of conditions and the following disclaimer. // // * Redistribution's in binary form must reproduce the above copyright notice, // this list of conditions and the following disclaimer in the documentation // and/or other materials provided with the distribution. // // * The name of Itseez Inc. may not be used to endorse or promote products // derived from this software without specific prior written permission. // // This software is provided by the copyright holders and contributors "as is" and // any express or implied warranties, including, but not limited to, the implied // warranties of merchantability and fitness for a particular purpose are disclaimed. // In no event shall the copyright holders or contributors be liable for any direct, // indirect, incidental, special, exemplary, or consequential damages // (including, but not limited to, procurement of substitute goods or services; // loss of use, data, or profits; or business interruption) however caused // and on any theory of liability, whether in contract, strict liability, // or tort (including negligence or otherwise) arising in any way out of // the use of this software, even if advised of the possibility of such damage. 
// //M*/ #include "precomp.hpp" #include #include "cascadedetect.hpp" #include "opencv2/objdetect/objdetect_c.h" #include "opencl_kernels.hpp" namespace cv { template void copyVectorToUMat(const std::vector<_Tp>& v, UMat& um) { if(v.empty()) um.release(); Mat(1, (int)(v.size()*sizeof(v[0])), CV_8U, (void*)&v[0]).copyTo(um); } void groupRectangles(std::vector& rectList, int groupThreshold, double eps, std::vector* weights, std::vector* levelWeights) { if( groupThreshold <= 0 || rectList.empty() ) { if( weights ) { size_t i, sz = rectList.size(); weights->resize(sz); for( i = 0; i < sz; i++ ) (*weights)[i] = 1; } return; } std::vector labels; int nclasses = partition(rectList, labels, SimilarRects(eps)); std::vector rrects(nclasses); std::vector rweights(nclasses, 0); std::vector rejectLevels(nclasses, 0); std::vector rejectWeights(nclasses, DBL_MIN); int i, j, nlabels = (int)labels.size(); for( i = 0; i < nlabels; i++ ) { int cls = labels[i]; rrects[cls].x += rectList[i].x; rrects[cls].y += rectList[i].y; rrects[cls].width += rectList[i].width; rrects[cls].height += rectList[i].height; rweights[cls]++; } if ( levelWeights && weights && !weights->empty() && !levelWeights->empty() ) { for( i = 0; i < nlabels; i++ ) { int cls = labels[i]; if( (*weights)[i] > rejectLevels[cls] ) { rejectLevels[cls] = (*weights)[i]; rejectWeights[cls] = (*levelWeights)[i]; } else if( ( (*weights)[i] == rejectLevels[cls] ) && ( (*levelWeights)[i] > rejectWeights[cls] ) ) rejectWeights[cls] = (*levelWeights)[i]; } } for( i = 0; i < nclasses; i++ ) { Rect r = rrects[i]; float s = 1.f/rweights[i]; rrects[i] = Rect(saturate_cast(r.x*s), saturate_cast(r.y*s), saturate_cast(r.width*s), saturate_cast(r.height*s)); } rectList.clear(); if( weights ) weights->clear(); if( levelWeights ) levelWeights->clear(); for( i = 0; i < nclasses; i++ ) { Rect r1 = rrects[i]; int n1 = rweights[i]; double w1 = rejectWeights[i]; int l1 = rejectLevels[i]; // filter out rectangles which don't have enough similar 
rectangles if( n1 <= groupThreshold ) continue; // filter out small face rectangles inside large rectangles for( j = 0; j < nclasses; j++ ) { int n2 = rweights[j]; if( j == i || n2 <= groupThreshold ) continue; Rect r2 = rrects[j]; int dx = saturate_cast( r2.width * eps ); int dy = saturate_cast( r2.height * eps ); if( i != j && r1.x >= r2.x - dx && r1.y >= r2.y - dy && r1.x + r1.width <= r2.x + r2.width + dx && r1.y + r1.height <= r2.y + r2.height + dy && (n2 > std::max(3, n1) || n1 < 3) ) break; } if( j == nclasses ) { rectList.push_back(r1); if( weights ) weights->push_back(l1); if( levelWeights ) levelWeights->push_back(w1); } } } class MeanshiftGrouping { public: MeanshiftGrouping(const Point3d& densKer, const std::vector& posV, const std::vector& wV, double eps, int maxIter = 20) { densityKernel = densKer; weightsV = wV; positionsV = posV; positionsCount = (int)posV.size(); meanshiftV.resize(positionsCount); distanceV.resize(positionsCount); iterMax = maxIter; modeEps = eps; for (unsigned i = 0; i& modesV, std::vector& resWeightsV, const double eps) { for (size_t i=0; i positionsV; std::vector weightsV; Point3d densityKernel; int positionsCount; std::vector meanshiftV; std::vector distanceV; int iterMax; double modeEps; Point3d getNewValue(const Point3d& inPt) const { Point3d resPoint(.0); Point3d ratPoint(.0); for (size_t i=0; i& rectList, double detectThreshold, std::vector* foundWeights, std::vector& scales, Size winDetSize) { int detectionCount = (int)rectList.size(); std::vector hits(detectionCount), resultHits; std::vector hitWeights(detectionCount), resultWeights; Point2d hitCenter; for (int i=0; i < detectionCount; i++) { hitWeights[i] = (*foundWeights)[i]; hitCenter = (rectList[i].tl() + rectList[i].br())*(0.5); //center of rectangles hits[i] = Point3d(hitCenter.x, hitCenter.y, std::log(scales[i])); } rectList.clear(); if (foundWeights) foundWeights->clear(); double logZ = std::log(1.3); Point3d smothing(8, 16, logZ); MeanshiftGrouping 
msGrouping(smothing, hits, hitWeights, 1e-5, 100); msGrouping.getModes(resultHits, resultWeights, 1); for (unsigned i=0; i < resultHits.size(); ++i) { double scale = std::exp(resultHits[i].z); hitCenter.x = resultHits[i].x; hitCenter.y = resultHits[i].y; Size s( int(winDetSize.width * scale), int(winDetSize.height * scale) ); Rect resultRect( int(hitCenter.x-s.width/2), int(hitCenter.y-s.height/2), int(s.width), int(s.height) ); if (resultWeights[i] > detectThreshold) { rectList.push_back(resultRect); foundWeights->push_back(resultWeights[i]); } } } void groupRectangles(std::vector& rectList, int groupThreshold, double eps) { groupRectangles(rectList, groupThreshold, eps, 0, 0); } void groupRectangles(std::vector& rectList, std::vector& weights, int groupThreshold, double eps) { groupRectangles(rectList, groupThreshold, eps, &weights, 0); } //used for cascade detection algorithm for ROC-curve calculating void groupRectangles(std::vector& rectList, std::vector& rejectLevels, std::vector& levelWeights, int groupThreshold, double eps) { groupRectangles(rectList, groupThreshold, eps, &rejectLevels, &levelWeights); } //can be used for HOG detection algorithm only void groupRectangles_meanshift(std::vector& rectList, std::vector& foundWeights, std::vector& foundScales, double detectThreshold, Size winDetSize) { groupRectangles_meanshift(rectList, detectThreshold, &foundWeights, foundScales, winDetSize); } FeatureEvaluator::~FeatureEvaluator() {} bool FeatureEvaluator::read(const FileNode&, Size _origWinSize) { origWinSize = _origWinSize; localSize = lbufSize = Size(0, 0); if (scaleData.empty()) scaleData = makePtr >(); else scaleData->clear(); return true; } Ptr FeatureEvaluator::clone() const { return Ptr(); } int FeatureEvaluator::getFeatureType() const {return -1;} bool FeatureEvaluator::setWindow(Point, int) { return true; } void FeatureEvaluator::getUMats(std::vector& bufs) { if (!(sbufFlag & USBUF_VALID)) { sbuf.copyTo(usbuf); sbufFlag |= USBUF_VALID; } 
bufs.clear();
    // Output order: scale table, integral buffer, feature buffer.
    bufs.push_back(uscaleData);
    bufs.push_back(usbuf);
    bufs.push_back(ufbuf);
}

// Copies usbuf into sbuf unless sbuf is already flagged valid, then sets the
// SBUF_VALID flag.
void FeatureEvaluator::getMats()
{
    if (!(sbufFlag & SBUF_VALID))
    {
        usbuf.copyTo(sbuf);
        sbufFlag |= SBUF_VALID;
    }
}

// Base-class defaults: both feature evaluations return zero.
float FeatureEvaluator::calcOrd(int) const { return 0.; }
int FeatureEvaluator::calcCat(int) const { return 0; }

// Recomputes the per-scale table (scale, ystep, integral size, buffer offset)
// for an image of size `imgsz` and grows sbufSize as needed.
// Returns true when the scale count, any scale value or the buffer size
// changed.
// NOTE(review): the std::vector parameter and the makePtr call carry no
// template arguments; they are reproduced as found.
bool FeatureEvaluator::updateScaleData( Size imgsz, const std::vector& _scales )
{
    if( scaleData.empty() )
        scaleData = makePtr >();

    size_t i, nscales = _scales.size();
    bool recalcOptFeatures = nscales != scaleData->size();
    scaleData->resize(nscales);

    // layer_dy: height of the row currently being filled;
    // layer_ofs: position where the next layer is placed.
    int layer_dy = 0;
    Point layer_ofs(0,0);
    Size prevBufSize = sbufSize;
    // NOTE(review): _scales[0] is read without checking that _scales is
    // non-empty.
    sbufSize.width = std::max(sbufSize.width, (int)alignSize(cvRound(imgsz.width/_scales[0]) + 31, 32));
    recalcOptFeatures = recalcOptFeatures || sbufSize.width != prevBufSize.width;

    for( i = 0; i < nscales; i++ )
    {
        FeatureEvaluator::ScaleData& s = scaleData->at(i);
        // A scale that moved by more than a relative tolerance forces a
        // recalculation.
        if( !recalcOptFeatures && fabs(s.scale - _scales[i]) > FLT_EPSILON*100*_scales[i] )
            recalcOptFeatures = true;
        float sc = _scales[i];
        Size sz;
        sz.width = cvRound(imgsz.width/sc);
        sz.height = cvRound(imgsz.height/sc);
        s.ystep = sc >= 2 ?
1 : 2; s.scale = sc; s.szi = Size(sz.width+1, sz.height+1); if( layer_ofs.x + s.szi.width > sbufSize.width ) { layer_ofs = Point(0, layer_ofs.y + layer_dy); layer_dy = s.szi.height; } s.layer_ofs = layer_ofs.y*sbufSize.width + layer_ofs.x; layer_ofs.x += s.szi.width; } layer_ofs.y += layer_dy; sbufSize.height = std::max(sbufSize.height, layer_ofs.y); recalcOptFeatures = recalcOptFeatures || sbufSize.height != prevBufSize.height; return recalcOptFeatures; } bool FeatureEvaluator::setImage( InputArray _image, const std::vector& _scales ) { Size imgsz = _image.size(); bool recalcOptFeatures = updateScaleData(imgsz, _scales); size_t i, nscales = scaleData->size(); Size sz0 = scaleData->at(0).szi; sz0 = Size(std::max(rbuf.cols, (int)alignSize(sz0.width, 16)), std::max(rbuf.rows, sz0.height)); if (recalcOptFeatures) { computeOptFeatures(); copyVectorToUMat(*scaleData, uscaleData); } if (_image.isUMat() && localSize.area() > 0) { usbuf.create(sbufSize.height*nchannels, sbufSize.width, CV_32S); urbuf.create(sz0, CV_8U); for (i = 0; i < nscales; i++) { const ScaleData& s = scaleData->at(i); UMat dst(urbuf, Rect(0, 0, s.szi.width - 1, s.szi.height - 1)); resize(_image, dst, dst.size(), 1. / s.scale, 1. / s.scale, INTER_LINEAR); computeChannels((int)i, dst); } sbufFlag = USBUF_VALID; } else { Mat image = _image.getMat(); sbuf.create(sbufSize.height*nchannels, sbufSize.width, CV_32S); rbuf.create(sz0, CV_8U); for (i = 0; i < nscales; i++) { const ScaleData& s = scaleData->at(i); Mat dst(s.szi.height - 1, s.szi.width - 1, CV_8U, rbuf.data); resize(image, dst, dst.size(), 1. / s.scale, 1. 
/ s.scale, INTER_LINEAR); computeChannels((int)i, dst); } sbufFlag = SBUF_VALID; } return true; } //---------------------------------------------- HaarEvaluator --------------------------------------- bool HaarEvaluator::Feature :: read( const FileNode& node ) { FileNode rnode = node[CC_RECTS]; FileNodeIterator it = rnode.begin(), it_end = rnode.end(); int ri; for( ri = 0; ri < RECT_NUM; ri++ ) { rect[ri].r = Rect(); rect[ri].weight = 0.f; } for(ri = 0; it != it_end; ++it, ri++) { FileNodeIterator it2 = (*it).begin(); it2 >> rect[ri].r.x >> rect[ri].r.y >> rect[ri].r.width >> rect[ri].r.height >> rect[ri].weight; } tilted = (int)node[CC_TILTED] != 0; return true; } HaarEvaluator::HaarEvaluator() { optfeaturesPtr = 0; pwin = 0; localSize = Size(4, 2); lbufSize = Size(0, 0); nchannels = 0; } HaarEvaluator::~HaarEvaluator() { } bool HaarEvaluator::read(const FileNode& node, Size _origWinSize) { if (!FeatureEvaluator::read(node, _origWinSize)) return false; size_t i, n = node.size(); CV_Assert(n > 0); if(features.empty()) features = makePtr >(); if(optfeatures.empty()) optfeatures = makePtr >(); if (optfeatures_lbuf.empty()) optfeatures_lbuf = makePtr >(); features->resize(n); FileNodeIterator it = node.begin(); hasTiltedFeatures = false; std::vector& ff = *features; sbufSize = Size(); ufbuf.release(); for(i = 0; i < n; i++, ++it) { if(!ff[i].read(*it)) return false; if( ff[i].tilted ) hasTiltedFeatures = true; } nchannels = hasTiltedFeatures ? 3 : 2; normrect = Rect(1, 1, origWinSize.width - 2, origWinSize.height - 2); if (ocl::haveOpenCL()) { String vname = ocl::Device::getDefault().vendor(); if (vname == "Advanced Micro Devices, Inc." 
|| vname == "AMD") localSize = Size(8, 8); lbufSize = Size(origWinSize.width + localSize.width, origWinSize.height + localSize.height); if (lbufSize.area() > 1024) lbufSize = Size(0, 0); } return true; } Ptr HaarEvaluator::clone() const { Ptr ret = makePtr(); *ret = *this; return ret; } void HaarEvaluator::computeChannels(int scaleIdx, InputArray img) { const ScaleData& s = scaleData->at(scaleIdx); tofs = (int)sbufSize.area(); sqofs = hasTiltedFeatures ? tofs*2 : tofs; if (img.isUMat()) { int sx = s.layer_ofs % sbufSize.width; int sy = s.layer_ofs / sbufSize.width; int sqy = sy + (sqofs / sbufSize.width); UMat sum(usbuf, Rect(sx, sy, s.szi.width, s.szi.height)); UMat sqsum(usbuf, Rect(sx, sqy, s.szi.width, s.szi.height)); sqsum.flags = (sqsum.flags & ~UMat::DEPTH_MASK) | CV_32F; if (hasTiltedFeatures) { int sty = sy + (tofs / sbufSize.width); UMat tilted(usbuf, Rect(sx, sty, s.szi.width, s.szi.height)); integral(img, sum, sqsum, tilted, CV_32S, CV_32F); } else { UMatData* u = sqsum.u; integral(img, sum, sqsum, noArray(), CV_32S, CV_32F); CV_Assert(sqsum.u == u && sqsum.size() == s.szi && sqsum.type()==CV_32F); } } else { Mat sum(s.szi, CV_32S, sbuf.ptr() + s.layer_ofs, sbuf.step); Mat sqsum(s.szi, CV_32F, sum.ptr() + sqofs, sbuf.step); if (hasTiltedFeatures) { Mat tilted(s.szi, CV_32S, sum.ptr() + tofs, sbuf.step); integral(img, sum, sqsum, tilted, CV_32S, CV_32F); } else integral(img, sum, sqsum, noArray(), CV_32S, CV_32F); } } void HaarEvaluator::computeOptFeatures() { int sstep = sbufSize.width; CV_SUM_OFS( nofs[0], nofs[1], nofs[2], nofs[3], 0, normrect, sstep ); size_t fi, nfeatures = features->size(); const std::vector& ff = *features; optfeatures->resize(nfeatures); optfeaturesPtr = &(*optfeatures)[0]; for( fi = 0; fi < nfeatures; fi++ ) optfeaturesPtr[fi].setOffsets( ff[fi], sstep, tofs ); optfeatures_lbuf->resize(nfeatures); for( fi = 0; fi < nfeatures; fi++ ) optfeatures_lbuf->at(fi).setOffsets(ff[fi], lbufSize.width > 0 ? 
lbufSize.width : sstep, tofs); copyVectorToUMat(*optfeatures_lbuf, ufbuf); } bool HaarEvaluator::setWindow( Point pt, int scaleIdx ) { const ScaleData& s = getScaleData(scaleIdx); if( pt.x < 0 || pt.y < 0 || pt.x + origWinSize.width >= s.szi.width || pt.y + origWinSize.height >= s.szi.height ) return false; pwin = &sbuf.at(pt) + s.layer_ofs; const float* pq = (const float*)(pwin + sqofs); int valsum = CALC_SUM_OFS(nofs, pwin); float valsqsum = CALC_SUM_OFS(nofs, pq); double nf = (double)normrect.area() * valsqsum - (double)valsum * valsum; if( nf > 0. ) nf = std::sqrt(nf); else nf = 1.; varianceNormFactor = (float)(1./nf); return true; } void HaarEvaluator::OptFeature::setOffsets( const Feature& _f, int step, int _tofs ) { weight[0] = _f.rect[0].weight; weight[1] = _f.rect[1].weight; weight[2] = _f.rect[2].weight; if( _f.tilted ) { CV_TILTED_OFS( ofs[0][0], ofs[0][1], ofs[0][2], ofs[0][3], _tofs, _f.rect[0].r, step ); CV_TILTED_OFS( ofs[1][0], ofs[1][1], ofs[1][2], ofs[1][3], _tofs, _f.rect[1].r, step ); CV_TILTED_OFS( ofs[2][0], ofs[2][1], ofs[2][2], ofs[2][3], _tofs, _f.rect[2].r, step ); } else { CV_SUM_OFS( ofs[0][0], ofs[0][1], ofs[0][2], ofs[0][3], 0, _f.rect[0].r, step ); CV_SUM_OFS( ofs[1][0], ofs[1][1], ofs[1][2], ofs[1][3], 0, _f.rect[1].r, step ); CV_SUM_OFS( ofs[2][0], ofs[2][1], ofs[2][2], ofs[2][3], 0, _f.rect[2].r, step ); } } Rect HaarEvaluator::getNormRect() const { return normrect; } int HaarEvaluator::getSquaresOffset() const { return sqofs; } //---------------------------------------------- LBPEvaluator ------------------------------------- bool LBPEvaluator::Feature :: read(const FileNode& node ) { FileNode rnode = node[CC_RECT]; FileNodeIterator it = rnode.begin(); it >> rect.x >> rect.y >> rect.width >> rect.height; return true; } LBPEvaluator::LBPEvaluator() { features = makePtr >(); optfeatures = makePtr >(); scaleData = makePtr >(); } LBPEvaluator::~LBPEvaluator() { } bool LBPEvaluator::read( const FileNode& node, Size _origWinSize ) { if 
(!FeatureEvaluator::read(node, _origWinSize)) return false; if(features.empty()) features = makePtr >(); if(optfeatures.empty()) optfeatures = makePtr >(); if (optfeatures_lbuf.empty()) optfeatures_lbuf = makePtr >(); features->resize(node.size()); optfeaturesPtr = 0; FileNodeIterator it = node.begin(), it_end = node.end(); std::vector& ff = *features; for(int i = 0; it != it_end; ++it, i++) { if(!ff[i].read(*it)) return false; } nchannels = 1; if (ocl::haveOpenCL()) { const ocl::Device& device = ocl::Device::getDefault(); String vname = device.vendor(); if ((vname == "Advanced Micro Devices, Inc." || vname == "AMD") && !device.hostUnifiedMemory()) localSize = Size(8, 8); } return true; } Ptr LBPEvaluator::clone() const { Ptr ret = makePtr(); *ret = *this; return ret; } void LBPEvaluator::computeChannels(int scaleIdx, InputArray _img) { const ScaleData& s = scaleData->at(scaleIdx); if (_img.isUMat()) { int sx = s.layer_ofs % sbufSize.width; int sy = s.layer_ofs / sbufSize.width; UMat sum(usbuf, Rect(sx, sy, s.szi.width, s.szi.height)); integral(_img, sum, noArray(), noArray(), CV_32S); } else { Mat sum(s.szi, CV_32S, sbuf.ptr() + s.layer_ofs, sbuf.step); integral(_img, sum, noArray(), noArray(), CV_32S); } } void LBPEvaluator::computeOptFeatures() { int sstep = sbufSize.width; size_t fi, nfeatures = features->size(); const std::vector& ff = *features; optfeatures->resize(nfeatures); optfeaturesPtr = &(*optfeatures)[0]; for( fi = 0; fi < nfeatures; fi++ ) optfeaturesPtr[fi].setOffsets( ff[fi], sstep ); copyVectorToUMat(*optfeatures, ufbuf); } void LBPEvaluator::OptFeature::setOffsets( const Feature& _f, int step ) { Rect tr = _f.rect; int w0 = tr.width; int h0 = tr.height; CV_SUM_OFS( ofs[0], ofs[1], ofs[4], ofs[5], 0, tr, step ); tr.x += 2*w0; CV_SUM_OFS( ofs[2], ofs[3], ofs[6], ofs[7], 0, tr, step ); tr.y += 2*h0; CV_SUM_OFS( ofs[10], ofs[11], ofs[14], ofs[15], 0, tr, step ); tr.x -= 2*w0; CV_SUM_OFS( ofs[8], ofs[9], ofs[12], ofs[13], 0, tr, step ); } bool 
LBPEvaluator::setWindow( Point pt, int scaleIdx ) { CV_Assert(0 <= scaleIdx && scaleIdx < (int)scaleData->size()); const ScaleData& s = scaleData->at(scaleIdx); if( pt.x < 0 || pt.y < 0 || pt.x + origWinSize.width >= s.szi.width || pt.y + origWinSize.height >= s.szi.height ) return false; pwin = &sbuf.at(pt) + s.layer_ofs; return true; } Ptr FeatureEvaluator::create( int featureType ) { return featureType == HAAR ? Ptr(new HaarEvaluator) : featureType == LBP ? Ptr(new LBPEvaluator) : Ptr(); } //---------------------------------------- Classifier Cascade -------------------------------------------- CascadeClassifierImpl::CascadeClassifierImpl() { } CascadeClassifierImpl::~CascadeClassifierImpl() { } bool CascadeClassifierImpl::empty() const { return !oldCascade && data.stages.empty(); } bool CascadeClassifierImpl::load(const String& filename) { oldCascade.release(); data = Data(); featureEvaluator.release(); FileStorage fs(filename, FileStorage::READ); if( !fs.isOpened() ) return false; if( read_(fs.getFirstTopLevelNode()) ) return true; fs.release(); oldCascade.reset((CvHaarClassifierCascade*)cvLoad(filename.c_str(), 0, 0, 0)); return !oldCascade.empty(); } void CascadeClassifierImpl::read(const FileNode& node) { read_(node); } int CascadeClassifierImpl::runAt( Ptr& evaluator, Point pt, int scaleIdx, double& weight ) { assert( !oldCascade && (data.featureType == FeatureEvaluator::HAAR || data.featureType == FeatureEvaluator::LBP || data.featureType == FeatureEvaluator::HOG) ); if( !evaluator->setWindow(pt, scaleIdx) ) return -1; if( data.maxNodesPerTree == 1 ) { if( data.featureType == FeatureEvaluator::HAAR ) return predictOrderedStump( *this, evaluator, weight ); else if( data.featureType == FeatureEvaluator::LBP ) return predictCategoricalStump( *this, evaluator, weight ); else return -2; } else { if( data.featureType == FeatureEvaluator::HAAR ) return predictOrdered( *this, evaluator, weight ); else if( data.featureType == FeatureEvaluator::LBP ) return 
predictCategorical( *this, evaluator, weight ); else return -2; } } void CascadeClassifierImpl::setMaskGenerator(const Ptr& _maskGenerator) { maskGenerator=_maskGenerator; } Ptr CascadeClassifierImpl::getMaskGenerator() { return maskGenerator; } Ptr createFaceDetectionMaskGenerator() { #ifdef HAVE_TEGRA_OPTIMIZATION return tegra::getCascadeClassifierMaskGenerator(*this); #else return Ptr(); #endif } class CascadeClassifierInvoker : public ParallelLoopBody { public: CascadeClassifierInvoker( CascadeClassifierImpl& _cc, int _nscales, int _nstripes, const FeatureEvaluator::ScaleData* _scaleData, const int* _stripeSizes, std::vector& _vec, std::vector& _levels, std::vector& _weights, bool outputLevels, const Mat& _mask, Mutex* _mtx) { classifier = &_cc; nscales = _nscales; nstripes = _nstripes; scaleData = _scaleData; stripeSizes = _stripeSizes; rectangles = &_vec; rejectLevels = outputLevels ? &_levels : 0; levelWeights = outputLevels ? &_weights : 0; mask = _mask; mtx = _mtx; } void operator()(const Range& range) const { Ptr evaluator = classifier->featureEvaluator->clone(); double gypWeight = 0.; Size origWinSize = classifier->data.origWinSize; for( int scaleIdx = 0; scaleIdx < nscales; scaleIdx++ ) { const FeatureEvaluator::ScaleData& s = scaleData[scaleIdx]; float scalingFactor = s.scale; int yStep = s.ystep; int stripeSize = stripeSizes[scaleIdx]; int y0 = range.start*stripeSize; Size szw = s.getWorkingSize(origWinSize); int y1 = std::min(range.end*stripeSize, szw.height); Size winSize(cvRound(origWinSize.width * scalingFactor), cvRound(origWinSize.height * scalingFactor)); for( int y = y0; y < y1; y += yStep ) { for( int x = 0; x < szw.width; x += yStep ) { int result = classifier->runAt(evaluator, Point(x, y), scaleIdx, gypWeight); if( rejectLevels ) { if( result == 1 ) result = -(int)classifier->data.stages.size(); if( classifier->data.stages.size() + result == 0 ) { mtx->lock(); rectangles->push_back(Rect(cvRound(x*scalingFactor), cvRound(y*scalingFactor), 
winSize.width, winSize.height)); rejectLevels->push_back(-result); levelWeights->push_back(gypWeight); mtx->unlock(); } } else if( result > 0 ) { mtx->lock(); rectangles->push_back(Rect(cvRound(x*scalingFactor), cvRound(y*scalingFactor), winSize.width, winSize.height)); mtx->unlock(); } if( result == 0 ) x += yStep; } } } } CascadeClassifierImpl* classifier; std::vector* rectangles; int nscales, nstripes; const FeatureEvaluator::ScaleData* scaleData; const int* stripeSizes; std::vector *rejectLevels; std::vector *levelWeights; std::vector scales; Mat mask; Mutex* mtx; }; struct getRect { Rect operator ()(const CvAvgComp& e) const { return e.rect; } }; struct getNeighbors { int operator ()(const CvAvgComp& e) const { return e.neighbors; } }; bool CascadeClassifierImpl::ocl_detectMultiScaleNoGrouping( const std::vector& scales, std::vector& candidates ) { int featureType = getFeatureType(); std::vector bufs; featureEvaluator->getUMats(bufs); Size localsz = featureEvaluator->getLocalSize(); if( localsz.area() == 0 ) return false; Size lbufSize = featureEvaluator->getLocalBufSize(); size_t localsize[] = { localsz.width, localsz.height }; const int grp_per_CU = 12; size_t globalsize[] = { grp_per_CU*ocl::Device::getDefault().maxComputeUnits()*localsize[0], localsize[1] }; bool ok = false; ufacepos.create(1, MAX_FACES*3+1, CV_32S); UMat ufacepos_count(ufacepos, Rect(0, 0, 1, 1)); ufacepos_count.setTo(Scalar::all(0)); if( ustages.empty() ) { copyVectorToUMat(data.stages, ustages); if (!data.stumps.empty()) copyVectorToUMat(data.stumps, unodes); else copyVectorToUMat(data.nodes, unodes); copyVectorToUMat(data.leaves, uleaves); if( !data.subsets.empty() ) copyVectorToUMat(data.subsets, usubsets); } int nstages = (int)data.stages.size(); if( featureType == FeatureEvaluator::HAAR ) { Ptr haar = featureEvaluator.dynamicCast(); if( haar.empty() ) return false; if( haarKernel.empty() ) { String opts; if (lbufSize.area()) opts = format("-D LOCAL_SIZE_X=%d -D LOCAL_SIZE_Y=%d -D 
SUM_BUF_SIZE=%d -D SUM_BUF_STEP=%d -D NODE_COUNT=%d", localsz.width, localsz.height, lbufSize.area(), lbufSize.width, data.maxNodesPerTree); else opts = format("-D LOCAL_SIZE_X=%d -D LOCAL_SIZE_Y=%d -D NODE_COUNT=%d", localsz.width, localsz.height, data.maxNodesPerTree); haarKernel.create("runHaarClassifier", ocl::objdetect::cascadedetect_oclsrc, opts); if( haarKernel.empty() ) return false; } Rect normrect = haar->getNormRect(); int sqofs = haar->getSquaresOffset(); int splitstage_ocl = 1; haarKernel.args((int)scales.size(), ocl::KernelArg::PtrReadOnly(bufs[0]), // scaleData ocl::KernelArg::ReadOnlyNoSize(bufs[1]), // sum ocl::KernelArg::PtrReadOnly(bufs[2]), // optfeatures // cascade classifier splitstage_ocl, nstages, ocl::KernelArg::PtrReadOnly(ustages), ocl::KernelArg::PtrReadOnly(unodes), ocl::KernelArg::PtrReadOnly(uleaves), ocl::KernelArg::PtrWriteOnly(ufacepos), // positions normrect, sqofs, data.origWinSize, (int)MAX_FACES); ok = haarKernel.run(2, globalsize, localsize, true); } else if( featureType == FeatureEvaluator::LBP ) { if (data.maxNodesPerTree > 1) return false; Ptr lbp = featureEvaluator.dynamicCast(); if( lbp.empty() ) return false; if( lbpKernel.empty() ) { String opts; if (lbufSize.area()) opts = format("-D LOCAL_SIZE_X=%d -D LOCAL_SIZE_Y=%d -D SUM_BUF_SIZE=%d -D SUM_BUF_STEP=%d", localsz.width, localsz.height, lbufSize.area(), lbufSize.width); else opts = format("-D LOCAL_SIZE_X=%d -D LOCAL_SIZE_Y=%d", localsz.width, localsz.height); lbpKernel.create("runLBPClassifierStumpSimple", ocl::objdetect::cascadedetect_oclsrc, opts); if( lbpKernel.empty() ) return false; } int splitstage_ocl = 1; int subsetSize = (data.ncategories + 31)/32; lbpKernel.args((int)scales.size(), ocl::KernelArg::PtrReadOnly(bufs[0]), // scaleData ocl::KernelArg::ReadOnlyNoSize(bufs[1]), // sum ocl::KernelArg::PtrReadOnly(bufs[2]), // optfeatures // cascade classifier splitstage_ocl, nstages, ocl::KernelArg::PtrReadOnly(ustages), ocl::KernelArg::PtrReadOnly(unodes), 
ocl::KernelArg::PtrReadOnly(usubsets), subsetSize, ocl::KernelArg::PtrWriteOnly(ufacepos), // positions data.origWinSize, (int)MAX_FACES); ok = lbpKernel.run(2, globalsize, localsize, true); } if( ok ) { Mat facepos = ufacepos.getMat(ACCESS_READ); const int* fptr = facepos.ptr(); int nfaces = fptr[0]; nfaces = std::min(nfaces, (int)MAX_FACES); for( int i = 0; i < nfaces; i++ ) { const FeatureEvaluator::ScaleData& s = featureEvaluator->getScaleData(fptr[i*3 + 1]); candidates.push_back(Rect(cvRound(fptr[i*3 + 2]*s.scale), cvRound(fptr[i*3 + 3]*s.scale), cvRound(data.origWinSize.width*s.scale), cvRound(data.origWinSize.height*s.scale))); } } return ok; } bool CascadeClassifierImpl::isOldFormatCascade() const { return !oldCascade.empty(); } int CascadeClassifierImpl::getFeatureType() const { return featureEvaluator->getFeatureType(); } Size CascadeClassifierImpl::getOriginalWindowSize() const { return data.origWinSize; } void* CascadeClassifierImpl::getOldCascade() { return oldCascade; } static void detectMultiScaleOldFormat( const Mat& image, Ptr oldCascade, std::vector& objects, std::vector& rejectLevels, std::vector& levelWeights, std::vector& vecAvgComp, double scaleFactor, int minNeighbors, int flags, Size minObjectSize, Size maxObjectSize, bool outputRejectLevels = false ) { MemStorage storage(cvCreateMemStorage(0)); CvMat _image = image; CvSeq* _objects = cvHaarDetectObjectsForROC( &_image, oldCascade, storage, rejectLevels, levelWeights, scaleFactor, minNeighbors, flags, minObjectSize, maxObjectSize, outputRejectLevels ); Seq(_objects).copyTo(vecAvgComp); objects.resize(vecAvgComp.size()); std::transform(vecAvgComp.begin(), vecAvgComp.end(), objects.begin(), getRect()); } void CascadeClassifierImpl::detectMultiScaleNoGrouping( InputArray _image, std::vector& candidates, std::vector& rejectLevels, std::vector& levelWeights, double scaleFactor, Size minObjectSize, Size maxObjectSize, bool outputRejectLevels ) { Size imgsz = _image.size(); Mat grayImage; 
_InputArray gray; candidates.clear(); rejectLevels.clear(); levelWeights.clear(); if( maxObjectSize.height == 0 || maxObjectSize.width == 0 ) maxObjectSize = imgsz; bool use_ocl = tryOpenCL && ocl::useOpenCL() && featureEvaluator->getLocalSize().area() > 0 && ocl::Device::getDefault().type() != ocl::Device::TYPE_CPU && (data.minNodesPerTree == data.maxNodesPerTree) && !isOldFormatCascade() && maskGenerator.empty() && !outputRejectLevels; /*if( use_ocl ) { if (_image.channels() > 1) cvtColor(_image, ugrayImage, COLOR_BGR2GRAY); else if (_image.isUMat()) ugrayImage = _image.getUMat(); else _image.copyTo(ugrayImage); gray = ugrayImage; } else*/ { if (_image.channels() > 1) cvtColor(_image, grayImage, COLOR_BGR2GRAY); else if (_image.isMat()) grayImage = _image.getMat(); else _image.copyTo(grayImage); gray = grayImage; } std::vector scales; scales.reserve(1024); for( double factor = 1; ; factor *= scaleFactor ) { Size originalWindowSize = getOriginalWindowSize(); Size windowSize( cvRound(originalWindowSize.width*factor), cvRound(originalWindowSize.height*factor) ); if( windowSize.width > maxObjectSize.width || windowSize.height > maxObjectSize.height || windowSize.width > imgsz.width || windowSize.height > imgsz.height ) break; if( windowSize.width < minObjectSize.width || windowSize.height < minObjectSize.height ) continue; scales.push_back((float)factor); } if( !featureEvaluator->setImage(gray, scales) ) return; // OpenCL code if( use_ocl && ocl_detectMultiScaleNoGrouping( scales, candidates )) return; tryOpenCL = false; // CPU code featureEvaluator->getMats(); { Mat currentMask; if (maskGenerator) currentMask = maskGenerator->generateMask(gray.getMat()); size_t i, nscales = scales.size(); cv::AutoBuffer stripeSizeBuf(nscales); int* stripeSizes = stripeSizeBuf; const FeatureEvaluator::ScaleData* s = &featureEvaluator->getScaleData(0); Size szw = s->getWorkingSize(data.origWinSize); int nstripes = cvCeil(szw.width/32.); for( i = 0; i < nscales; i++ ) { szw = 
s[i].getWorkingSize(data.origWinSize); stripeSizes[i] = std::max((szw.height/s[i].ystep + nstripes-1)/nstripes, 1)*s[i].ystep; } CascadeClassifierInvoker invoker(*this, (int)nscales, nstripes, s, stripeSizes, candidates, rejectLevels, levelWeights, outputRejectLevels, currentMask, &mtx); parallel_for_(Range(0, nstripes), invoker); } } void CascadeClassifierImpl::detectMultiScale( InputArray _image, std::vector& objects, std::vector& rejectLevels, std::vector& levelWeights, double scaleFactor, int minNeighbors, int flags, Size minObjectSize, Size maxObjectSize, bool outputRejectLevels ) { CV_Assert( scaleFactor > 1 && _image.depth() == CV_8U ); if( empty() ) return; if( isOldFormatCascade() ) { Mat image = _image.getMat(); std::vector fakeVecAvgComp; detectMultiScaleOldFormat( image, oldCascade, objects, rejectLevels, levelWeights, fakeVecAvgComp, scaleFactor, minNeighbors, flags, minObjectSize, maxObjectSize, outputRejectLevels ); } else { detectMultiScaleNoGrouping( _image, objects, rejectLevels, levelWeights, scaleFactor, minObjectSize, maxObjectSize, outputRejectLevels ); const double GROUP_EPS = 0.2; if( outputRejectLevels ) { groupRectangles( objects, rejectLevels, levelWeights, minNeighbors, GROUP_EPS ); } else { groupRectangles( objects, minNeighbors, GROUP_EPS ); } } } void CascadeClassifierImpl::detectMultiScale( InputArray _image, std::vector& objects, double scaleFactor, int minNeighbors, int flags, Size minObjectSize, Size maxObjectSize) { std::vector fakeLevels; std::vector fakeWeights; detectMultiScale( _image, objects, fakeLevels, fakeWeights, scaleFactor, minNeighbors, flags, minObjectSize, maxObjectSize ); } void CascadeClassifierImpl::detectMultiScale( InputArray _image, std::vector& objects, std::vector& numDetections, double scaleFactor, int minNeighbors, int flags, Size minObjectSize, Size maxObjectSize ) { Mat image = _image.getMat(); CV_Assert( scaleFactor > 1 && image.depth() == CV_8U ); if( empty() ) return; std::vector fakeLevels; 
std::vector fakeWeights; if( isOldFormatCascade() ) { std::vector vecAvgComp; detectMultiScaleOldFormat( image, oldCascade, objects, fakeLevels, fakeWeights, vecAvgComp, scaleFactor, minNeighbors, flags, minObjectSize, maxObjectSize ); numDetections.resize(vecAvgComp.size()); std::transform(vecAvgComp.begin(), vecAvgComp.end(), numDetections.begin(), getNeighbors()); } else { detectMultiScaleNoGrouping( image, objects, fakeLevels, fakeWeights, scaleFactor, minObjectSize, maxObjectSize ); const double GROUP_EPS = 0.2; groupRectangles( objects, numDetections, minNeighbors, GROUP_EPS ); } } CascadeClassifierImpl::Data::Data() { stageType = featureType = ncategories = maxNodesPerTree = 0; } bool CascadeClassifierImpl::Data::read(const FileNode &root) { static const float THRESHOLD_EPS = 1e-5f; // load stage params String stageTypeStr = (String)root[CC_STAGE_TYPE]; if( stageTypeStr == CC_BOOST ) stageType = BOOST; else return false; String featureTypeStr = (String)root[CC_FEATURE_TYPE]; if( featureTypeStr == CC_HAAR ) featureType = FeatureEvaluator::HAAR; else if( featureTypeStr == CC_LBP ) featureType = FeatureEvaluator::LBP; else if( featureTypeStr == CC_HOG ) featureType = FeatureEvaluator::HOG; else return false; origWinSize.width = (int)root[CC_WIDTH]; origWinSize.height = (int)root[CC_HEIGHT]; CV_Assert( origWinSize.height > 0 && origWinSize.width > 0 ); // load feature params FileNode fn = root[CC_FEATURE_PARAMS]; if( fn.empty() ) return false; ncategories = fn[CC_MAX_CAT_COUNT]; int subsetSize = (ncategories + 31)/32, nodeStep = 3 + ( ncategories>0 ? 
subsetSize : 1 ); // load stages fn = root[CC_STAGES]; if( fn.empty() ) return false; stages.reserve(fn.size()); classifiers.clear(); nodes.clear(); stumps.clear(); FileNodeIterator it = fn.begin(), it_end = fn.end(); minNodesPerTree = INT_MAX; maxNodesPerTree = 0; for( int si = 0; it != it_end; si++, ++it ) { FileNode fns = *it; Stage stage; stage.threshold = (float)fns[CC_STAGE_THRESHOLD] - THRESHOLD_EPS; fns = fns[CC_WEAK_CLASSIFIERS]; if(fns.empty()) return false; stage.ntrees = (int)fns.size(); stage.first = (int)classifiers.size(); stages.push_back(stage); classifiers.reserve(stages[si].first + stages[si].ntrees); FileNodeIterator it1 = fns.begin(), it1_end = fns.end(); for( ; it1 != it1_end; ++it1 ) // weak trees { FileNode fnw = *it1; FileNode internalNodes = fnw[CC_INTERNAL_NODES]; FileNode leafValues = fnw[CC_LEAF_VALUES]; if( internalNodes.empty() || leafValues.empty() ) return false; DTree tree; tree.nodeCount = (int)internalNodes.size()/nodeStep; minNodesPerTree = std::min(minNodesPerTree, tree.nodeCount); maxNodesPerTree = std::max(maxNodesPerTree, tree.nodeCount); classifiers.push_back(tree); nodes.reserve(nodes.size() + tree.nodeCount); leaves.reserve(leaves.size() + leafValues.size()); if( subsetSize > 0 ) subsets.reserve(subsets.size() + tree.nodeCount*subsetSize); FileNodeIterator internalNodesIter = internalNodes.begin(), internalNodesEnd = internalNodes.end(); for( ; internalNodesIter != internalNodesEnd; ) // nodes { DTreeNode node; node.left = (int)*internalNodesIter; ++internalNodesIter; node.right = (int)*internalNodesIter; ++internalNodesIter; node.featureIdx = (int)*internalNodesIter; ++internalNodesIter; if( subsetSize > 0 ) { for( int j = 0; j < subsetSize; j++, ++internalNodesIter ) subsets.push_back((int)*internalNodesIter); node.threshold = 0.f; } else { node.threshold = (float)*internalNodesIter; ++internalNodesIter; } nodes.push_back(node); } internalNodesIter = leafValues.begin(), internalNodesEnd = leafValues.end(); for( ; 
internalNodesIter != internalNodesEnd; ++internalNodesIter ) // leaves leaves.push_back((float)*internalNodesIter); } } if( maxNodesPerTree == 1 ) { int nodeOfs = 0, leafOfs = 0; size_t nstages = stages.size(); for( size_t stageIdx = 0; stageIdx < nstages; stageIdx++ ) { const Stage& stage = stages[stageIdx]; int ntrees = stage.ntrees; for( int i = 0; i < ntrees; i++, nodeOfs++, leafOfs+= 2 ) { const DTreeNode& node = nodes[nodeOfs]; stumps.push_back(Stump(node.featureIdx, node.threshold, leaves[leafOfs], leaves[leafOfs+1])); } } } return true; } bool CascadeClassifierImpl::read_(const FileNode& root) { tryOpenCL = true; haarKernel = ocl::Kernel(); lbpKernel = ocl::Kernel(); ustages.release(); unodes.release(); uleaves.release(); if( !data.read(root) ) return false; // load features featureEvaluator = FeatureEvaluator::create(data.featureType); FileNode fn = root[CC_FEATURES]; if( fn.empty() ) return false; return featureEvaluator->read(fn, data.origWinSize); } template<> void DefaultDeleter::operator ()(CvHaarClassifierCascade* obj) const { cvReleaseHaarClassifierCascade(&obj); } BaseCascadeClassifier::~BaseCascadeClassifier() { } CascadeClassifier::CascadeClassifier() {} CascadeClassifier::CascadeClassifier(const String& filename) { load(filename); } CascadeClassifier::~CascadeClassifier() { } bool CascadeClassifier::empty() const { return cc.empty() || cc->empty(); } bool CascadeClassifier::load( const String& filename ) { cc = makePtr(); if(!cc->load(filename)) cc.release(); return !empty(); } bool CascadeClassifier::read(const FileNode &root) { Ptr ccimpl = makePtr(); bool ok = ccimpl->read_(root); if( ok ) cc = ccimpl.staticCast(); else cc.release(); return ok; } void CascadeClassifier::detectMultiScale( InputArray image, CV_OUT std::vector& objects, double scaleFactor, int minNeighbors, int flags, Size minSize, Size maxSize ) { CV_Assert(!empty()); cc->detectMultiScale(image, objects, scaleFactor, minNeighbors, flags, minSize, maxSize); } void 
CascadeClassifier::detectMultiScale( InputArray image, CV_OUT std::vector& objects, CV_OUT std::vector& numDetections, double scaleFactor, int minNeighbors, int flags, Size minSize, Size maxSize ) { CV_Assert(!empty()); cc->detectMultiScale(image, objects, numDetections, scaleFactor, minNeighbors, flags, minSize, maxSize); } void CascadeClassifier::detectMultiScale( InputArray image, CV_OUT std::vector& objects, CV_OUT std::vector& rejectLevels, CV_OUT std::vector& levelWeights, double scaleFactor, int minNeighbors, int flags, Size minSize, Size maxSize, bool outputRejectLevels ) { CV_Assert(!empty()); cc->detectMultiScale(image, objects, rejectLevels, levelWeights, scaleFactor, minNeighbors, flags, minSize, maxSize, outputRejectLevels); } bool CascadeClassifier::isOldFormatCascade() const { CV_Assert(!empty()); return cc->isOldFormatCascade(); } Size CascadeClassifier::getOriginalWindowSize() const { CV_Assert(!empty()); return cc->getOriginalWindowSize(); } int CascadeClassifier::getFeatureType() const { CV_Assert(!empty()); return cc->getFeatureType(); } void* CascadeClassifier::getOldCascade() { CV_Assert(!empty()); return cc->getOldCascade(); } void CascadeClassifier::setMaskGenerator(const Ptr& maskGenerator) { CV_Assert(!empty()); cc->setMaskGenerator(maskGenerator); } Ptr CascadeClassifier::getMaskGenerator() { CV_Assert(!empty()); return cc->getMaskGenerator(); } } // namespace cv