// This file is part of OpenCV project. // It is subject to the license terms in the LICENSE file found in the top-level directory // of this distribution and at http://opencv.org/license.html #include "precomp.hpp" #if defined _WIN32 && defined HAVE_MSMF /* Media Foundation-based Video Capturing module is based on videoInput library by Evgeny Pereguda: http://www.codeproject.com/Articles/559437/Capturing-of-video-from-web-camera-on-Windows-7-an Originally licensed under The Code Project Open License (CPOL) 1.02: http://www.codeproject.com/info/cpol10.aspx */ //require Windows 8 for some of the formats defined otherwise could baseline on lower version #if WINVER < _WIN32_WINNT_WIN8 #undef WINVER #define WINVER _WIN32_WINNT_WIN8 #endif #include #include #include #include #include #include #include #include #include #ifdef HAVE_MSMF_DXVA #include #include #endif #include #include #include #include #include #include #include #include #include #ifdef _MSC_VER #pragma warning(disable:4503) #pragma comment(lib, "mfplat") #pragma comment(lib, "mf") #pragma comment(lib, "mfuuid") #pragma comment(lib, "Strmiids") #pragma comment(lib, "Mfreadwrite") #ifdef HAVE_MSMF_DXVA #pragma comment(lib, "d3d11") // MFCreateDXGIDeviceManager() is available since Win8 only. // To avoid OpenCV loading failure on Win7 use dynamic detection of this symbol. // Details: https://github.com/opencv/opencv/issues/11858 typedef HRESULT (WINAPI *FN_MFCreateDXGIDeviceManager)(UINT *resetToken, IMFDXGIDeviceManager **ppDeviceManager); static bool pMFCreateDXGIDeviceManager_initialized = false; static FN_MFCreateDXGIDeviceManager pMFCreateDXGIDeviceManager = NULL; static void init_MFCreateDXGIDeviceManager() { HMODULE h = LoadLibraryExA("mfplat.dll", NULL, LOAD_LIBRARY_SEARCH_SYSTEM32); if (h) { pMFCreateDXGIDeviceManager = (FN_MFCreateDXGIDeviceManager)GetProcAddress(h, "MFCreateDXGIDeviceManager"); } pMFCreateDXGIDeviceManager_initialized = true; } #endif #pragma comment(lib, "Shlwapi.lib") #endif #include #include #include // QISearch struct IMFMediaType; struct IMFActivate; struct IMFMediaSource; struct IMFAttributes; namespace { template class ComPtr { public: ComPtr() { } ComPtr(T* lp) { p = lp; } ComPtr(_In_ const ComPtr& lp) { p = lp.p; } virtual ~ComPtr() { } T** operator&() { CV_Assert(p == NULL); return p.operator&(); } T* operator->() const { CV_Assert(p != NULL); return p.operator->(); } operator bool() { return p.operator!=(NULL); } T* Get() const { return p; } void Release() { if (p) p.Release(); } // query for U interface template HRESULT As(_Out_ ComPtr& lp) const { lp.Release(); return p->QueryInterface(__uuidof(U), reinterpret_cast((T**)&lp)); } private: _COM_SMARTPTR_TYPEDEF(T, __uuidof(T)); TPtr p; }; #define _ComPtr ComPtr template inline T absDiff(T a, T b) { return a >= b ? a - b : b - a; } //================================================================================================== // Structure for collecting info about types of video which are supported by current video device struct MediaType { UINT32 width; UINT32 height; INT32 stride; // stride is negative if image is bottom-up UINT32 isFixedSize; UINT32 frameRateNum; UINT32 frameRateDenom; UINT32 aspectRatioNum; UINT32 aspectRatioDenom; UINT32 sampleSize; UINT32 interlaceMode; GUID majorType; // video or audio GUID subType; // fourCC MediaType(IMFMediaType *pType = 0) : width(0), height(0), stride(0), isFixedSize(true), frameRateNum(1), frameRateDenom(1), aspectRatioNum(1), aspectRatioDenom(1), sampleSize(0), interlaceMode(0), majorType(MFMediaType_Video), subType({ 0 }) { if (pType) { MFGetAttributeSize(pType, MF_MT_FRAME_SIZE, &width, &height); pType->GetUINT32(MF_MT_DEFAULT_STRIDE, (UINT32*)&stride); // value is stored as UINT32 but should be casted to INT3) pType->GetUINT32(MF_MT_FIXED_SIZE_SAMPLES, &isFixedSize); MFGetAttributeRatio(pType, MF_MT_FRAME_RATE, &frameRateNum, &frameRateDenom); MFGetAttributeRatio(pType, MF_MT_PIXEL_ASPECT_RATIO, &aspectRatioNum, &aspectRatioDenom); pType->GetUINT32(MF_MT_SAMPLE_SIZE, &sampleSize); pType->GetUINT32(MF_MT_INTERLACE_MODE, &interlaceMode); pType->GetGUID(MF_MT_MAJOR_TYPE, &majorType); pType->GetGUID(MF_MT_SUBTYPE, &subType); } } static MediaType createDefault() { MediaType res; res.width = 640; res.height = 480; res.setFramerate(30.0); return res; } inline bool isEmpty() const { return width == 0 && height == 0; } _ComPtr createMediaType() const { _ComPtr res; MFCreateMediaType(&res); if (width != 0 || height != 0) MFSetAttributeSize(res.Get(), MF_MT_FRAME_SIZE, width, height); if (stride != 0) res->SetUINT32(MF_MT_DEFAULT_STRIDE, stride); res->SetUINT32(MF_MT_FIXED_SIZE_SAMPLES, isFixedSize); if (frameRateNum != 0 || frameRateDenom != 0) MFSetAttributeRatio(res.Get(), MF_MT_FRAME_RATE, frameRateNum, frameRateDenom); if (aspectRatioNum != 0 || aspectRatioDenom != 0) MFSetAttributeRatio(res.Get(), MF_MT_PIXEL_ASPECT_RATIO, aspectRatioNum, aspectRatioDenom); if (sampleSize > 0) res->SetUINT32(MF_MT_SAMPLE_SIZE, sampleSize); res->SetUINT32(MF_MT_INTERLACE_MODE, interlaceMode); if (majorType != GUID()) res->SetGUID(MF_MT_MAJOR_TYPE, majorType); if (subType != GUID()) res->SetGUID(MF_MT_SUBTYPE, subType); return res; } void setFramerate(double fps) { frameRateNum = (UINT32)cvRound(fps * 1000.0); frameRateDenom = 1000; } double getFramerate() const { return frameRateDenom != 0 ? ((double)frameRateNum) / ((double)frameRateDenom) : 0; } LONGLONG getFrameStep() const { const double fps = getFramerate(); return (LONGLONG)(fps > 0 ? 1e7 / fps : 0); } inline unsigned long resolutionDiff(const MediaType& other) const { const unsigned long wdiff = absDiff(width, other.width); const unsigned long hdiff = absDiff(height, other.height); return wdiff + hdiff; } // check if 'this' is better than 'other' comparing to reference bool isBetterThan(const MediaType& other, const MediaType& ref) const { const unsigned long thisDiff = resolutionDiff(ref); const unsigned long otherDiff = other.resolutionDiff(ref); if (thisDiff < otherDiff) return true; if (thisDiff == otherDiff) { if (width > other.width) return true; if (width == other.width && height > other.height) return true; if (width == other.width && height == other.height) { const double thisRateDiff = absDiff(getFramerate(), ref.getFramerate()); const double otherRateDiff = absDiff(other.getFramerate(), ref.getFramerate()); if (thisRateDiff < otherRateDiff) return true; } } return false; } }; void printFormat(std::ostream& out, const GUID& fmt) { #define PRNT(FMT) else if (fmt == FMT) out << #FMT; if (fmt == MFVideoFormat_Base) out << "Base"; PRNT(MFVideoFormat_RGB32) PRNT(MFVideoFormat_ARGB32) PRNT(MFVideoFormat_RGB24) PRNT(MFVideoFormat_RGB555) PRNT(MFVideoFormat_RGB565) PRNT(MFVideoFormat_RGB8) else { char fourcc[5] = { 0 }; memcpy(fourcc, &fmt.Data1, 4); out << fourcc; } #undef PRNT } std::ostream& operator<<(std::ostream& out, const MediaType& mt) { out << "(" << mt.width << "x" << mt.height << " @ " << mt.getFramerate() << ") "; printFormat(out, mt.subType); return out; } //================================================================================================== // Class for creating of Media Foundation context class Media_Foundation { public: ~Media_Foundation(void) { /*CV_Assert(SUCCEEDED(MFShutdown()));*/ CoUninitialize(); } static Media_Foundation& getInstance() { static Media_Foundation instance; return instance; } private: Media_Foundation(void) { CoInitialize(0); CV_Assert(SUCCEEDED(MFStartup(MF_VERSION))); } }; //================================================================================================== class SourceReaderCB : public IMFSourceReaderCallback { public: static const size_t MSMF_READER_MAX_QUEUE_SIZE = 3; SourceReaderCB() : m_nRefCount(0), m_hEvent(CreateEvent(NULL, FALSE, FALSE, NULL)), m_bEOS(FALSE), m_hrStatus(S_OK), m_reader(NULL), m_dwStreamIndex(0) { } // IUnknown methods STDMETHODIMP QueryInterface(REFIID iid, void** ppv) CV_OVERRIDE { #ifdef _MSC_VER #pragma warning(push) #pragma warning(disable:4838) #endif static const QITAB qit[] = { QITABENT(SourceReaderCB, IMFSourceReaderCallback), { 0 }, }; #ifdef _MSC_VER #pragma warning(pop) #endif return QISearch(this, qit, iid, ppv); } STDMETHODIMP_(ULONG) AddRef() CV_OVERRIDE { return InterlockedIncrement(&m_nRefCount); } STDMETHODIMP_(ULONG) Release() CV_OVERRIDE { ULONG uCount = InterlockedDecrement(&m_nRefCount); if (uCount == 0) { delete this; } return uCount; } STDMETHODIMP OnReadSample(HRESULT hrStatus, DWORD dwStreamIndex, DWORD dwStreamFlags, LONGLONG llTimestamp, IMFSample *pSample) CV_OVERRIDE { HRESULT hr = 0; cv::AutoLock lock(m_mutex); if (SUCCEEDED(hrStatus)) { if (pSample) { CV_LOG_DEBUG(NULL, "videoio(MSMF): got frame at " << llTimestamp); if (m_capturedFrames.size() >= MSMF_READER_MAX_QUEUE_SIZE) { #if 0 CV_LOG_DEBUG(NULL, "videoio(MSMF): drop frame (not processed). Timestamp=" << m_capturedFrames.front().timestamp); m_capturedFrames.pop(); #else // this branch reduces latency if we drop frames due to slow processing. // avoid fetching of already outdated frames from the queue's front. CV_LOG_DEBUG(NULL, "videoio(MSMF): drop previous frames (not processed): " << m_capturedFrames.size()); std::queue().swap(m_capturedFrames); // similar to missing m_capturedFrames.clean(); #endif } m_capturedFrames.emplace(CapturedFrameInfo{ llTimestamp, _ComPtr(pSample), hrStatus }); } } else { CV_LOG_WARNING(NULL, "videoio(MSMF): OnReadSample() is called with error status: " << hrStatus); } if (MF_SOURCE_READERF_ENDOFSTREAM & dwStreamFlags) { // Reached the end of the stream. m_bEOS = true; } m_hrStatus = hrStatus; if (FAILED(hr = m_reader->ReadSample(dwStreamIndex, 0, NULL, NULL, NULL, NULL))) { CV_LOG_WARNING(NULL, "videoio(MSMF): async ReadSample() call is failed with error status: " << hr); m_bEOS = true; } if (pSample || m_bEOS) { SetEvent(m_hEvent); } return S_OK; } STDMETHODIMP OnEvent(DWORD, IMFMediaEvent *) CV_OVERRIDE { return S_OK; } STDMETHODIMP OnFlush(DWORD) CV_OVERRIDE { return S_OK; } HRESULT Wait(DWORD dwMilliseconds, _ComPtr& mediaSample, LONGLONG& sampleTimestamp, BOOL& pbEOS) { pbEOS = FALSE; for (;;) { { cv::AutoLock lock(m_mutex); pbEOS = m_bEOS && m_capturedFrames.empty(); if (pbEOS) return m_hrStatus; if (!m_capturedFrames.empty()) { CV_Assert(!m_capturedFrames.empty()); CapturedFrameInfo frameInfo = m_capturedFrames.front(); m_capturedFrames.pop(); CV_LOG_DEBUG(NULL, "videoio(MSMF): handle frame at " << frameInfo.timestamp); mediaSample = frameInfo.sample; CV_Assert(mediaSample); sampleTimestamp = frameInfo.timestamp; ResetEvent(m_hEvent); // event is auto-reset, but we need this forced reset due time gap between wait() and mutex hold. return frameInfo.hrStatus; } } CV_LOG_DEBUG(NULL, "videoio(MSMF): waiting for frame... "); DWORD dwResult = WaitForSingleObject(m_hEvent, dwMilliseconds); if (dwResult == WAIT_TIMEOUT) { return E_PENDING; } else if (dwResult != WAIT_OBJECT_0) { return HRESULT_FROM_WIN32(GetLastError()); } } } private: // Destructor is private. Caller should call Release. virtual ~SourceReaderCB() { CV_LOG_INFO(NULL, "terminating async callback"); } public: long m_nRefCount; // Reference count. cv::Mutex m_mutex; HANDLE m_hEvent; BOOL m_bEOS; HRESULT m_hrStatus; IMFSourceReader *m_reader; DWORD m_dwStreamIndex; struct CapturedFrameInfo { LONGLONG timestamp; _ComPtr sample; HRESULT hrStatus; }; std::queue m_capturedFrames; }; //================================================================================================== // Enumerate and store supported formats and finds format which is most similar to the one requested class FormatStorage { public: struct MediaID { DWORD stream; DWORD media; MediaID() : stream(0), media(0) {} void nextStream() { stream++; media = 0; } void nextMedia() { media++; } bool operator<(const MediaID& other) const { return (stream < other.stream) || (stream == other.stream && media < other.media); } }; void read(IMFSourceReader* source) { HRESULT hr = S_OK; MediaID cur; while (SUCCEEDED(hr)) { _ComPtr raw_type; hr = source->GetNativeMediaType(cur.stream, cur.media, &raw_type); if (hr == MF_E_NO_MORE_TYPES) { hr = S_OK; cur.nextStream(); } else if (SUCCEEDED(hr)) { formats[cur] = MediaType(raw_type.Get()); cur.nextMedia(); } } } std::pair findBestVideoFormat(const MediaType& newType) { std::pair best; std::map::const_iterator i = formats.begin(); for (; i != formats.end(); ++i) { if (i->second.majorType != MFMediaType_Video) continue; if (newType.isEmpty()) // file input - choose first returned media type { best = *i; break; } if (best.second.isEmpty() || i->second.isBetterThan(best.second, newType)) { best = *i; } } return best; } private: std::map formats; }; //================================================================================================== // Enumerates devices and activates one of them class DeviceList { public: DeviceList() : devices(NULL), count(0) {} ~DeviceList() { if (devices) { for (UINT32 i = 0; i < count; ++i) if (devices[i]) devices[i]->Release(); CoTaskMemFree(devices); } } UINT32 read(IID sourceType = MF_DEVSOURCE_ATTRIBUTE_SOURCE_TYPE_VIDCAP_GUID) { _ComPtr attr; if (FAILED(MFCreateAttributes(&attr, 1)) || FAILED(attr->SetGUID(MF_DEVSOURCE_ATTRIBUTE_SOURCE_TYPE, sourceType))) { CV_Error(CV_StsError, "Failed to create attributes"); } if (FAILED(MFEnumDeviceSources(attr.Get(), &devices, &count))) { CV_LOG_DEBUG(NULL, "Failed to enumerate MSMF devices"); return 0; } return count; } _ComPtr activateSource(UINT32 index) { _ComPtr result; if (count == 0 || index >= count || FAILED(devices[index]->ActivateObject(__uuidof(IMFMediaSource), (void**)&result))) { CV_LOG_DEBUG(NULL, "Failed to activate media source (device " << index << ")"); } return result; } private: IMFActivate** devices; UINT32 count; }; } // namespace:: //================================================================================================== /******* Capturing video from camera or file via Microsoft Media Foundation **********/ class CvCapture_MSMF : public cv::IVideoCapture { public: typedef enum { MODE_SW = 0, MODE_HW = 1 } MSMFCapture_Mode; CvCapture_MSMF(); virtual ~CvCapture_MSMF(); virtual bool open(int); virtual bool open(const cv::String&); virtual void close(); virtual double getProperty(int) const CV_OVERRIDE; virtual bool setProperty(int, double) CV_OVERRIDE; virtual bool grabFrame() CV_OVERRIDE; virtual bool retrieveFrame(int, cv::OutputArray) CV_OVERRIDE; virtual bool isOpened() const CV_OVERRIDE { return isOpen; } virtual int getCaptureDomain() CV_OVERRIDE { return CV_CAP_MSMF; } protected: bool configureOutput(MediaType newType, cv::uint32_t outFormat); bool setTime(double time, bool rough); bool configureHW(bool enable); template bool readComplexPropery(long prop, long& val) const; template bool writeComplexProperty(long prop, double val, long flags); _ComPtr getDefaultSourceConfig(UINT32 num = 10); bool initStream(DWORD streamID, const MediaType& mt); Media_Foundation& MF; cv::String filename; int camid; MSMFCapture_Mode captureMode; #ifdef HAVE_MSMF_DXVA _ComPtr D3DDev; _ComPtr D3DMgr; #endif _ComPtr videoFileSource; DWORD dwStreamIndex; MediaType nativeFormat; MediaType captureFormat; int outputFormat; bool convertFormat; MFTIME duration; LONGLONG frameStep; _ComPtr videoSample; LONGLONG sampleTime; bool isOpen; _ComPtr readCallback; // non-NULL for "live" streams (camera capture) }; CvCapture_MSMF::CvCapture_MSMF(): MF(Media_Foundation::getInstance()), filename(""), camid(-1), captureMode(MODE_SW), #ifdef HAVE_MSMF_DXVA D3DDev(NULL), D3DMgr(NULL), #endif videoFileSource(NULL), videoSample(NULL), outputFormat(CV_CAP_MODE_BGR), convertFormat(true), sampleTime(0), isOpen(false) { configureHW(true); } CvCapture_MSMF::~CvCapture_MSMF() { close(); configureHW(false); } void CvCapture_MSMF::close() { if (isOpen) { isOpen = false; videoSample.Release(); videoFileSource.Release(); camid = -1; filename.clear(); } readCallback.Release(); } bool CvCapture_MSMF::initStream(DWORD streamID, const MediaType& mt) { CV_LOG_DEBUG(NULL, "Init stream " << streamID << " with MediaType " << mt); _ComPtr mediaTypeOut = mt.createMediaType(); if (FAILED(videoFileSource->SetStreamSelection((DWORD)MF_SOURCE_READER_ALL_STREAMS, false))) { CV_LOG_WARNING(NULL, "Failed to reset streams"); return false; } if (FAILED(videoFileSource->SetStreamSelection(streamID, true))) { CV_LOG_WARNING(NULL, "Failed to select stream " << streamID); return false; } HRESULT hr = videoFileSource->SetCurrentMediaType(streamID, NULL, mediaTypeOut.Get()); if (hr == MF_E_TOPO_CODEC_NOT_FOUND) { CV_LOG_WARNING(NULL, "Failed to set mediaType (stream " << streamID << ", " << mt << "(codec not found)"); return false; } else if (hr == MF_E_INVALIDMEDIATYPE) { CV_LOG_WARNING(NULL, "Failed to set mediaType (stream " << streamID << ", " << mt << "(unsupported media type)"); return false; } else if (FAILED(hr)) { CV_LOG_WARNING(NULL, "Failed to set mediaType (stream " << streamID << ", " << mt << "(HRESULT " << hr << ")"); return false; } captureFormat = mt; return true; } _ComPtr CvCapture_MSMF::getDefaultSourceConfig(UINT32 num) { CV_Assert(num > 0); _ComPtr res; if (FAILED(MFCreateAttributes(&res, num)) || FAILED(res->SetUINT32(MF_READWRITE_ENABLE_HARDWARE_TRANSFORMS, true)) || FAILED(res->SetUINT32(MF_SOURCE_READER_DISABLE_DXVA, false)) || FAILED(res->SetUINT32(MF_SOURCE_READER_ENABLE_VIDEO_PROCESSING, false)) || FAILED(res->SetUINT32(MF_SOURCE_READER_ENABLE_ADVANCED_VIDEO_PROCESSING, true)) ) { CV_Error(CV_StsError, "Failed to create attributes"); } #ifdef HAVE_MSMF_DXVA if (D3DMgr) { if (FAILED(res->SetUnknown(MF_SOURCE_READER_D3D_MANAGER, D3DMgr.Get()))) { CV_Error(CV_StsError, "Failed to create attributes"); } } #endif return res; } bool CvCapture_MSMF::configureHW(bool enable) { #ifdef HAVE_MSMF_DXVA if ((enable && D3DMgr && D3DDev) || (!enable && !D3DMgr && !D3DDev)) return true; if (!pMFCreateDXGIDeviceManager_initialized) init_MFCreateDXGIDeviceManager(); if (enable && !pMFCreateDXGIDeviceManager) return false; bool reopen = isOpen; int prevcam = camid; cv::String prevfile = filename; close(); if (enable) { D3D_FEATURE_LEVEL levels[] = { D3D_FEATURE_LEVEL_11_1, D3D_FEATURE_LEVEL_11_0, D3D_FEATURE_LEVEL_10_1, D3D_FEATURE_LEVEL_10_0, D3D_FEATURE_LEVEL_9_3, D3D_FEATURE_LEVEL_9_2, D3D_FEATURE_LEVEL_9_1 }; if (SUCCEEDED(D3D11CreateDevice(NULL, D3D_DRIVER_TYPE_HARDWARE, NULL, D3D11_CREATE_DEVICE_BGRA_SUPPORT | D3D11_CREATE_DEVICE_VIDEO_SUPPORT, levels, sizeof(levels) / sizeof(*levels), D3D11_SDK_VERSION, &D3DDev, NULL, NULL))) { // NOTE: Getting ready for multi-threaded operation _ComPtr D3DDevMT; UINT mgrRToken; if (SUCCEEDED(D3DDev->QueryInterface(IID_PPV_ARGS(&D3DDevMT)))) { D3DDevMT->SetMultithreadProtected(TRUE); D3DDevMT.Release(); if (SUCCEEDED(pMFCreateDXGIDeviceManager(&mgrRToken, &D3DMgr))) { if (SUCCEEDED(D3DMgr->ResetDevice(D3DDev.Get(), mgrRToken))) { captureMode = MODE_HW; return reopen ? (prevcam >= 0 ? open(prevcam) : open(prevfile.c_str())) : true; } D3DMgr.Release(); } } D3DDev.Release(); } return false; } else { if (D3DMgr) D3DMgr.Release(); if (D3DDev) D3DDev.Release(); captureMode = MODE_SW; return reopen ? (prevcam >= 0 ? open(prevcam) : open(prevfile.c_str())) : true; } #else return !enable; #endif } bool CvCapture_MSMF::configureOutput(MediaType newType, cv::uint32_t outFormat) { FormatStorage formats; formats.read(videoFileSource.Get()); std::pair bestMatch = formats.findBestVideoFormat(newType); if (bestMatch.second.isEmpty()) { CV_LOG_DEBUG(NULL, "Can not find video stream with requested parameters"); return false; } dwStreamIndex = bestMatch.first.stream; nativeFormat = bestMatch.second; MediaType newFormat = nativeFormat; if (convertFormat) { switch (outFormat) { case CV_CAP_MODE_BGR: case CV_CAP_MODE_RGB: newFormat.subType = captureMode == MODE_HW ? MFVideoFormat_RGB32 : MFVideoFormat_RGB24; newFormat.stride = (captureMode == MODE_HW ? 4 : 3) * newFormat.width; newFormat.sampleSize = newFormat.stride * newFormat.height; break; case CV_CAP_MODE_GRAY: newFormat.subType = MFVideoFormat_YUY2; newFormat.stride = newFormat.width; newFormat.sampleSize = newFormat.stride * newFormat.height * 3 / 2; break; case CV_CAP_MODE_YUYV: newFormat.subType = MFVideoFormat_YUY2; newFormat.stride = 2 * newFormat.width; newFormat.sampleSize = newFormat.stride * newFormat.height; break; default: return false; } newFormat.interlaceMode = MFVideoInterlace_Progressive; newFormat.isFixedSize = true; if (nativeFormat.subType == MFVideoFormat_MP43) //Unable to estimate FPS for MP43 newFormat.frameRateNum = 0; } // we select native format first and then our requested format (related issue #12822) if (!newType.isEmpty()) // camera input initStream(dwStreamIndex, nativeFormat); return initStream(dwStreamIndex, newFormat); } bool CvCapture_MSMF::open(int index) { close(); if (index < 0) return false; DeviceList devices; UINT32 count = devices.read(); if (count == 0 || static_cast(index) > count) { CV_LOG_DEBUG(NULL, "Device " << index << " not found (total " << count << " devices)"); return false; } _ComPtr attr = getDefaultSourceConfig(); _ComPtr cb = new SourceReaderCB(); attr->SetUnknown(MF_SOURCE_READER_ASYNC_CALLBACK, cb.Get()); _ComPtr src = devices.activateSource(index); if (!src.Get() || FAILED(MFCreateSourceReaderFromMediaSource(src.Get(), attr.Get(), &videoFileSource))) { CV_LOG_DEBUG(NULL, "Failed to create source reader"); return false; } isOpen = true; camid = index; readCallback = cb; duration = 0; if (configureOutput(MediaType::createDefault(), outputFormat)) { frameStep = captureFormat.getFrameStep(); } return isOpen; } bool CvCapture_MSMF::open(const cv::String& _filename) { close(); if (_filename.empty()) return false; // Set source reader parameters _ComPtr attr = getDefaultSourceConfig(); cv::AutoBuffer unicodeFileName(_filename.length() + 1); MultiByteToWideChar(CP_ACP, 0, _filename.c_str(), -1, unicodeFileName.data(), (int)_filename.length() + 1); if (SUCCEEDED(MFCreateSourceReaderFromURL(unicodeFileName.data(), attr.Get(), &videoFileSource))) { isOpen = true; sampleTime = 0; if (configureOutput(MediaType(), outputFormat)) { frameStep = captureFormat.getFrameStep(); filename = _filename; PROPVARIANT var; HRESULT hr; if (SUCCEEDED(hr = videoFileSource->GetPresentationAttribute((DWORD)MF_SOURCE_READER_MEDIASOURCE, MF_PD_DURATION, &var)) && var.vt == VT_UI8) { duration = var.uhVal.QuadPart; PropVariantClear(&var); } else duration = 0; } } return isOpen; } bool CvCapture_MSMF::grabFrame() { CV_TRACE_FUNCTION(); if (readCallback) // async "live" capture mode { HRESULT hr = 0; SourceReaderCB* reader = ((SourceReaderCB*)readCallback.Get()); if (!reader->m_reader) { // Initiate capturing with async callback reader->m_reader = videoFileSource.Get(); reader->m_dwStreamIndex = dwStreamIndex; if (FAILED(hr = videoFileSource->ReadSample(dwStreamIndex, 0, NULL, NULL, NULL, NULL))) { CV_LOG_ERROR(NULL, "videoio(MSMF): can't grab frame - initial async ReadSample() call failed: " << hr); reader->m_reader = NULL; return false; } } BOOL bEOS = false; if (FAILED(hr = reader->Wait(10000, videoSample, sampleTime, bEOS))) // 10 sec { CV_LOG_WARNING(NULL, "videoio(MSMF): can't grab frame. Error: " << hr); return false; } if (bEOS) { CV_LOG_WARNING(NULL, "videoio(MSMF): EOS signal. Capture stream is lost"); return false; } CV_LOG_DEBUG(NULL, "videoio(MSMF): grabbed frame " << sampleTime); return true; } else if (isOpen) { DWORD streamIndex, flags; videoSample.Release(); HRESULT hr; for(;;) { CV_TRACE_REGION("ReadSample"); if (!SUCCEEDED(hr = videoFileSource->ReadSample( dwStreamIndex, // Stream index. 0, // Flags. &streamIndex, // Receives the actual stream index. &flags, // Receives status flags. &sampleTime, // Receives the time stamp. &videoSample // Receives the sample or NULL. ))) break; if (streamIndex != dwStreamIndex) break; if (flags & (MF_SOURCE_READERF_ERROR | MF_SOURCE_READERF_ALLEFFECTSREMOVED | MF_SOURCE_READERF_ENDOFSTREAM)) break; if (videoSample) break; if (flags & MF_SOURCE_READERF_STREAMTICK) { CV_LOG_DEBUG(NULL, "videoio(MSMF): Stream tick detected. Retrying to grab the frame"); } } if (SUCCEEDED(hr)) { if (streamIndex != dwStreamIndex) { CV_LOG_DEBUG(NULL, "videoio(MSMF): Wrong stream read. Abort capturing"); close(); } else if (flags & MF_SOURCE_READERF_ERROR) { CV_LOG_DEBUG(NULL, "videoio(MSMF): Stream reading error. Abort capturing"); close(); } else if (flags & MF_SOURCE_READERF_ALLEFFECTSREMOVED) { CV_LOG_DEBUG(NULL, "videoio(MSMF): Stream decoding error. Abort capturing"); close(); } else if (flags & MF_SOURCE_READERF_ENDOFSTREAM) { sampleTime += frameStep; CV_LOG_DEBUG(NULL, "videoio(MSMF): End of stream detected"); } else { sampleTime += frameStep; if (flags & MF_SOURCE_READERF_NEWSTREAM) { CV_LOG_DEBUG(NULL, "videoio(MSMF): New stream detected"); } if (flags & MF_SOURCE_READERF_NATIVEMEDIATYPECHANGED) { CV_LOG_DEBUG(NULL, "videoio(MSMF): Stream native media type changed"); } if (flags & MF_SOURCE_READERF_CURRENTMEDIATYPECHANGED) { CV_LOG_DEBUG(NULL, "videoio(MSMF): Stream current media type changed"); } return true; } } } return false; } bool CvCapture_MSMF::retrieveFrame(int, cv::OutputArray frame) { CV_TRACE_FUNCTION(); CV_LOG_DEBUG(NULL, "videoio(MSMF): retrieve video frame start..."); do { if (!videoSample) break; _ComPtr buf = NULL; CV_TRACE_REGION("get_contiguous_buffer"); if (!SUCCEEDED(videoSample->ConvertToContiguousBuffer(&buf))) { CV_TRACE_REGION("get_buffer"); DWORD bcnt = 0; if (!SUCCEEDED(videoSample->GetBufferCount(&bcnt))) break; if (bcnt == 0) break; if (!SUCCEEDED(videoSample->GetBufferByIndex(0, &buf))) break; } bool lock2d = false; BYTE* ptr = NULL; LONG pitch = 0; DWORD maxsize = 0, cursize = 0; // "For 2-D buffers, the Lock2D method is more efficient than the Lock method" // see IMFMediaBuffer::Lock method documentation: https://msdn.microsoft.com/en-us/library/windows/desktop/bb970366(v=vs.85).aspx _ComPtr buffer2d; if (convertFormat) { if (SUCCEEDED(buf.As(buffer2d))) { CV_TRACE_REGION_NEXT("lock2d"); if (SUCCEEDED(buffer2d->Lock2D(&ptr, &pitch))) { lock2d = true; } } } if (ptr == NULL) { CV_Assert(lock2d == false); CV_TRACE_REGION_NEXT("lock"); if (!SUCCEEDED(buf->Lock(&ptr, &maxsize, &cursize))) { break; } } if (!ptr) break; if (convertFormat) { if (lock2d || (unsigned int)cursize == captureFormat.sampleSize) { switch (outputFormat) { case CV_CAP_MODE_YUYV: cv::Mat(captureFormat.height, captureFormat.width, CV_8UC2, ptr, pitch).copyTo(frame); break; case CV_CAP_MODE_BGR: if (captureMode == MODE_HW) cv::cvtColor(cv::Mat(captureFormat.height, captureFormat.width, CV_8UC4, ptr, pitch), frame, cv::COLOR_BGRA2BGR); else cv::Mat(captureFormat.height, captureFormat.width, CV_8UC3, ptr, pitch).copyTo(frame); break; case CV_CAP_MODE_RGB: if (captureMode == MODE_HW) cv::cvtColor(cv::Mat(captureFormat.height, captureFormat.width, CV_8UC4, ptr, pitch), frame, cv::COLOR_BGRA2BGR); else cv::cvtColor(cv::Mat(captureFormat.height, captureFormat.width, CV_8UC3, ptr, pitch), frame, cv::COLOR_BGR2RGB); break; case CV_CAP_MODE_GRAY: cv::Mat(captureFormat.height, captureFormat.width, CV_8UC1, ptr, pitch).copyTo(frame); break; default: frame.release(); break; } } else frame.release(); } else { cv::Mat(1, cursize, CV_8UC1, ptr, pitch).copyTo(frame); } CV_TRACE_REGION_NEXT("unlock"); if (lock2d) buffer2d->Unlock2D(); else buf->Unlock(); CV_LOG_DEBUG(NULL, "videoio(MSMF): retrieve video frame done!"); return !frame.empty(); } while (0); frame.release(); return false; } bool CvCapture_MSMF::setTime(double time, bool rough) { PROPVARIANT var; if (SUCCEEDED(videoFileSource->GetPresentationAttribute((DWORD)MF_SOURCE_READER_MEDIASOURCE, MF_SOURCE_READER_MEDIASOURCE_CHARACTERISTICS, &var)) && var.vt == VT_UI4 && var.ulVal & MFMEDIASOURCE_CAN_SEEK) { videoSample.Release(); bool useGrabbing = time > 0 && !rough && !(var.ulVal & MFMEDIASOURCE_HAS_SLOW_SEEK); PropVariantClear(&var); sampleTime = (useGrabbing && time >= frameStep) ? (LONGLONG)floor(time + 0.5) - frameStep : (LONGLONG)floor(time + 0.5); var.vt = VT_I8; var.hVal.QuadPart = sampleTime; bool resOK = SUCCEEDED(videoFileSource->SetCurrentPosition(GUID_NULL, var)); PropVariantClear(&var); if (resOK && useGrabbing) { LONGLONG timeborder = (LONGLONG)floor(time + 0.5) - frameStep / 2; do { resOK = grabFrame(); videoSample.Release(); } while (resOK && sampleTime < timeborder); } return resOK; } return false; } template bool CvCapture_MSMF::readComplexPropery(long prop, long & val) const { _ComPtr ctrl; if (FAILED(videoFileSource->GetServiceForStream((DWORD)MF_SOURCE_READER_MEDIASOURCE, GUID_NULL, IID_PPV_ARGS(&ctrl)))) { CV_LOG_DEBUG(NULL, "Failed to get service for stream"); return false; } long paramVal, paramFlag; if (FAILED(ctrl->Get(prop, ¶mVal, ¶mFlag))) { CV_LOG_DEBUG(NULL, "Failed to get property " << prop); // we continue } // fallback - get default value long minVal, maxVal, stepVal; if (FAILED(ctrl->GetRange(prop, &minVal, &maxVal, &stepVal, ¶mVal, ¶mFlag))) { CV_LOG_DEBUG(NULL, "Failed to get default value for property " << prop); return false; } val = paramVal; return true; } double CvCapture_MSMF::getProperty( int property_id ) const { long cVal = 0; if (isOpen) switch (property_id) { case CV_CAP_PROP_FORMAT: return outputFormat; case CV_CAP_PROP_MODE: return captureMode; case CV_CAP_PROP_CONVERT_RGB: return convertFormat ? 1 : 0; case CV_CAP_PROP_SAR_NUM: return captureFormat.aspectRatioNum; case CV_CAP_PROP_SAR_DEN: return captureFormat.aspectRatioDenom; case CV_CAP_PROP_FRAME_WIDTH: return captureFormat.width; case CV_CAP_PROP_FRAME_HEIGHT: return captureFormat.height; case CV_CAP_PROP_FOURCC: return captureFormat.subType.Data1; case CV_CAP_PROP_FPS: return captureFormat.getFramerate(); case CV_CAP_PROP_FRAME_COUNT: if (duration != 0) return floor(((double)duration / 1e7)* captureFormat.getFramerate() + 0.5); else break; case CV_CAP_PROP_POS_FRAMES: return floor(((double)sampleTime / 1e7)* captureFormat.getFramerate() + 0.5); case CV_CAP_PROP_POS_MSEC: return (double)sampleTime / 1e4; case CV_CAP_PROP_POS_AVI_RATIO: if (duration != 0) return (double)sampleTime / duration; else break; case CV_CAP_PROP_BRIGHTNESS: if (readComplexPropery(VideoProcAmp_Brightness, cVal)) return cVal; break; case CV_CAP_PROP_CONTRAST: if (readComplexPropery(VideoProcAmp_Contrast, cVal)) return cVal; break; case CV_CAP_PROP_SATURATION: if (readComplexPropery(VideoProcAmp_Saturation, cVal)) return cVal; break; case CV_CAP_PROP_HUE: if (readComplexPropery(VideoProcAmp_Hue, cVal)) return cVal; break; case CV_CAP_PROP_GAIN: if (readComplexPropery(VideoProcAmp_Gain, cVal)) return cVal; break; case CV_CAP_PROP_SHARPNESS: if (readComplexPropery(VideoProcAmp_Sharpness, cVal)) return cVal; break; case CV_CAP_PROP_GAMMA: if (readComplexPropery(VideoProcAmp_Gamma, cVal)) return cVal; break; case CV_CAP_PROP_BACKLIGHT: if (readComplexPropery(VideoProcAmp_BacklightCompensation, cVal)) return cVal; break; case CV_CAP_PROP_MONOCHROME: if (readComplexPropery(VideoProcAmp_ColorEnable, cVal)) return cVal == 0 ? 1 : 0; break; case CV_CAP_PROP_TEMPERATURE: if (readComplexPropery(VideoProcAmp_WhiteBalance, cVal)) return cVal; break; case CV_CAP_PROP_PAN: if (readComplexPropery(CameraControl_Pan, cVal)) return cVal; break; case CV_CAP_PROP_TILT: if (readComplexPropery(CameraControl_Tilt, cVal)) return cVal; break; case CV_CAP_PROP_ROLL: if (readComplexPropery(CameraControl_Roll, cVal)) return cVal; break; case CV_CAP_PROP_IRIS: if (readComplexPropery(CameraControl_Iris, cVal)) return cVal; break; case CV_CAP_PROP_EXPOSURE: case CV_CAP_PROP_AUTO_EXPOSURE: if (readComplexPropery(CameraControl_Exposure, cVal)) { if (property_id == CV_CAP_PROP_EXPOSURE) return cVal; else return cVal == VideoProcAmp_Flags_Auto; } break; case CV_CAP_PROP_ZOOM: if (readComplexPropery(CameraControl_Zoom, cVal)) return cVal; break; case CV_CAP_PROP_FOCUS: case CV_CAP_PROP_AUTOFOCUS: if (readComplexPropery(CameraControl_Focus, cVal)) { if (property_id == CV_CAP_PROP_FOCUS) return cVal; else return cVal == VideoProcAmp_Flags_Auto; } break; case CV_CAP_PROP_WHITE_BALANCE_BLUE_U: case CV_CAP_PROP_WHITE_BALANCE_RED_V: case CV_CAP_PROP_RECTIFICATION: case CV_CAP_PROP_TRIGGER: case CV_CAP_PROP_TRIGGER_DELAY: case CV_CAP_PROP_GUID: case CV_CAP_PROP_ISO_SPEED: case CV_CAP_PROP_SETTINGS: case CV_CAP_PROP_BUFFERSIZE: default: break; } return -1; } template bool CvCapture_MSMF::writeComplexProperty(long prop, double val, long flags) { _ComPtr ctrl; if (FAILED(videoFileSource->GetServiceForStream((DWORD)MF_SOURCE_READER_MEDIASOURCE, GUID_NULL, IID_PPV_ARGS(&ctrl)))) { CV_LOG_DEBUG(NULL, "Failed get service for stream"); return false; } if (FAILED(ctrl->Set(prop, (long)val, flags))) { CV_LOG_DEBUG(NULL, "Failed to set property " << prop); return false; } return true; } bool CvCapture_MSMF::setProperty( int property_id, double value ) { MediaType newFormat = captureFormat; if (isOpen) switch (property_id) { case CV_CAP_PROP_MODE: switch ((MSMFCapture_Mode)((int)value)) { case MODE_SW: return configureHW(false); case MODE_HW: return configureHW(true); default: return false; } case CV_CAP_PROP_FORMAT: return configureOutput(newFormat, (int)cvRound(value)); case CV_CAP_PROP_CONVERT_RGB: convertFormat = (value != 0); return configureOutput(newFormat, outputFormat); case CV_CAP_PROP_SAR_NUM: if (value > 0) { newFormat.aspectRatioNum = (UINT32)cvRound(value); return configureOutput(newFormat, outputFormat); } break; case CV_CAP_PROP_SAR_DEN: if (value > 0) { newFormat.aspectRatioDenom = (UINT32)cvRound(value); return configureOutput(newFormat, outputFormat); } break; case CV_CAP_PROP_FRAME_WIDTH: if (value >= 0) { newFormat.width = (UINT32)cvRound(value); return configureOutput(newFormat, outputFormat); } break; case CV_CAP_PROP_FRAME_HEIGHT: if (value >= 0) { newFormat.height = (UINT32)cvRound(value); return configureOutput(newFormat, outputFormat); } break; case CV_CAP_PROP_FPS: if (value >= 0) { newFormat.setFramerate(value); return configureOutput(newFormat, outputFormat); } break; case CV_CAP_PROP_FOURCC: break; case CV_CAP_PROP_FRAME_COUNT: break; case CV_CAP_PROP_POS_AVI_RATIO: if (duration != 0) return setTime(duration * value, true); break; case CV_CAP_PROP_POS_FRAMES: if (std::fabs(captureFormat.getFramerate()) > 0) return setTime(value * 1e7 / captureFormat.getFramerate(), false); break; case CV_CAP_PROP_POS_MSEC: return setTime(value * 1e4, false); case CV_CAP_PROP_BRIGHTNESS: return writeComplexProperty(VideoProcAmp_Brightness, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_CONTRAST: return writeComplexProperty(VideoProcAmp_Contrast, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_SATURATION: return writeComplexProperty(VideoProcAmp_Saturation, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_HUE: return writeComplexProperty(VideoProcAmp_Hue, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_GAIN: return writeComplexProperty(VideoProcAmp_Gain, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_SHARPNESS: return writeComplexProperty(VideoProcAmp_Sharpness, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_GAMMA: return writeComplexProperty(VideoProcAmp_Gamma, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_BACKLIGHT: return writeComplexProperty(VideoProcAmp_BacklightCompensation, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_MONOCHROME: return writeComplexProperty(VideoProcAmp_ColorEnable, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_TEMPERATURE: return writeComplexProperty(VideoProcAmp_WhiteBalance, value, VideoProcAmp_Flags_Manual); case CV_CAP_PROP_PAN: return writeComplexProperty(CameraControl_Pan, value, CameraControl_Flags_Manual); case CV_CAP_PROP_TILT: return writeComplexProperty(CameraControl_Tilt, value, CameraControl_Flags_Manual); case CV_CAP_PROP_ROLL: return writeComplexProperty(CameraControl_Roll, value, CameraControl_Flags_Manual); case CV_CAP_PROP_IRIS: return writeComplexProperty(CameraControl_Iris, value, CameraControl_Flags_Manual); case CV_CAP_PROP_EXPOSURE: return writeComplexProperty(CameraControl_Exposure, value, CameraControl_Flags_Manual); case CV_CAP_PROP_AUTO_EXPOSURE: return writeComplexProperty(CameraControl_Exposure, value, value != 0 ? VideoProcAmp_Flags_Auto : VideoProcAmp_Flags_Manual); case CV_CAP_PROP_ZOOM: return writeComplexProperty(CameraControl_Zoom, value, CameraControl_Flags_Manual); case CV_CAP_PROP_FOCUS: return writeComplexProperty(CameraControl_Focus, value, CameraControl_Flags_Manual); case CV_CAP_PROP_AUTOFOCUS: return writeComplexProperty(CameraControl_Focus, value, value != 0 ? CameraControl_Flags_Auto : CameraControl_Flags_Manual); case CV_CAP_PROP_WHITE_BALANCE_BLUE_U: case CV_CAP_PROP_WHITE_BALANCE_RED_V: case CV_CAP_PROP_RECTIFICATION: case CV_CAP_PROP_TRIGGER: case CV_CAP_PROP_TRIGGER_DELAY: case CV_CAP_PROP_GUID: case CV_CAP_PROP_ISO_SPEED: case CV_CAP_PROP_SETTINGS: case CV_CAP_PROP_BUFFERSIZE: default: break; } return false; } cv::Ptr cv::cvCreateCapture_MSMF( int index ) { cv::Ptr capture = cv::makePtr(); if (capture) { capture->open(index); if (capture->isOpened()) return capture; } return cv::Ptr(); } cv::Ptr cv::cvCreateCapture_MSMF (const cv::String& filename) { cv::Ptr capture = cv::makePtr(); if (capture) { capture->open(filename); if (capture->isOpened()) return capture; } return cv::Ptr(); } // // // Media Foundation-based Video Writer // // class CvVideoWriter_MSMF : public cv::IVideoWriter { public: CvVideoWriter_MSMF(); virtual ~CvVideoWriter_MSMF(); virtual bool open(const cv::String& filename, int fourcc, double fps, cv::Size frameSize, bool isColor); virtual void close(); virtual void write(cv::InputArray); virtual double getProperty(int) const { return 0; } virtual bool setProperty(int, double) { return false; } virtual bool isOpened() const { return initiated; } int getCaptureDomain() const CV_OVERRIDE { return cv::CAP_MSMF; } private: Media_Foundation& MF; UINT32 videoWidth; UINT32 videoHeight; double fps; UINT32 bitRate; UINT32 frameSize; GUID encodingFormat; GUID inputFormat; DWORD streamIndex; _ComPtr sinkWriter; bool initiated; LONGLONG rtStart; UINT64 rtDuration; static const GUID FourCC2GUID(int fourcc); }; CvVideoWriter_MSMF::CvVideoWriter_MSMF(): MF(Media_Foundation::getInstance()), videoWidth(0), videoHeight(0), fps(0), bitRate(0), frameSize(0), encodingFormat(), inputFormat(), streamIndex(0), initiated(false), rtStart(0), rtDuration(0) { } CvVideoWriter_MSMF::~CvVideoWriter_MSMF() { close(); } const GUID CvVideoWriter_MSMF::FourCC2GUID(int fourcc) { switch(fourcc) { case CV_FOURCC_MACRO('d', 'v', '2', '5'): return MFVideoFormat_DV25; break; case CV_FOURCC_MACRO('d', 'v', '5', '0'): return MFVideoFormat_DV50; break; case CV_FOURCC_MACRO('d', 'v', 'c', ' '): return MFVideoFormat_DVC; break; case CV_FOURCC_MACRO('d', 'v', 'h', '1'): return MFVideoFormat_DVH1; break; case CV_FOURCC_MACRO('d', 'v', 'h', 'd'): return MFVideoFormat_DVHD; break; case CV_FOURCC_MACRO('d', 'v', 's', 'd'): return MFVideoFormat_DVSD; break; case CV_FOURCC_MACRO('d', 'v', 's', 'l'): return MFVideoFormat_DVSL; break; #if (WINVER >= 0x0602) case CV_FOURCC_MACRO('H', '2', '6', '3'): // Available only for Win 8 target. return MFVideoFormat_H263; break; #endif case CV_FOURCC_MACRO('H', '2', '6', '4'): return MFVideoFormat_H264; break; case CV_FOURCC_MACRO('M', '4', 'S', '2'): return MFVideoFormat_M4S2; break; case CV_FOURCC_MACRO('M', 'J', 'P', 'G'): return MFVideoFormat_MJPG; break; case CV_FOURCC_MACRO('M', 'P', '4', '3'): return MFVideoFormat_MP43; break; case CV_FOURCC_MACRO('M', 'P', '4', 'S'): return MFVideoFormat_MP4S; break; case CV_FOURCC_MACRO('M', 'P', '4', 'V'): return MFVideoFormat_MP4V; break; case CV_FOURCC_MACRO('M', 'P', 'G', '1'): return MFVideoFormat_MPG1; break; case CV_FOURCC_MACRO('M', 'S', 'S', '1'): return MFVideoFormat_MSS1; break; case CV_FOURCC_MACRO('M', 'S', 'S', '2'): return MFVideoFormat_MSS2; break; case CV_FOURCC_MACRO('W', 'M', 'V', '1'): return MFVideoFormat_WMV1; break; case CV_FOURCC_MACRO('W', 'M', 'V', '2'): return MFVideoFormat_WMV2; break; case CV_FOURCC_MACRO('W', 'M', 'V', '3'): return MFVideoFormat_WMV3; break; case CV_FOURCC_MACRO('W', 'V', 'C', '1'): return MFVideoFormat_WVC1; break; default: return MFVideoFormat_H264; } } bool CvVideoWriter_MSMF::open( const cv::String& filename, int fourcc, double _fps, cv::Size _frameSize, bool /*isColor*/ ) { if (initiated) close(); videoWidth = _frameSize.width; videoHeight = _frameSize.height; fps = _fps; bitRate = (UINT32)fps*videoWidth*videoHeight; // 1-bit per pixel encodingFormat = FourCC2GUID(fourcc); inputFormat = MFVideoFormat_RGB32; _ComPtr mediaTypeOut; _ComPtr mediaTypeIn; _ComPtr spAttr; if (// Set the output media type. SUCCEEDED(MFCreateMediaType(&mediaTypeOut)) && SUCCEEDED(mediaTypeOut->SetGUID(MF_MT_MAJOR_TYPE, MFMediaType_Video)) && SUCCEEDED(mediaTypeOut->SetGUID(MF_MT_SUBTYPE, encodingFormat)) && SUCCEEDED(mediaTypeOut->SetUINT32(MF_MT_AVG_BITRATE, bitRate)) && SUCCEEDED(mediaTypeOut->SetUINT32(MF_MT_INTERLACE_MODE, MFVideoInterlace_Progressive)) && SUCCEEDED(MFSetAttributeSize(mediaTypeOut.Get(), MF_MT_FRAME_SIZE, videoWidth, videoHeight)) && SUCCEEDED(MFSetAttributeRatio(mediaTypeOut.Get(), MF_MT_FRAME_RATE, (UINT32)(fps * 1000), 1000)) && SUCCEEDED(MFSetAttributeRatio(mediaTypeOut.Get(), MF_MT_PIXEL_ASPECT_RATIO, 1, 1)) && // Set the input media type. SUCCEEDED(MFCreateMediaType(&mediaTypeIn)) && SUCCEEDED(mediaTypeIn->SetGUID(MF_MT_MAJOR_TYPE, MFMediaType_Video)) && SUCCEEDED(mediaTypeIn->SetGUID(MF_MT_SUBTYPE, inputFormat)) && SUCCEEDED(mediaTypeIn->SetUINT32(MF_MT_INTERLACE_MODE, MFVideoInterlace_Progressive)) && SUCCEEDED(mediaTypeIn->SetUINT32(MF_MT_DEFAULT_STRIDE, 4 * videoWidth)) && //Assume BGR32 input SUCCEEDED(MFSetAttributeSize(mediaTypeIn.Get(), MF_MT_FRAME_SIZE, videoWidth, videoHeight)) && SUCCEEDED(MFSetAttributeRatio(mediaTypeIn.Get(), MF_MT_FRAME_RATE, (UINT32)(fps * 1000), 1000)) && SUCCEEDED(MFSetAttributeRatio(mediaTypeIn.Get(), MF_MT_PIXEL_ASPECT_RATIO, 1, 1)) && // Set sink writer parameters SUCCEEDED(MFCreateAttributes(&spAttr, 10)) && SUCCEEDED(spAttr->SetUINT32(MF_READWRITE_ENABLE_HARDWARE_TRANSFORMS, true)) && SUCCEEDED(spAttr->SetUINT32(MF_SINK_WRITER_DISABLE_THROTTLING, true)) ) { // Create the sink writer cv::AutoBuffer unicodeFileName(filename.length() + 1); MultiByteToWideChar(CP_ACP, 0, filename.c_str(), -1, unicodeFileName.data(), (int)filename.length() + 1); HRESULT hr = MFCreateSinkWriterFromURL(unicodeFileName.data(), NULL, spAttr.Get(), &sinkWriter); if (SUCCEEDED(hr)) { // Configure the sink writer and tell it start to start accepting data if (SUCCEEDED(sinkWriter->AddStream(mediaTypeOut.Get(), &streamIndex)) && SUCCEEDED(sinkWriter->SetInputMediaType(streamIndex, mediaTypeIn.Get(), NULL)) && SUCCEEDED(sinkWriter->BeginWriting())) { initiated = true; rtStart = 0; MFFrameRateToAverageTimePerFrame((UINT32)(fps * 1000), 1000, &rtDuration); return true; } } } return false; } void CvVideoWriter_MSMF::close() { if (initiated) { initiated = false; sinkWriter->Finalize(); sinkWriter.Release(); } } void CvVideoWriter_MSMF::write(cv::InputArray img) { if (img.empty() || (img.channels() != 1 && img.channels() != 3 && img.channels() != 4) || (UINT32)img.cols() != videoWidth || (UINT32)img.rows() != videoHeight) return; const LONG cbWidth = 4 * videoWidth; const DWORD cbBuffer = cbWidth * videoHeight; _ComPtr sample; _ComPtr buffer; BYTE *pData = NULL; // Prepare a media sample. if (SUCCEEDED(MFCreateSample(&sample)) && // Set sample time stamp and duration. SUCCEEDED(sample->SetSampleTime(rtStart)) && SUCCEEDED(sample->SetSampleDuration(rtDuration)) && // Create a memory buffer. SUCCEEDED(MFCreateMemoryBuffer(cbBuffer, &buffer)) && // Set the data length of the buffer. SUCCEEDED(buffer->SetCurrentLength(cbBuffer)) && // Add the buffer to the sample. SUCCEEDED(sample->AddBuffer(buffer.Get())) && // Lock the buffer. SUCCEEDED(buffer->Lock(&pData, NULL, NULL))) { // Copy the video frame to the buffer. cv::cvtColor(img.getMat(), cv::Mat(videoHeight, videoWidth, CV_8UC4, pData, cbWidth), img.channels() > 1 ? cv::COLOR_BGR2BGRA : cv::COLOR_GRAY2BGRA); buffer->Unlock(); // Send media sample to the Sink Writer. if (SUCCEEDED(sinkWriter->WriteSample(streamIndex, sample.Get()))) { rtStart += rtDuration; } } } cv::Ptr cv::cvCreateVideoWriter_MSMF( const cv::String& filename, int fourcc, double fps, cv::Size frameSize, int isColor ) { cv::Ptr writer = cv::makePtr(); if (writer) { writer->open(filename, fourcc, fps, frameSize, isColor != 0); if (writer->isOpened()) return writer; } return cv::Ptr(); } #endif