/*M///////////////////////////////////////////////////////////////////////////////////////
//
//  IMPORTANT: READ BEFORE DOWNLOADING, COPYING, INSTALLING OR USING.
//
//  By downloading, copying, installing or using the software you agree to this license.
//  If you do not agree to this license, do not download, install,
//  copy or use the software.
//
//
//                          License Agreement
//                For Open Source Computer Vision Library
//
// Copyright (C) 2000-2008, Intel Corporation, all rights reserved.
// Copyright (C) 2009, Willow Garage Inc., all rights reserved.
// Third party copyrights are property of their respective owners.
//
// Redistribution and use in source and binary forms, with or without modification,
// are permitted provided that the following conditions are met:
//
//   * Redistribution's of source code must retain the above copyright notice,
//     this list of conditions and the following disclaimer.
//
//   * Redistribution's in binary form must reproduce the above copyright notice,
//     this list of conditions and the following disclaimer in the documentation
//     and/or other materials provided with the distribution.
//
//   * The name of the copyright holders may not be used to endorse or promote products
//     derived from this software without specific prior written permission.
//
// This software is provided by the copyright holders and contributors "as is" and
// any express or implied warranties, including, but not limited to, the implied
// warranties of merchantability and fitness for a particular purpose are disclaimed.
// In no event shall the Intel Corporation or contributors be liable for any direct,
// indirect, incidental, special, exemplary, or consequential damages
// (including, but not limited to, procurement of substitute goods or services;
// loss of use, data, or profits; or business interruption) however caused
// and on any theory of liability, whether in contract, strict liability,
// or tort (including negligence or otherwise) arising in any way out of
// the use of this software, even if advised of the possibility of such damage.
//
//M*/

#include "cap_ffmpeg_api.hpp"
44 45 46
#if !(defined(WIN32) || defined(_WIN32) || defined(WINCE))
# include <pthread.h>
#endif
47
#include <assert.h>
48
#include <algorithm>
V
Vadim Pisarevsky 已提交
49
#include <limits>
50

51 52
// Packs a (major, minor, micro) version triple into a single integer
// (major in bits 16 and up, minor in bits 8..15, micro in bits 0..7) so that
// versions can be compared with <, >= etc. in #if expressions.
// Every argument is parenthesized so that expression arguments expand correctly.
#define CALC_FFMPEG_VERSION(a,b,c) ( ((a)<<16) | ((b)<<8) | (c) )

53 54 55 56
#if defined _MSC_VER && _MSC_VER >= 1200
#pragma warning( disable: 4244 4510 4512 4610 )
#endif

A
Andrey Kamaev 已提交
57 58 59 60
#ifdef __GNUC__
#  pragma GCC diagnostic ignored "-Wdeprecated-declarations"
#endif

61 62 63 64
#ifdef __cplusplus
extern "C" {
#endif

65 66
#include "ffmpeg_codecs.hpp"

V
Vadim Pisarevsky 已提交
67 68
#include <libavutil/mathematics.h>

69 70 71 72
#if LIBAVUTIL_BUILD > CALC_FFMPEG_VERSION(51,11,0)
  #include <libavutil/opt.h>
#endif

P
Peter Rekdal Sunde 已提交
73 74 75 76 77
#if LIBAVUTIL_BUILD >= (LIBAVUTIL_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(51, 63, 100) : CALC_FFMPEG_VERSION(54, 6, 0))
#include <libavutil/imgutils.h>
#endif

78 79
#include <libavcodec/avcodec.h>
#include <libswscale/swscale.h>
80 81 82 83 84 85 86 87 88 89 90 91 92 93 94

#ifdef __cplusplus
}
#endif

#if defined _MSC_VER && _MSC_VER >= 1200
#pragma warning( default: 4244 4510 4512 4610 )
#endif

// CV_WARN(message): diagnostic helper.
// With NDEBUG defined it expands to nothing; otherwise it prints
// "warning: <message> (<file>:<line>)" to stderr. The message is consumed by a
// "%s" conversion, so it has to be a C string.
#ifdef NDEBUG
#define CV_WARN(message)
#else
#define CV_WARN(message) fprintf(stderr, "warning: %s (%s:%d)\n", message, __FILE__, __LINE__)
#endif

95 96
#if defined WIN32 || defined _WIN32
    #include <windows.h>
97 98 99 100 101 102 103
    #if defined _MSC_VER && _MSC_VER < 1900
    struct timespec
    {
        time_t tv_sec;
        long   tv_nsec;
    };
  #endif
104 105 106
#elif defined __linux__ || defined __APPLE__
    #include <unistd.h>
    #include <stdio.h>
V
Vadim Pisarevsky 已提交
107
    #include <sys/types.h>
108
    #include <sys/time.h>
109
#if defined __APPLE__
110
    #include <sys/sysctl.h>
111 112
    #include <mach/clock.h>
    #include <mach/mach.h>
113
#endif
114
#endif
115

V
Vadim Pisarevsky 已提交
116 117 118 119 120 121 122 123 124 125
// Fallback MIN macro, defined only when no MIN exists yet.
// Either argument may be evaluated twice, so avoid arguments with side effects.
#ifndef MIN
#define MIN(a, b) ((a) < (b) ? (a) : (b))
#endif

// AV_NOPTS_VALUE_ is the "no timestamp" sentinel this file compares timestamps against.
// Apple builds spell the value out as a literal; every other build casts FFmpeg's
// AV_NOPTS_VALUE to int64_t.
// NOTE(review): the reason for the Apple-specific literal is not visible here.
#if defined(__APPLE__)
#define AV_NOPTS_VALUE_ ((int64_t)0x8000000000000000LL)
#else
#define AV_NOPTS_VALUE_ ((int64_t)AV_NOPTS_VALUE)
#endif

126 127 128 129
// Supply AVERROR_EOF when the FFmpeg headers in use do not define it.
#ifndef AVERROR_EOF
#define AVERROR_EOF (-MKTAG( 'E','O','F',' '))
#endif

130 131 132 133 134 135 136 137
// Codec-id compatibility shim.
// From libavcodec build 54.25.0 on, CV_CODEC_ID is AVCodecID and CV_CODEC(name)
// pastes an "AV_" prefix onto name; for older builds CV_CODEC_ID is CodecID and
// CV_CODEC(name) yields name unchanged.
#if LIBAVCODEC_BUILD >= CALC_FFMPEG_VERSION(54,25,0)
#  define CV_CODEC_ID AVCodecID
#  define CV_CODEC(name) AV_##name
#else
#  define CV_CODEC_ID CodecID
#  define CV_CODEC(name) name
#endif

J
jisli 已提交
138 139 140 141 142 143 144 145 146 147 148 149 150 151
// Pixel-format compatibility shim.
// For libavutil builds older than the thresholds below (a different threshold is
// chosen depending on whether LIBAVUTIL_VERSION_MICRO >= 100), map the AV_PIX_FMT_*
// names and AVPixelFormat used in this file onto the legacy PIX_FMT_* / PixelFormat names.
#if LIBAVUTIL_BUILD < (LIBAVUTIL_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(51, 74, 100) : CALC_FFMPEG_VERSION(51, 42, 0))
#define AVPixelFormat PixelFormat
#define AV_PIX_FMT_BGR24 PIX_FMT_BGR24
#define AV_PIX_FMT_RGB24 PIX_FMT_RGB24
#define AV_PIX_FMT_GRAY8 PIX_FMT_GRAY8
#define AV_PIX_FMT_YUV422P PIX_FMT_YUV422P
#define AV_PIX_FMT_YUV420P PIX_FMT_YUV420P
#define AV_PIX_FMT_YUV444P PIX_FMT_YUV444P
#define AV_PIX_FMT_YUVJ420P PIX_FMT_YUVJ420P
#define AV_PIX_FMT_GRAY16LE PIX_FMT_GRAY16LE
#define AV_PIX_FMT_GRAY16BE PIX_FMT_GRAY16BE
#endif

152 153 154 155 156 157 158 159 160 161
// USE_AV_FRAME_GET_BUFFER is 1 when libavutil is new enough (thresholds below) and
// 0 otherwise. Code in this file branches on it to choose between
// av_frame_get_buffer()/av_frame_unref() and a manually allocated conversion buffer.
// In the legacy case AV_NUM_DATA_POINTERS is also supplied if the headers lack it.
#if LIBAVUTIL_BUILD >= (LIBAVUTIL_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(52, 38, 100) : CALC_FFMPEG_VERSION(52, 13, 0))
#define USE_AV_FRAME_GET_BUFFER 1
#else
#define USE_AV_FRAME_GET_BUFFER 0
#ifndef AV_NUM_DATA_POINTERS // required for 0.7.x/0.8.x ffmpeg releases
#define AV_NUM_DATA_POINTERS 4
#endif
#endif

162

163 164 165 166 167 168 169 170 171
// USE_AV_INTERRUPT_CALLBACK enables the timeout (interrupt callback) support in this file.
// It can be predefined by the build; otherwise it defaults to 1 for
// libavformat builds >= 53.21.0 and to 0 for older ones.
#ifndef USE_AV_INTERRUPT_CALLBACK
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 21, 0)
#define USE_AV_INTERRUPT_CALLBACK 1
#else
#define USE_AV_INTERRUPT_CALLBACK 0
#endif
#endif

#if USE_AV_INTERRUPT_CALLBACK
172 173
// Timeouts, in milliseconds, stored into the interrupt metadata's timeout_after_ms
// by CvCapture_FFMPEG::open() and CvCapture_FFMPEG::grabFrame() respectively.
#define LIBAVFORMAT_INTERRUPT_OPEN_TIMEOUT_MS 30000
#define LIBAVFORMAT_INTERRUPT_READ_TIMEOUT_MS 30000
174 175 176 177

#ifdef WIN32
// http://stackoverflow.com/questions/5404277/porting-clock-gettime-to-windows

178
static
179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198
inline LARGE_INTEGER get_filetime_offset()
{
    SYSTEMTIME s;
    FILETIME f;
    LARGE_INTEGER t;

    s.wYear = 1970;
    s.wMonth = 1;
    s.wDay = 1;
    s.wHour = 0;
    s.wMinute = 0;
    s.wSecond = 0;
    s.wMilliseconds = 0;
    SystemTimeToFileTime(&s, &f);
    t.QuadPart = f.dwHighDateTime;
    t.QuadPart <<= 32;
    t.QuadPart |= f.dwLowDateTime;
    return t;
}

199
static
200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243
inline void get_monotonic_time(timespec *tv)
{
    LARGE_INTEGER           t;
    FILETIME				f;
    double                  microseconds;
    static LARGE_INTEGER    offset;
    static double           frequencyToMicroseconds;
    static int              initialized = 0;
    static BOOL             usePerformanceCounter = 0;

    if (!initialized)
    {
        LARGE_INTEGER performanceFrequency;
        initialized = 1;
        usePerformanceCounter = QueryPerformanceFrequency(&performanceFrequency);
        if (usePerformanceCounter)
        {
            QueryPerformanceCounter(&offset);
            frequencyToMicroseconds = (double)performanceFrequency.QuadPart / 1000000.;
        }
        else
        {
            offset = get_filetime_offset();
            frequencyToMicroseconds = 10.;
        }
    }

    if (usePerformanceCounter)
    {
        QueryPerformanceCounter(&t);
    } else {
        GetSystemTimeAsFileTime(&f);
        t.QuadPart = f.dwHighDateTime;
        t.QuadPart <<= 32;
        t.QuadPart |= f.dwLowDateTime;
    }

    t.QuadPart -= offset.QuadPart;
    microseconds = (double)t.QuadPart / frequencyToMicroseconds;
    t.QuadPart = microseconds;
    tv->tv_sec = t.QuadPart / 1000000;
    tv->tv_nsec = (t.QuadPart % 1000000) * 1000;
}
#else
244
// Non-Windows implementation: stores the current reading of a monotonic clock in *time.
// Only differences between two readings are meaningful.
//  - macOS: reads the Mach SYSTEM_CLOCK. CALENDAR_CLOCK is the wall clock and can
//    jump when the system time is adjusted, which would corrupt timeout measurements.
//  - elsewhere: clock_gettime(CLOCK_MONOTONIC).
static inline void get_monotonic_time(timespec *time)
{
#if defined(__APPLE__) && defined(__MACH__)
    clock_serv_t cclock;
    mach_timespec_t mts = { 0, 0 }; // deterministic result even if the clock query fails
    host_get_clock_service(mach_host_self(), SYSTEM_CLOCK, &cclock);
    clock_get_time(cclock, &mts);
    mach_port_deallocate(mach_task_self(), cclock);
    time->tv_sec = mts.tv_sec;
    time->tv_nsec = mts.tv_nsec;
#else
    clock_gettime(CLOCK_MONOTONIC, time);
#endif
}
#endif

261
// Returns end - start as a timespec, borrowing one second when the
// nanosecond difference would otherwise be negative.
static inline timespec get_monotonic_time_diff(timespec start, timespec end)
{
    timespec delta;
    delta.tv_sec  = end.tv_sec - start.tv_sec;
    delta.tv_nsec = end.tv_nsec - start.tv_nsec;

    if (delta.tv_nsec < 0)
    {
        delta.tv_sec  -= 1;
        delta.tv_nsec += 1000000000;
    }
    return delta;
}

278
static
279 280 281 282 283 284 285
inline double get_monotonic_time_diff_ms(timespec time1, timespec time2)
{
    timespec delta = get_monotonic_time_diff(time1, time2);
    double milliseconds = delta.tv_sec * 1000 + (double)delta.tv_nsec / 1000000.0;

    return milliseconds;
}
286
#endif // USE_AV_INTERRUPT_CALLBACK
287

288
static int get_number_of_cpus(void)
289
{
V
Vadim Pisarevsky 已提交
290 291 292
#if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(52, 111, 0)
    return 1;
#elif defined WIN32 || defined _WIN32
293 294
    SYSTEM_INFO sysinfo;
    GetSystemInfo( &sysinfo );
V
Vadim Pisarevsky 已提交
295

296 297 298 299 300 301
    return (int)sysinfo.dwNumberOfProcessors;
#elif defined __linux__
    return (int)sysconf( _SC_NPROCESSORS_ONLN );
#elif defined __APPLE__
    int numCPU=0;
    int mib[4];
V
Vadim Pisarevsky 已提交
302 303 304
    size_t len = sizeof(numCPU);

    // set the mib for hw.ncpu
305 306
    mib[0] = CTL_HW;
    mib[1] = HW_AVAILCPU;  // alternatively, try HW_NCPU;
V
Vadim Pisarevsky 已提交
307 308

    // get the number of CPUs from the system
309
    sysctl(mib, 2, &numCPU, &len, NULL, 0);
V
Vadim Pisarevsky 已提交
310 311

    if( numCPU < 1 )
312 313 314
    {
        mib[1] = HW_NCPU;
        sysctl( mib, 2, &numCPU, &len, NULL, 0 );
V
Vadim Pisarevsky 已提交
315

316 317 318 319 320 321 322 323 324 325 326
        if( numCPU < 1 )
            numCPU = 1;
    }

    return (int)numCPU;
#else
    return 1;
#endif
}


327 328 329 330 331 332 333 334 335 336
// Plain description of an image buffer. CvCapture_FFMPEG keeps one instance
// ("frame") and hands its fields out from retrieveFrame().
struct Image_FFMPEG
{
    unsigned char* data; // first byte of the pixel buffer (not owned by this struct)
    int step;            // line size of the buffer, as reported by the source frame's linesize[0]
    int width;           // image width
    int height;          // image height
    int cn;              // number of channels (the capture code sets 3)
};


337
#if USE_AV_INTERRUPT_CALLBACK
338 339 340 341 342 343 344
// State shared between the capture object and _opencv_ffmpeg_interrupt_callback().
struct AVInterruptCallbackMetadata
{
    timespec value;                 // reference time the elapsed time is measured from
    unsigned int timeout_after_ms;  // timeout in milliseconds; 0 disables the timeout check
    int timeout;                    // set by the callback: non-zero once the timeout has elapsed
};

345
// Releases the malloc-family block that *ptr points to and resets *ptr to null.
// A null *ptr is accepted; ptr itself must not be null.
static inline void _opencv_ffmpeg_free(void** ptr)
{
    free(*ptr);   // free(NULL) is a no-op, so no guard is required
    *ptr = NULL;
}

352
static
353 354 355 356 357
inline int _opencv_ffmpeg_interrupt_callback(void *ptr)
{
    AVInterruptCallbackMetadata* metadata = (AVInterruptCallbackMetadata*)ptr;
    assert(metadata);

358 359 360 361 362
    if (metadata->timeout_after_ms == 0)
    {
        return 0; // timeout is disabled
    }

363 364 365 366 367 368 369
    timespec now;
    get_monotonic_time(&now);

    metadata->timeout = get_monotonic_time_diff_ms(metadata->value, now) > metadata->timeout_after_ms;

    return metadata->timeout ? -1 : 0;
}
370
#endif
371

P
Peter Rekdal Sunde 已提交
372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404
// Releases the data referenced by pkt, using av_packet_unref() on libavcodec
// builds that provide it and the older av_free_packet() otherwise.
static
inline void _opencv_ffmpeg_av_packet_unref(AVPacket *pkt)
{
#if LIBAVCODEC_BUILD >= (LIBAVCODEC_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(55, 25, 100) : CALC_FFMPEG_VERSION(55, 16, 0))
    av_packet_unref(pkt);
#else
    av_free_packet(pkt);
#endif
}

// Points the data/linesize arrays of *frame at the buffer ptr for an image of
// the given pixel format and size.
// frame is passed as void* and is treated as an AVFrame (new API) or an
// AVPicture (legacy API); newer libavutil builds use av_image_fill_arrays()
// with alignment 1, older ones avpicture_fill().
static
inline void _opencv_ffmpeg_av_image_fill_arrays(void *frame, uint8_t *ptr, enum AVPixelFormat pix_fmt, int width, int height)
{
#if LIBAVUTIL_BUILD >= (LIBAVUTIL_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(51, 63, 100) : CALC_FFMPEG_VERSION(54, 6, 0))
    av_image_fill_arrays(((AVFrame*)frame)->data, ((AVFrame*)frame)->linesize, ptr, pix_fmt, width, height, 1);
#else
    avpicture_fill((AVPicture*)frame, ptr, pix_fmt, width, height);
#endif
}

// Returns the value reported by av_image_get_buffer_size() (alignment 1) on newer
// libavutil builds, or by avpicture_get_size() on older ones, for an image of the
// given pixel format and dimensions. Callers use it as a buffer size in bytes.
static
inline int _opencv_ffmpeg_av_image_get_buffer_size(enum AVPixelFormat pix_fmt, int width, int height)
{
#if LIBAVUTIL_BUILD >= (LIBAVUTIL_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(51, 63, 100) : CALC_FFMPEG_VERSION(54, 6, 0))
    return av_image_get_buffer_size(pix_fmt, width, height, 1);
#else
    return avpicture_get_size(pix_fmt, width, height);
#endif
}

405

406 407 408 409 410
struct CvCapture_FFMPEG
{
    bool open( const char* filename );
    void close();

411
    double getProperty(int) const;
412 413 414 415 416
    bool setProperty(int, double);
    bool grabFrame();
    bool retrieveFrame(int, unsigned char** data, int* step, int* width, int* height, int* cn);

    void init();
V
Vadim Pisarevsky 已提交
417 418 419

    void    seek(int64_t frame_number);
    void    seek(double sec);
420
    bool    slowSeek( int framenumber );
V
Vadim Pisarevsky 已提交
421

422 423 424 425
    int64_t get_total_frames() const;
    double  get_duration_sec() const;
    double  get_fps() const;
    int     get_bitrate() const;
426
    AVRational get_sample_aspect_ratio(AVStream *stream) const;
V
Vadim Pisarevsky 已提交
427

428
    double  r2d(AVRational r) const;
V
Vadim Pisarevsky 已提交
429 430 431 432 433 434 435
    int64_t dts_to_frame_number(int64_t dts);
    double  dts_to_sec(int64_t dts);

    AVFormatContext * ic;
    AVCodec         * avcodec;
    int               video_stream;
    AVStream        * video_st;
436 437
    AVFrame         * picture;
    AVFrame           rgb_picture;
V
Vadim Pisarevsky 已提交
438 439 440 441
    int64_t           picture_pts;

    AVPacket          packet;
    Image_FFMPEG      frame;
442
    struct SwsContext *img_convert_ctx;
V
Vadim Pisarevsky 已提交
443 444 445 446

    int64_t frame_number, first_frame_number;

    double eps_zero;
447 448 449 450 451 452 453 454
/*
   'filename' contains the filename of the videosource,
   'filename==NULL' indicates that ffmpeg's seek support works
   for the particular file.
   'filename!=NULL' indicates that the slow fallback function is used for seeking,
   and so the filename is needed to reopen the file on backward seeking.
*/
    char              * filename;
I
Ilya Lavrenov 已提交
455 456 457 458

#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(52, 111, 0)
    AVDictionary *dict;
#endif
459
#if USE_AV_INTERRUPT_CALLBACK
460
    AVInterruptCallbackMetadata interrupt_metadata;
461
#endif
462 463 464 465 466 467 468 469
};

void CvCapture_FFMPEG::init()
{
    ic = 0;
    video_stream = -1;
    video_st = 0;
    picture = 0;
V
Vadim Pisarevsky 已提交
470 471
    picture_pts = AV_NOPTS_VALUE_;
    first_frame_number = -1;
472 473 474
    memset( &rgb_picture, 0, sizeof(rgb_picture) );
    memset( &frame, 0, sizeof(frame) );
    filename = 0;
V
Vadim Pisarevsky 已提交
475 476
    memset(&packet, 0, sizeof(packet));
    av_init_packet(&packet);
477
    img_convert_ctx = 0;
V
Vadim Pisarevsky 已提交
478 479 480 481

    avcodec = 0;
    frame_number = 0;
    eps_zero = 0.000025;
I
Ilya Lavrenov 已提交
482 483 484 485

#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(52, 111, 0)
    dict = NULL;
#endif
486 487 488 489 490
}


void CvCapture_FFMPEG::close()
{
V
Vadim Pisarevsky 已提交
491 492 493 494 495
    if( img_convert_ctx )
    {
        sws_freeContext(img_convert_ctx);
        img_convert_ctx = 0;
    }
496

497
    if( picture )
498 499
    {
#if LIBAVCODEC_BUILD >= (LIBAVCODEC_VERSION_MICRO >= 100 \
J
jisli 已提交
500 501 502
    ? CALC_FFMPEG_VERSION(55, 45, 101) : CALC_FFMPEG_VERSION(55, 28, 1))
        av_frame_free(&picture);
#elif LIBAVCODEC_BUILD >= (LIBAVCODEC_VERSION_MICRO >= 100 \
503 504 505
    ? CALC_FFMPEG_VERSION(54, 59, 100) : CALC_FFMPEG_VERSION(54, 28, 0))
        avcodec_free_frame(&picture);
#else
506
        av_free(picture);
507 508
#endif
    }
509 510 511 512 513

    if( video_st )
    {
#if LIBAVFORMAT_BUILD > 4628
        avcodec_close( video_st->codec );
V
Vadim Pisarevsky 已提交
514

515
#else
V
Vadim Pisarevsky 已提交
516 517
        avcodec_close( &(video_st->codec) );

518 519 520 521 522 523
#endif
        video_st = NULL;
    }

    if( ic )
    {
V
Vadim Pisarevsky 已提交
524
#if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 24, 2)
525
        av_close_input_file(ic);
V
Vadim Pisarevsky 已提交
526
#else
527
        avformat_close_input(&ic);
V
Vadim Pisarevsky 已提交
528 529
#endif

530 531 532
        ic = NULL;
    }

533 534 535
#if USE_AV_FRAME_GET_BUFFER
    av_frame_unref(&rgb_picture);
#else
536 537 538 539 540
    if( rgb_picture.data[0] )
    {
        free( rgb_picture.data[0] );
        rgb_picture.data[0] = 0;
    }
541
#endif
542 543 544

    // free last packet if exist
    if (packet.data) {
P
Peter Rekdal Sunde 已提交
545
        _opencv_ffmpeg_av_packet_unref (&packet);
V
Vadim Pisarevsky 已提交
546
        packet.data = NULL;
547 548
    }

I
Ilya Lavrenov 已提交
549 550 551 552 553
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(52, 111, 0)
    if (dict != NULL)
       av_dict_free(&dict);
#endif

554 555 556 557 558
    init();
}


// Fallback values for seek flags that the FFmpeg headers in use may not define.
#if !defined(AVSEEK_FLAG_FRAME)
#  define AVSEEK_FLAG_FRAME 0
#endif

#if !defined(AVSEEK_FLAG_ANY)
#  define AVSEEK_FLAG_ANY 1
#endif
V
Vadim Pisarevsky 已提交
564

I
Ilya Lavrenov 已提交
565
// Small non-copyable mutex wrapper. The platform-specific primitive lives in
// ImplMutex::Impl, which is heap-allocated by init() and released by destroy().
// init()/destroy() are public so that code which obtains raw storage for an
// ImplMutex (without running the constructor) can set it up and tear it down.
class ImplMutex
{
public:
    ImplMutex()
    {
        init();
    }

    ~ImplMutex()
    {
        destroy();
    }

    void init();     // allocate and initialise the underlying primitive
    void destroy();  // destroy and free the underlying primitive

    void lock();
    bool trylock();  // true when the lock was acquired
    void unlock();

    struct Impl;

protected:
    Impl* impl;

private:
    // copying is disabled: declared but never defined
    ImplMutex(const ImplMutex&);
    ImplMutex& operator = (const ImplMutex& m);
};

#if defined WIN32 || defined _WIN32 || defined WINCE

// Windows backend: a CRITICAL_SECTION.
struct ImplMutex::Impl
{
    void init()
    {
        // The Ex variant (with a spin count of 1000) is used when targeting Vista or newer.
#if (_WIN32_WINNT >= 0x0600)
        ::InitializeCriticalSectionEx(&cs, 1000, 0);
#else
        ::InitializeCriticalSection(&cs);
#endif
        refcount = 1;
    }

    void destroy()
    {
        DeleteCriticalSection(&cs);
    }

    void lock()
    {
        EnterCriticalSection(&cs);
    }

    bool trylock()
    {
        return TryEnterCriticalSection(&cs) != 0;
    }

    void unlock()
    {
        LeaveCriticalSection(&cs);
    }

    CRITICAL_SECTION cs;
    int refcount;   // set to 1 by init()
};

#ifndef __GNUC__
// Forwards to the Windows interlocked exchange-add on *addr with delta and returns
// that call's result as int. Uses the compiler intrinsic on MSVC 2008 and newer,
// the Win32 API function otherwise.
static int _interlockedExchangeAdd(int* addr, int delta)
{
    long volatile* const target = (long volatile*)addr;
#if defined _MSC_VER && _MSC_VER >= 1500
    return (int)_InterlockedExchangeAdd(target, delta);
#else
    return (int)InterlockedExchangeAdd(target, delta);
#endif
}
#endif // __GNUC__

#elif defined __APPLE__

#include <libkern/OSAtomic.h>

// macOS backend: an OSSpinLock.
struct ImplMutex::Impl
{
    void init()
    {
        sl = OS_SPINLOCK_INIT;
        refcount = 1;
    }

    void destroy()
    {
        // nothing to release for an OSSpinLock
    }

    void lock()
    {
        OSSpinLockLock(&sl);
    }

    bool trylock()
    {
        return OSSpinLockTry(&sl);
    }

    void unlock()
    {
        OSSpinLockUnlock(&sl);
    }

    OSSpinLock sl;
    int refcount;   // set to 1 by init()
};

638
#elif defined __linux__ && !defined __ANDROID__
I
Ilya Lavrenov 已提交
639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671

// Linux (non-Android) backend: a pthread spinlock.
struct ImplMutex::Impl
{
    void init()
    {
        pthread_spin_init(&sl, 0);
        refcount = 1;
    }

    void destroy()
    {
        pthread_spin_destroy(&sl);
    }

    void lock()
    {
        pthread_spin_lock(&sl);
    }

    bool trylock()
    {
        // pthread_spin_trylock() returns 0 when the lock was taken
        return pthread_spin_trylock(&sl) == 0;
    }

    void unlock()
    {
        pthread_spin_unlock(&sl);
    }

    pthread_spinlock_t sl;
    int refcount;   // set to 1 by init()
};

#else

// Generic pthread backend (used when none of the other platform branches match): a pthread mutex.
struct ImplMutex::Impl
{
    void init()
    {
        pthread_mutex_init(&sl, 0);
        refcount = 1;
    }

    void destroy()
    {
        pthread_mutex_destroy(&sl);
    }

    void lock()
    {
        pthread_mutex_lock(&sl);
    }

    bool trylock()
    {
        // pthread_mutex_trylock() returns 0 when the lock was taken
        return pthread_mutex_trylock(&sl) == 0;
    }

    void unlock()
    {
        pthread_mutex_unlock(&sl);
    }

    pthread_mutex_t sl;
    int refcount;   // set to 1 by init()
};

#endif

void ImplMutex::init()
{
672
    impl = new Impl();
A
Andrey Kamaev 已提交
673
    impl->init();
I
Ilya Lavrenov 已提交
674
}
A
Andrey Kamaev 已提交
675
void ImplMutex::destroy()
I
Ilya Lavrenov 已提交
676
{
A
Andrey Kamaev 已提交
677
    impl->destroy();
678
    delete(impl);
A
Andrey Kamaev 已提交
679
    impl = NULL;
I
Ilya Lavrenov 已提交
680 681 682 683 684 685 686 687 688
}
// The three locking operations simply forward to the platform implementation.
void ImplMutex::lock()
{
    impl->lock();
}

void ImplMutex::unlock()
{
    impl->unlock();
}

bool ImplMutex::trylock()
{
    return impl->trylock();
}

static int LockCallBack(void **mutex, AVLockOp op)
{
    ImplMutex* localMutex = reinterpret_cast<ImplMutex*>(*mutex);
    switch (op)
689
    {
I
Ilya Lavrenov 已提交
690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709
        case AV_LOCK_CREATE:
            localMutex = reinterpret_cast<ImplMutex*>(malloc(sizeof(ImplMutex)));
            localMutex->init();
            *mutex = localMutex;
            if (!*mutex)
                return 1;
        break;

        case AV_LOCK_OBTAIN:
            localMutex->lock();
        break;

        case AV_LOCK_RELEASE:
            localMutex->unlock();
        break;

        case AV_LOCK_DESTROY:
            localMutex->destroy();
            free(localMutex);
            localMutex = NULL;
710
            *mutex = NULL;
I
Ilya Lavrenov 已提交
711 712 713 714 715 716 717 718
        break;
    }
    return 0;
}

// File-wide lock; taken by InternalFFMpegRegister's constructor and by CvCapture_FFMPEG::open().
static ImplMutex _mutex;
// True between InternalFFMpegRegister's constructor and destructor, i.e. while
// the global FFmpeg registration done there is in effect.
static bool _initialized = false;

719 720 721 722 723 724 725 726 727 728 729 730 731
// Scoped lock: takes the mutex on construction and releases it on destruction.
class AutoLock
{
public:
    AutoLock(ImplMutex& m)
        : mutex(&m)
    {
        mutex->lock();
    }

    ~AutoLock()
    {
        mutex->unlock();
    }

protected:
    ImplMutex* mutex;

private:
    // non-copyable: declared but never defined
    AutoLock(const AutoLock&);
    AutoLock& operator = (const AutoLock&);
};


I
Ilya Lavrenov 已提交
732 733 734 735
class InternalFFMpegRegister
{
public:
    InternalFFMpegRegister()
736
    {
737
        AutoLock lock(_mutex);
I
Ilya Lavrenov 已提交
738 739
        if (!_initialized)
        {
740
    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 13, 0)
I
Ilya Lavrenov 已提交
741
            avformat_network_init();
742
    #endif
V
Vadim Pisarevsky 已提交
743

I
Ilya Lavrenov 已提交
744 745
            /* register all codecs, demux and protocols */
            av_register_all();
V
Vadim Pisarevsky 已提交
746

I
Ilya Lavrenov 已提交
747 748
            /* register a callback function for synchronization */
            av_lockmgr_register(&LockCallBack);
749

I
Ilya Lavrenov 已提交
750
            av_log_set_level(AV_LOG_ERROR);
V
Vadim Pisarevsky 已提交
751

I
Ilya Lavrenov 已提交
752 753
            _initialized = true;
        }
V
Vadim Pisarevsky 已提交
754
    }
755

I
Ilya Lavrenov 已提交
756 757 758 759
    ~InternalFFMpegRegister()
    {
        _initialized = false;
        av_lockmgr_register(NULL);
V
Vadim Pisarevsky 已提交
760
    }
I
Ilya Lavrenov 已提交
761 762 763
};

// File-scope instance whose constructor performs the FFmpeg registration
// during static initialisation of this translation unit.
static InternalFFMpegRegister _init;
764 765 766

bool CvCapture_FFMPEG::open( const char* _filename )
{
767
    AutoLock lock(_mutex);
768 769 770 771
    unsigned i;
    bool valid = false;

    close();
772

773
#if USE_AV_INTERRUPT_CALLBACK
774
    /* interrupt callback */
775
    interrupt_metadata.timeout_after_ms = LIBAVFORMAT_INTERRUPT_OPEN_TIMEOUT_MS;
776 777 778 779 780
    get_monotonic_time(&interrupt_metadata.value);

    ic = avformat_alloc_context();
    ic->interrupt_callback.callback = _opencv_ffmpeg_interrupt_callback;
    ic->interrupt_callback.opaque = &interrupt_metadata;
781
#endif
782

V
Vadim Pisarevsky 已提交
783
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(52, 111, 0)
I
Ilya Lavrenov 已提交
784
    av_dict_set(&dict, "rtsp_transport", "tcp", 0);
785
    int err = avformat_open_input(&ic, _filename, NULL, &dict);
V
Vadim Pisarevsky 已提交
786
#else
787
    int err = av_open_input_file(&ic, _filename, NULL, 0, NULL);
788 789
#endif

I
Ilya Lavrenov 已提交
790 791
    if (err < 0)
    {
V
Vadim Pisarevsky 已提交
792
        CV_WARN("Error opening file");
793
        CV_WARN(_filename);
V
Vadim Pisarevsky 已提交
794
        goto exit_func;
795
    }
V
Vadim Pisarevsky 已提交
796
    err =
R
Roman Donchenko 已提交
797
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 6, 0)
V
Vadim Pisarevsky 已提交
798 799 800 801
    avformat_find_stream_info(ic, NULL);
#else
    av_find_stream_info(ic);
#endif
I
Ilya Lavrenov 已提交
802 803
    if (err < 0)
    {
V
Vadim Pisarevsky 已提交
804 805
        CV_WARN("Could not find codec parameters");
        goto exit_func;
806
    }
V
Vadim Pisarevsky 已提交
807 808
    for(i = 0; i < ic->nb_streams; i++)
    {
809 810 811 812 813 814
#if LIBAVFORMAT_BUILD > 4628
        AVCodecContext *enc = ic->streams[i]->codec;
#else
        AVCodecContext *enc = &ic->streams[i]->codec;
#endif

I
Ilya Lavrenov 已提交
815 816 817
//#ifdef FF_API_THREAD_INIT
//        avcodec_thread_init(enc, get_number_of_cpus());
//#else
V
Vadim Pisarevsky 已提交
818
        enc->thread_count = get_number_of_cpus();
I
Ilya Lavrenov 已提交
819
//#endif
820

821 822 823
#if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 2, 0)
#define AVMEDIA_TYPE_VIDEO CODEC_TYPE_VIDEO
#endif
V
Vadim Pisarevsky 已提交
824

I
Ilya Lavrenov 已提交
825 826
        if( AVMEDIA_TYPE_VIDEO == enc->codec_type && video_stream < 0)
        {
G
gferry 已提交
827 828 829 830
            // backup encoder' width/height
            int enc_width = enc->width;
            int enc_height = enc->height;

A
Andrey Morozov 已提交
831
            AVCodec *codec = avcodec_find_decoder(enc->codec_id);
832
            if (!codec ||
V
Vadim Pisarevsky 已提交
833 834 835 836 837
#if LIBAVCODEC_VERSION_INT >= ((53<<16)+(8<<8)+0)
                avcodec_open2(enc, codec, NULL)
#else
                avcodec_open(enc, codec)
#endif
I
Ilya Lavrenov 已提交
838 839
                < 0)
                goto exit_func;
V
Vadim Pisarevsky 已提交
840

G
gferry 已提交
841 842 843 844
            // checking width/height (since decoder can sometimes alter it, eg. vp6f)
            if (enc_width && (enc->width != enc_width)) { enc->width = enc_width; }
            if (enc_height && (enc->height != enc_height)) { enc->height = enc_height; }

845 846
            video_stream = i;
            video_st = ic->streams[i];
J
jisli 已提交
847 848 849 850
#if LIBAVCODEC_BUILD >= (LIBAVCODEC_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(55, 45, 101) : CALC_FFMPEG_VERSION(55, 28, 1))
            picture = av_frame_alloc();
#else
851
            picture = avcodec_alloc_frame();
J
jisli 已提交
852
#endif
853 854 855 856

            frame.width = enc->width;
            frame.height = enc->height;
            frame.cn = 3;
857 858
            frame.step = 0;
            frame.data = NULL;
859 860 861 862 863 864
            break;
        }
    }

    if(video_stream >= 0) valid = true;

V
Vadim Pisarevsky 已提交
865
exit_func:
866

867 868 869 870 871
#if USE_AV_INTERRUPT_CALLBACK
    // deactivate interrupt callback
    interrupt_metadata.timeout_after_ms = 0;
#endif

872 873 874 875 876 877 878 879 880 881 882 883
    if( !valid )
        close();

    return valid;
}


bool CvCapture_FFMPEG::grabFrame()
{
    bool valid = false;
    int got_picture;

V
Vadim Pisarevsky 已提交
884
    int count_errs = 0;
J
jormansa 已提交
885
    const int max_number_of_attempts = 1 << 9;
886

V
Vadim Pisarevsky 已提交
887
    if( !ic || !video_st )  return false;
888

889 890 891
    if( ic->streams[video_stream]->nb_frames > 0 &&
        frame_number > ic->streams[video_stream]->nb_frames )
        return false;
892

V
Vadim Pisarevsky 已提交
893
    picture_pts = AV_NOPTS_VALUE_;
894

895 896 897 898 899 900
#if USE_AV_INTERRUPT_CALLBACK
    // activate interrupt callback
    get_monotonic_time(&interrupt_metadata.value);
    interrupt_metadata.timeout_after_ms = LIBAVFORMAT_INTERRUPT_READ_TIMEOUT_MS;
#endif

901
    // get the next frame
V
Vadim Pisarevsky 已提交
902 903
    while (!valid)
    {
H
hahne 已提交
904

P
Peter Rekdal Sunde 已提交
905
        _opencv_ffmpeg_av_packet_unref (&packet);
906

907
#if USE_AV_INTERRUPT_CALLBACK
908 909 910 911 912
        if (interrupt_metadata.timeout)
        {
            valid = false;
            break;
        }
913
#endif
914

915
        int ret = av_read_frame(ic, &packet);
V
Vadim Pisarevsky 已提交
916 917 918 919 920 921
        if (ret == AVERROR(EAGAIN)) continue;

        /* else if (ret < 0) break; */

        if( packet.stream_index != video_stream )
        {
P
Peter Rekdal Sunde 已提交
922
            _opencv_ffmpeg_av_packet_unref (&packet);
V
Vadim Pisarevsky 已提交
923 924 925
            count_errs++;
            if (count_errs > max_number_of_attempts)
                break;
926 927
            continue;
        }
928

V
Vadim Pisarevsky 已提交
929 930 931 932 933 934 935 936 937 938 939 940
        // Decode video frame
        #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
            avcodec_decode_video2(video_st->codec, picture, &got_picture, &packet);
        #elif LIBAVFORMAT_BUILD > 4628
                avcodec_decode_video(video_st->codec,
                                     picture, &got_picture,
                                     packet.data, packet.size);
        #else
                avcodec_decode_video(&video_st->codec,
                                     picture, &got_picture,
                                     packet.data, packet.size);
        #endif
941

V
Vadim Pisarevsky 已提交
942 943 944 945 946
        // Did we get a video frame?
        if(got_picture)
        {
            //picture_pts = picture->best_effort_timestamp;
            if( picture_pts == AV_NOPTS_VALUE_ )
947 948
                picture_pts = picture->pkt_pts != AV_NOPTS_VALUE_ && picture->pkt_pts != 0 ? picture->pkt_pts : picture->pkt_dts;

V
Vadim Pisarevsky 已提交
949 950 951 952 953 954 955 956
            frame_number++;
            valid = true;
        }
        else
        {
            count_errs++;
            if (count_errs > max_number_of_attempts)
                break;
957 958 959
        }
    }

V
Vadim Pisarevsky 已提交
960 961
    if( valid && first_frame_number < 0 )
        first_frame_number = dts_to_frame_number(picture_pts);
962

963 964 965 966 967
#if USE_AV_INTERRUPT_CALLBACK
    // deactivate interrupt callback
    interrupt_metadata.timeout_after_ms = 0;
#endif

968 969 970 971 972 973 974 975 976 977
    // return if we have a new picture or not
    return valid;
}


bool CvCapture_FFMPEG::retrieveFrame(int, unsigned char** data, int* step, int* width, int* height, int* cn)
{
    if( !video_st || !picture->data[0] )
        return false;

V
Vadim Pisarevsky 已提交
978 979
    if( img_convert_ctx == NULL ||
        frame.width != video_st->codec->width ||
980 981
        frame.height != video_st->codec->height ||
        frame.data == NULL )
V
Vadim Pisarevsky 已提交
982
    {
983 984 985
        // Some sws_scale optimizations have some assumptions about alignment of data/step/width/height
        // Also we use coded_width/height to workaround problem with legacy ffmpeg versions (like n0.8)
        int buffer_width = video_st->codec->coded_width, buffer_height = video_st->codec->coded_height;
V
Vadim Pisarevsky 已提交
986 987

        img_convert_ctx = sws_getCachedContext(
988 989
                img_convert_ctx,
                buffer_width, buffer_height,
V
Vadim Pisarevsky 已提交
990
                video_st->codec->pix_fmt,
991
                buffer_width, buffer_height,
J
jisli 已提交
992
                AV_PIX_FMT_BGR24,
V
Vadim Pisarevsky 已提交
993 994 995 996 997 998
                SWS_BICUBIC,
                NULL, NULL, NULL
                );

        if (img_convert_ctx == NULL)
            return false;//CV_Error(0, "Cannot initialize the conversion context!");
999

1000 1001 1002 1003 1004 1005 1006 1007 1008 1009 1010 1011 1012
#if USE_AV_FRAME_GET_BUFFER
        av_frame_unref(&rgb_picture);
        rgb_picture.format = AV_PIX_FMT_BGR24;
        rgb_picture.width = buffer_width;
        rgb_picture.height = buffer_height;
        if (0 != av_frame_get_buffer(&rgb_picture, 32))
        {
            CV_WARN("OutOfMemory");
            return false;
        }
#else
        int aligns[AV_NUM_DATA_POINTERS];
        avcodec_align_dimensions2(video_st->codec, &buffer_width, &buffer_height, aligns);
1013
        rgb_picture.data[0] = (uint8_t*)realloc(rgb_picture.data[0],
P
Peter Rekdal Sunde 已提交
1014
                _opencv_ffmpeg_av_image_get_buffer_size( AV_PIX_FMT_BGR24,
1015
                                    buffer_width, buffer_height ));
P
Peter Rekdal Sunde 已提交
1016
        _opencv_ffmpeg_av_image_fill_arrays(&rgb_picture, rgb_picture.data[0],
1017 1018 1019 1020 1021
                        AV_PIX_FMT_BGR24, buffer_width, buffer_height );
#endif
        frame.width = video_st->codec->width;
        frame.height = video_st->codec->height;
        frame.cn = 3;
1022
        frame.data = rgb_picture.data[0];
1023
        frame.step = rgb_picture.linesize[0];
V
Vadim Pisarevsky 已提交
1024 1025 1026 1027 1028 1029
    }

    sws_scale(
            img_convert_ctx,
            picture->data,
            picture->linesize,
1030
            0, video_st->codec->coded_height,
V
Vadim Pisarevsky 已提交
1031 1032 1033 1034
            rgb_picture.data,
            rgb_picture.linesize
            );

1035 1036 1037 1038 1039 1040 1041 1042 1043 1044
    *data = frame.data;
    *step = frame.step;
    *width = frame.width;
    *height = frame.height;
    *cn = frame.cn;

    return true;
}


1045
double CvCapture_FFMPEG::getProperty( int property_id ) const
1046 1047 1048 1049 1050
{
    if( !video_st ) return 0;

    switch( property_id )
    {
V
Vadim Pisarevsky 已提交
1051 1052
    case CV_FFMPEG_CAP_PROP_POS_MSEC:
        return 1000.0*(double)frame_number/get_fps();
1053
    case CV_FFMPEG_CAP_PROP_POS_FRAMES:
V
Vadim Pisarevsky 已提交
1054
        return (double)frame_number;
1055
    case CV_FFMPEG_CAP_PROP_POS_AVI_RATIO:
V
Vadim Pisarevsky 已提交
1056
        return r2d(ic->streams[video_stream]->time_base);
1057
    case CV_FFMPEG_CAP_PROP_FRAME_COUNT:
V
Vadim Pisarevsky 已提交
1058
        return (double)get_total_frames();
1059 1060 1061 1062 1063
    case CV_FFMPEG_CAP_PROP_FRAME_WIDTH:
        return (double)frame.width;
    case CV_FFMPEG_CAP_PROP_FRAME_HEIGHT:
        return (double)frame.height;
    case CV_FFMPEG_CAP_PROP_FPS:
1064
        return get_fps();
1065 1066 1067 1068 1069 1070
    case CV_FFMPEG_CAP_PROP_FOURCC:
#if LIBAVFORMAT_BUILD > 4628
        return (double)video_st->codec->codec_tag;
#else
        return (double)video_st->codec.codec_tag;
#endif
1071 1072 1073 1074
    case CV_FFMPEG_CAP_PROP_SAR_NUM:
        return get_sample_aspect_ratio(ic->streams[video_stream]).num;
    case CV_FFMPEG_CAP_PROP_SAR_DEN:
        return get_sample_aspect_ratio(ic->streams[video_stream]).den;
V
Vadim Pisarevsky 已提交
1075
    default:
1076
        break;
1077
    }
V
Vadim Pisarevsky 已提交
1078

1079 1080 1081
    return 0;
}

1082
/** Convert a rational to double; yields 0 when either the numerator or the denominator is 0. */
double CvCapture_FFMPEG::r2d(AVRational r) const
{
    if (r.num == 0 || r.den == 0)
        return 0.;

    return (double)r.num / (double)r.den;
}

1087
double CvCapture_FFMPEG::get_duration_sec() const
1088
{
V
Vadim Pisarevsky 已提交
1089 1090 1091
    double sec = (double)ic->duration / (double)AV_TIME_BASE;

    if (sec < eps_zero)
1092
    {
V
Vadim Pisarevsky 已提交
1093
        sec = (double)ic->streams[video_stream]->duration * r2d(ic->streams[video_stream]->time_base);
1094
    }
V
Vadim Pisarevsky 已提交
1095 1096

    if (sec < eps_zero)
1097
    {
V
Vadim Pisarevsky 已提交
1098
        sec = (double)ic->streams[video_stream]->duration * r2d(ic->streams[video_stream]->time_base);
1099
    }
V
Vadim Pisarevsky 已提交
1100 1101

    return sec;
1102 1103
}

1104
int CvCapture_FFMPEG::get_bitrate() const
1105
{
V
Vadim Pisarevsky 已提交
1106 1107 1108
    return ic->bit_rate;
}

1109
double CvCapture_FFMPEG::get_fps() const
V
Vadim Pisarevsky 已提交
1110
{
A
Alexander Alekhin 已提交
1111 1112 1113 1114 1115 1116
#if 0 && LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(55, 1, 100) && LIBAVFORMAT_VERSION_MICRO >= 100
    double fps = r2d(av_guess_frame_rate(ic, ic->streams[video_stream], NULL));
#else
#if LIBAVCODEC_BUILD >= CALC_FFMPEG_VERSION(54, 1, 0)
    double fps = r2d(ic->streams[video_stream]->avg_frame_rate);
#else
V
Vadim Pisarevsky 已提交
1117
    double fps = r2d(ic->streams[video_stream]->r_frame_rate);
A
Alexander Alekhin 已提交
1118
#endif
V
Vadim Pisarevsky 已提交
1119 1120 1121 1122 1123

#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(52, 111, 0)
    if (fps < eps_zero)
    {
        fps = r2d(ic->streams[video_stream]->avg_frame_rate);
1124
    }
1125
#endif
V
Vadim Pisarevsky 已提交
1126 1127 1128 1129 1130

    if (fps < eps_zero)
    {
        fps = 1.0 / r2d(ic->streams[video_stream]->codec->time_base);
    }
A
Alexander Alekhin 已提交
1131
#endif
V
Vadim Pisarevsky 已提交
1132 1133 1134
    return fps;
}

1135
int64_t CvCapture_FFMPEG::get_total_frames() const
V
Vadim Pisarevsky 已提交
1136 1137 1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151
{
    int64_t nbf = ic->streams[video_stream]->nb_frames;

    if (nbf == 0)
    {
        nbf = (int64_t)floor(get_duration_sec() * get_fps() + 0.5);
    }
    return nbf;
}

/** Map a stream timestamp to a frame index: seconds since stream start times fps, plus 0.5, truncated. */
int64_t CvCapture_FFMPEG::dts_to_frame_number(int64_t dts)
{
    const double seconds = dts_to_sec(dts);
    const double frames = get_fps() * seconds;
    return (int64_t)(frames + 0.5);
}

1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168 1169 1170 1171 1172 1173
/**
 * Sample aspect ratio of a stream.
 *
 * Both the stream-level and the codec-level ratios are reduced; a ratio with a
 * non-positive numerator or denominator is replaced by the undefined value 0/1.
 * The stream-level ratio wins when its numerator is non-zero.
 *
 * @param stream stream to inspect; may be NULL, in which case 0/1 is returned
 */
AVRational CvCapture_FFMPEG::get_sample_aspect_ratio(AVStream *stream) const
{
    const AVRational undef = {0, 1};
    AVRational from_stream = undef;
    AVRational from_codec  = undef;

    if (stream)
    {
        from_stream = stream->sample_aspect_ratio;
        if (stream->codec)
            from_codec = stream->codec->sample_aspect_ratio;
    }

    av_reduce(&from_stream.num, &from_stream.den,
        from_stream.num, from_stream.den, INT_MAX);
    if (from_stream.num <= 0 || from_stream.den <= 0)
        from_stream = undef;

    av_reduce(&from_codec.num, &from_codec.den,
        from_codec.num, from_codec.den, INT_MAX);
    if (from_codec.num <= 0 || from_codec.den <= 0)
        from_codec = undef;

    return from_stream.num ? from_stream : from_codec;
}

V
Vadim Pisarevsky 已提交
1174 1175 1176 1177 1178 1179 1180 1181 1182 1183
double CvCapture_FFMPEG::dts_to_sec(int64_t dts)
{
    return (double)(dts - ic->streams[video_stream]->start_time) *
        r2d(ic->streams[video_stream]->time_base);
}

void CvCapture_FFMPEG::seek(int64_t _frame_number)
{
    _frame_number = std::min(_frame_number, get_total_frames());
    int delta = 16;
1184

V
Vadim Pisarevsky 已提交
1185 1186
    // if we have not grabbed a single frame before first seek, let's read the first frame
    // and get some valuable information during the process
1187
    if( first_frame_number < 0 && get_total_frames() > 1 )
1188
        grabFrame();
1189

V
Vadim Pisarevsky 已提交
1190 1191 1192 1193 1194 1195 1196
    for(;;)
    {
        int64_t _frame_number_temp = std::max(_frame_number-delta, (int64_t)0);
        double sec = (double)_frame_number_temp / get_fps();
        int64_t time_stamp = ic->streams[video_stream]->start_time;
        double  time_base  = r2d(ic->streams[video_stream]->time_base);
        time_stamp += (int64_t)(sec / time_base + 0.5);
1197
        if (get_total_frames() > 1) av_seek_frame(ic, video_stream, time_stamp, AVSEEK_FLAG_BACKWARD);
V
Vadim Pisarevsky 已提交
1198 1199 1200 1201
        avcodec_flush_buffers(ic->streams[video_stream]->codec);
        if( _frame_number > 0 )
        {
            grabFrame();
1202

V
Vadim Pisarevsky 已提交
1203 1204 1205 1206 1207
            if( _frame_number > 1 )
            {
                frame_number = dts_to_frame_number(picture_pts) - first_frame_number;
                //printf("_frame_number = %d, frame_number = %d, delta = %d\n",
                //       (int)_frame_number, (int)frame_number, delta);
1208

V
Vadim Pisarevsky 已提交
1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234
                if( frame_number < 0 || frame_number > _frame_number-1 )
                {
                    if( _frame_number_temp == 0 || delta >= INT_MAX/4 )
                        break;
                    delta = delta < 16 ? delta*2 : delta*3/2;
                    continue;
                }
                while( frame_number < _frame_number-1 )
                {
                    if(!grabFrame())
                        break;
                }
                frame_number++;
                break;
            }
            else
            {
                frame_number = 1;
                break;
            }
        }
        else
        {
            frame_number = 0;
            break;
        }
1235
    }
V
Vadim Pisarevsky 已提交
1236 1237 1238 1239 1240
}

/** Seek to a time in seconds by converting it to a frame index (sec * fps, plus 0.5, truncated). */
void CvCapture_FFMPEG::seek(double sec)
{
    const int64_t target_frame = (int64_t)(sec * get_fps() + 0.5);
    seek(target_frame);
}
1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255

bool CvCapture_FFMPEG::setProperty( int property_id, double value )
{
    if( !video_st ) return false;

    switch( property_id )
    {
    case CV_FFMPEG_CAP_PROP_POS_MSEC:
    case CV_FFMPEG_CAP_PROP_POS_FRAMES:
    case CV_FFMPEG_CAP_PROP_POS_AVI_RATIO:
        {
            switch( property_id )
            {
            case CV_FFMPEG_CAP_PROP_POS_FRAMES:
V
Vadim Pisarevsky 已提交
1256
                seek((int64_t)value);
1257 1258 1259
                break;

            case CV_FFMPEG_CAP_PROP_POS_MSEC:
V
Vadim Pisarevsky 已提交
1260
                seek(value/1000.0);
1261 1262 1263
                break;

            case CV_FFMPEG_CAP_PROP_POS_AVI_RATIO:
V
Vadim Pisarevsky 已提交
1264
                seek((int64_t)(value*ic->duration));
1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282
                break;
            }

            picture_pts=(int64_t)value;
        }
        break;
    default:
        return false;
    }

    return true;
}


///////////////// FFMPEG CvVideoWriter implementation //////////////////////////
struct CvVideoWriter_FFMPEG
{
    bool open( const char* filename, int fourcc,
1283
               double fps, int width, int height, bool isColor );
1284 1285 1286 1287 1288
    void close();
    bool writeFrame( const unsigned char* data, int step, int width, int height, int cn, int origin );

    void init();

1289
    AVOutputFormat  * fmt;
V
Vadim Pisarevsky 已提交
1290
    AVFormatContext * oc;
1291 1292 1293 1294 1295 1296 1297 1298
    uint8_t         * outbuf;
    uint32_t          outbuf_size;
    FILE            * outfile;
    AVFrame         * picture;
    AVFrame         * input_picture;
    uint8_t         * picbuf;
    AVStream        * video_st;
    int               input_pix_fmt;
1299
    unsigned char   * aligned_input;
V
Vadim Pisarevsky 已提交
1300
    int               frame_width, frame_height;
1301
    int               frame_idx;
V
Vadim Pisarevsky 已提交
1302
    bool              ok;
1303 1304 1305 1306 1307
    struct SwsContext *img_convert_ctx;
};

static const char * icvFFMPEGErrStr(int err)
{
1308
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
1309
    switch(err) {
1310 1311 1312 1313 1314 1315 1316 1317 1318 1319 1320 1321 1322 1323 1324 1325 1326 1327 1328 1329 1330 1331 1332 1333 1334 1335 1336 1337
    case AVERROR_BSF_NOT_FOUND:
        return "Bitstream filter not found";
    case AVERROR_DECODER_NOT_FOUND:
        return "Decoder not found";
    case AVERROR_DEMUXER_NOT_FOUND:
        return "Demuxer not found";
    case AVERROR_ENCODER_NOT_FOUND:
        return "Encoder not found";
    case AVERROR_EOF:
        return "End of file";
    case AVERROR_EXIT:
        return "Immediate exit was requested; the called function should not be restarted";
    case AVERROR_FILTER_NOT_FOUND:
        return "Filter not found";
    case AVERROR_INVALIDDATA:
        return "Invalid data found when processing input";
    case AVERROR_MUXER_NOT_FOUND:
        return "Muxer not found";
    case AVERROR_OPTION_NOT_FOUND:
        return "Option not found";
    case AVERROR_PATCHWELCOME:
        return "Not yet implemented in FFmpeg, patches welcome";
    case AVERROR_PROTOCOL_NOT_FOUND:
        return "Protocol not found";
    case AVERROR_STREAM_NOT_FOUND:
        return "Stream not found";
    default:
        break;
V
Vadim Pisarevsky 已提交
1338
    }
1339
#else
1340 1341
    switch(err) {
    case AVERROR_NUMEXPECTED:
V
Vadim Pisarevsky 已提交
1342
        return "Incorrect filename syntax";
1343
    case AVERROR_INVALIDDATA:
V
Vadim Pisarevsky 已提交
1344
        return "Invalid data in header";
1345
    case AVERROR_NOFMT:
V
Vadim Pisarevsky 已提交
1346
        return "Unknown format";
1347
    case AVERROR_IO:
V
Vadim Pisarevsky 已提交
1348
        return "I/O error occurred";
1349
    case AVERROR_NOMEM:
V
Vadim Pisarevsky 已提交
1350
        return "Memory allocation error";
1351
    default:
V
Vadim Pisarevsky 已提交
1352
        break;
1353
    }
1354 1355
#endif

V
Vadim Pisarevsky 已提交
1356
    return "Unspecified error";
1357 1358 1359 1360
}

/* function internal to FFMPEG (libavformat/riff.c) to lookup codec id by fourcc tag*/
extern "C" {
1361
    enum CV_CODEC_ID codec_get_bmp_id(unsigned int tag);
1362 1363 1364 1365 1366 1367 1368 1369 1370 1371 1372 1373 1374 1375
}

void CvVideoWriter_FFMPEG::init()
{
    fmt = 0;
    oc = 0;
    outbuf = 0;
    outbuf_size = 0;
    outfile = 0;
    picture = 0;
    input_picture = 0;
    picbuf = 0;
    video_st = 0;
    input_pix_fmt = 0;
1376
    aligned_input = NULL;
1377
    img_convert_ctx = 0;
V
Vadim Pisarevsky 已提交
1378
    frame_width = frame_height = 0;
1379
    frame_idx = 0;
V
Vadim Pisarevsky 已提交
1380
    ok = false;
1381 1382 1383 1384 1385 1386 1387 1388
}

/**
 * the following function is a modified version of code
 * found in ffmpeg-0.4.9-pre1/output_example.c
 *
 * Allocate an AVFrame and record its format and size. When `alloc` is true a
 * pixel buffer is malloc'ed and attached to the frame; otherwise the frame
 * carries no buffer.
 *
 * @return the new frame, or NULL when the frame or its buffer cannot be
 *         allocated or the required buffer size cannot be determined.
 */
static AVFrame * icv_alloc_picture_FFMPEG(int pix_fmt, int width, int height, bool alloc)
{
    AVFrame * picture;

#if LIBAVCODEC_BUILD >= (LIBAVCODEC_VERSION_MICRO >= 100 \
    ? CALC_FFMPEG_VERSION(55, 45, 101) : CALC_FFMPEG_VERSION(55, 28, 1))
    picture = av_frame_alloc();
#else
    picture = avcodec_alloc_frame();
#endif
    if (!picture)
        return NULL;

    picture->format = pix_fmt;
    picture->width = width;
    picture->height = height;

    if (alloc)
    {
        // The size helper reports failures as a non-positive value; never let
        // that reach malloc, where it would become an enormous request.
        const int size = _opencv_ffmpeg_av_image_get_buffer_size( (AVPixelFormat) pix_fmt, width, height);
        uint8_t * picture_buf = size > 0 ? (uint8_t *) malloc((size_t)size) : NULL;
        if (!picture_buf)
        {
            av_free(picture);
            return NULL;
        }
        _opencv_ffmpeg_av_image_fill_arrays(picture, picture_buf,
                       (AVPixelFormat) pix_fmt, width, height);
    }

    return picture;
}

/**
 * Add a video output stream to the container and configure its codec context.
 *
 * @param oc            output format context that receives the new stream
 * @param codec_id      encoder to use; CODEC_ID_NONE keeps the codec guessed
 *                      from the output format
 * @param w, h          frame size
 * @param bitrate       base bit rate; 1.5x this value (capped at INT_MAX) is set
 * @param fps           requested frame rate
 * @param pixel_format  codec pixel format (an AVPixelFormat value)
 * @return the new stream, or NULL when it cannot be allocated or no supported
 *         frame rate can be selected.
 */
static AVStream *icv_add_video_stream_FFMPEG(AVFormatContext *oc,
                                             CV_CODEC_ID codec_id,
                                             int w, int h, int bitrate,
                                             double fps, int pixel_format)
{
    AVCodecContext *c;
    AVStream *st;
    int frame_rate, frame_rate_base;
    AVCodec *codec;

#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 10, 0)
    st = avformat_new_stream(oc, 0);
#else
    st = av_new_stream(oc, 0);
#endif

    if (!st) {
        CV_WARN("Could not allocate stream");
        return NULL;
    }

#if LIBAVFORMAT_BUILD > 4628
    c = st->codec;
#else
    c = &(st->codec);
#endif

#if LIBAVFORMAT_BUILD > 4621
    c->codec_id = av_guess_codec(oc->oformat, NULL, oc->filename, NULL, AVMEDIA_TYPE_VIDEO);
#else
    c->codec_id = oc->oformat->video_codec;
#endif

    // an explicitly requested codec overrides the guess
    if(codec_id != CV_CODEC(CODEC_ID_NONE)){
        c->codec_id = codec_id;
    }

    codec = avcodec_find_encoder(c->codec_id);

    c->codec_type = AVMEDIA_TYPE_VIDEO;

#if LIBAVCODEC_BUILD >= CALC_FFMPEG_VERSION(54,25,0)
    // Set per-codec defaults
    AVCodecID c_id = c->codec_id;
    avcodec_get_context_defaults3(c, codec);
    // avcodec_get_context_defaults3 erases codec_id for some reason
    c->codec_id = c_id;
#endif

    /* put sample parameters */
    int64_t lbit_rate = (int64_t)bitrate;
    lbit_rate += (bitrate / 2);
    lbit_rate = std::min(lbit_rate, (int64_t)INT_MAX);
    c->bit_rate = lbit_rate;

    // took advice from
    // http://ffmpeg-users.933282.n4.nabble.com/warning-clipping-1-dct-coefficients-to-127-127-td934297.html
    c->qmin = 3;

    /* resolution must be a multiple of two */
    c->width = w;
    c->height = h;

    /* time base: this is the fundamental unit of time (in seconds) in terms
       of which frame timestamps are represented. for fixed-fps content,
       timebase should be 1/framerate and timestamp increments should be
       identically 1. */
    frame_rate=(int)(fps+0.5);
    frame_rate_base=1;
    // Refine the rational until it is within 0.001 of fps. The absolute value
    // must cover the whole difference; otherwise a rate that rounds down
    // (e.g. 24.4 -> 24/1) would be accepted without refinement.
    while (fabs((double)frame_rate/frame_rate_base - fps) > 0.001){
        frame_rate_base*=10;
        frame_rate=(int)(fps*frame_rate_base + 0.5);
    }
#if LIBAVFORMAT_BUILD > 4752
    c->time_base.den = frame_rate;
    c->time_base.num = frame_rate_base;
    /* adjust time base for supported framerates */
    if(codec && codec->supported_framerates){
        const AVRational *p= codec->supported_framerates;
        AVRational req = {frame_rate, frame_rate_base};
        const AVRational *best=NULL;
        AVRational best_error= {INT_MAX, 1};
        // pick the supported rate closest to the requested one
        for(; p->den!=0; p++){
            AVRational error= av_sub_q(req, *p);
            if(error.num <0) error.num *= -1;
            if(av_cmp_q(error, best_error) < 0){
                best_error= error;
                best= p;
            }
        }
        if (best == NULL)
            return NULL;
        c->time_base.den= best->num;
        c->time_base.num= best->den;
    }
#else
    c->frame_rate = frame_rate;
    c->frame_rate_base = frame_rate_base;
#endif

    c->gop_size = 12; /* emit one intra frame every twelve frames at most */
    c->pix_fmt = (AVPixelFormat) pixel_format;

    if (c->codec_id == CV_CODEC(CODEC_ID_MPEG2VIDEO)) {
        c->max_b_frames = 2;
    }
    if (c->codec_id == CV_CODEC(CODEC_ID_MPEG1VIDEO) || c->codec_id == CV_CODEC(CODEC_ID_MSMPEG4V3)){
        /* needed to avoid using macroblocks in which some coeffs overflow
           this doesn't happen with normal video, it just happens here as the
           motion of the chroma plane doesn't match the luma plane */
        /* avoid FFMPEG warning 'clipping 1 dct coefficients...' */
        c->mb_decision=2;
    }

#if LIBAVUTIL_BUILD > CALC_FFMPEG_VERSION(51,11,0)
    /* Some settings for libx264 encoding, restore dummy values for gop_size
     and qmin since they will be set to reasonable defaults by the libx264
     preset system. Also, use a crf encode with the default quality rating,
     this seems easier than finding an appropriate default bitrate. */
    if (c->codec_id == AV_CODEC_ID_H264) {
      c->gop_size = -1;
      c->qmin = -1;
      c->bit_rate = 0;
      if (c->priv_data)
          av_opt_set(c->priv_data,"crf","23", 0);
    }
#endif

#if LIBAVCODEC_VERSION_INT>0x000409
    // some formats want stream headers to be separate
    if(oc->oformat->flags & AVFMT_GLOBALHEADER)
    {
        c->flags |= CODEC_FLAG_GLOBAL_HEADER;
    }
#endif

#if LIBAVCODEC_BUILD >= CALC_FFMPEG_VERSION(52, 42, 0)
    {
        // named local instead of a C compound literal, which is not standard C++
        const AVRational avg_rate = {frame_rate, frame_rate_base};
        st->avg_frame_rate = avg_rate;
    }
#endif

    return st;
}

V
Vadim Pisarevsky 已提交
1568 1569
static const int OPENCV_NO_FRAMES_WRITTEN_CODE = 1000;

1570 1571 1572 1573 1574 1575 1576
static int icv_av_write_frame_FFMPEG( AVFormatContext * oc, AVStream * video_st,
#if LIBAVCODEC_BUILD >= CALC_FFMPEG_VERSION(54, 1, 0)
                                      uint8_t *, uint32_t,
#else
                                      uint8_t * outbuf, uint32_t outbuf_size,
#endif
                                      AVFrame * picture )
1577 1578
{
#if LIBAVFORMAT_BUILD > 4628
V
Vadim Pisarevsky 已提交
1579
    AVCodecContext * c = video_st->codec;
1580
#else
V
Vadim Pisarevsky 已提交
1581
    AVCodecContext * c = &(video_st->codec);
1582
#endif
1583
    int ret = OPENCV_NO_FRAMES_WRITTEN_CODE;
1584 1585 1586 1587 1588 1589 1590

    if (oc->oformat->flags & AVFMT_RAWPICTURE) {
        /* raw video case. The API will change slightly in the near
           futur for that */
        AVPacket pkt;
        av_init_packet(&pkt);

1591 1592 1593
#ifndef PKT_FLAG_KEY
#define PKT_FLAG_KEY AV_PKT_FLAG_KEY
#endif
V
Vadim Pisarevsky 已提交
1594 1595

        pkt.flags |= PKT_FLAG_KEY;
1596 1597 1598 1599 1600 1601 1602
        pkt.stream_index= video_st->index;
        pkt.data= (uint8_t *)picture;
        pkt.size= sizeof(AVPicture);

        ret = av_write_frame(oc, &pkt);
    } else {
        /* encode the image */
1603 1604 1605 1606 1607 1608 1609 1610
        AVPacket pkt;
        av_init_packet(&pkt);
#if LIBAVCODEC_BUILD >= CALC_FFMPEG_VERSION(54, 1, 0)
        int got_output = 0;
        pkt.data = NULL;
        pkt.size = 0;
        ret = avcodec_encode_video2(c, &pkt, picture, &got_output);
        if (ret < 0)
1611
            ;
1612
        else if (got_output) {
1613 1614 1615 1616 1617 1618
            if (pkt.pts != (int64_t)AV_NOPTS_VALUE)
                pkt.pts = av_rescale_q(pkt.pts, c->time_base, video_st->time_base);
            if (pkt.dts != (int64_t)AV_NOPTS_VALUE)
                pkt.dts = av_rescale_q(pkt.dts, c->time_base, video_st->time_base);
            if (pkt.duration)
                pkt.duration = av_rescale_q(pkt.duration, c->time_base, video_st->time_base);
1619 1620
            pkt.stream_index= video_st->index;
            ret = av_write_frame(oc, &pkt);
P
Peter Rekdal Sunde 已提交
1621
            _opencv_ffmpeg_av_packet_unref(&pkt);
1622 1623 1624 1625 1626
        }
        else
            ret = OPENCV_NO_FRAMES_WRITTEN_CODE;
#else
        int out_size = avcodec_encode_video(c, outbuf, outbuf_size, picture);
1627 1628 1629
        /* if zero size, it means the image was buffered */
        if (out_size > 0) {
#if LIBAVFORMAT_BUILD > 4752
1630
            if(c->coded_frame->pts != (int64_t)AV_NOPTS_VALUE)
1631
                pkt.pts = av_rescale_q(c->coded_frame->pts, c->time_base, video_st->time_base);
1632
#else
V
Vadim Pisarevsky 已提交
1633
            pkt.pts = c->coded_frame->pts;
1634 1635 1636 1637 1638 1639 1640 1641 1642 1643
#endif
            if(c->coded_frame->key_frame)
                pkt.flags |= PKT_FLAG_KEY;
            pkt.stream_index= video_st->index;
            pkt.data= outbuf;
            pkt.size= out_size;

            /* write the compressed frame in the media file */
            ret = av_write_frame(oc, &pkt);
        }
1644
#endif
1645
    }
V
Vadim Pisarevsky 已提交
1646
    return ret;
1647 1648 1649 1650 1651
}

/// write a frame with FFMPEG
bool CvVideoWriter_FFMPEG::writeFrame( const unsigned char* data, int step, int width, int height, int cn, int origin )
{
1652 1653 1654 1655 1656 1657 1658 1659 1660 1661 1662 1663 1664 1665
    // check parameters
    if (input_pix_fmt == AV_PIX_FMT_BGR24) {
        if (cn != 3) {
            return false;
        }
    }
    else if (input_pix_fmt == AV_PIX_FMT_GRAY8) {
        if (cn != 1) {
            return false;
        }
    }
    else {
        assert(false);
    }
1666

V
Vadim Pisarevsky 已提交
1667 1668 1669 1670
    if( (width & -2) != frame_width || (height & -2) != frame_height || !data )
        return false;
    width = frame_width;
    height = frame_height;
1671

V
Vadim Pisarevsky 已提交
1672
    // typecast from opaque data type to implemented struct
1673 1674 1675
#if LIBAVFORMAT_BUILD > 4628
    AVCodecContext *c = video_st->codec;
#else
A
Alexander Shishkov 已提交
1676
    AVCodecContext *c = &(video_st->codec);
1677 1678
#endif

1679 1680 1681 1682 1683 1684
    // FFmpeg contains SIMD optimizations which can sometimes read data past
    // the supplied input buffer. To ensure that doesn't happen, we pad the
    // step to a multiple of 32 (that's the minimal alignment for which Valgrind
    // doesn't raise any warnings).
    const int STEP_ALIGNMENT = 32;
    if( step % STEP_ALIGNMENT != 0 )
A
Alexander Shishkov 已提交
1685
    {
1686 1687 1688
        int aligned_step = (step + STEP_ALIGNMENT - 1) & -STEP_ALIGNMENT;

        if( !aligned_input )
A
Alexander Shishkov 已提交
1689
        {
1690
            aligned_input = (unsigned char*)av_mallocz(aligned_step * height);
A
Alexander Shishkov 已提交
1691
        }
1692

A
Alexander Shishkov 已提交
1693 1694
        if (origin == 1)
            for( int y = 0; y < height; y++ )
1695
                memcpy(aligned_input + y*aligned_step, data + (height-1-y)*step, step);
A
Alexander Shishkov 已提交
1696 1697
        else
            for( int y = 0; y < height; y++ )
1698
                memcpy(aligned_input + y*aligned_step, data + y*step, step);
1699

1700 1701
        data = aligned_input;
        step = aligned_step;
1702 1703
    }

V
Vadim Pisarevsky 已提交
1704 1705 1706
    if ( c->pix_fmt != input_pix_fmt ) {
        assert( input_picture );
        // let input_picture point to the raw data buffer of 'image'
P
Peter Rekdal Sunde 已提交
1707
        _opencv_ffmpeg_av_image_fill_arrays(input_picture, (uint8_t *) data,
J
jisli 已提交
1708
                       (AVPixelFormat)input_pix_fmt, width, height);
1709
        input_picture->linesize[0] = step;
1710

V
Vadim Pisarevsky 已提交
1711 1712 1713 1714
        if( !img_convert_ctx )
        {
            img_convert_ctx = sws_getContext(width,
                                             height,
J
jisli 已提交
1715
                                             (AVPixelFormat)input_pix_fmt,
V
Vadim Pisarevsky 已提交
1716 1717 1718 1719 1720 1721 1722 1723
                                             c->width,
                                             c->height,
                                             c->pix_fmt,
                                             SWS_BICUBIC,
                                             NULL, NULL, NULL);
            if( !img_convert_ctx )
                return false;
        }
1724 1725 1726 1727 1728 1729

        if ( sws_scale(img_convert_ctx, input_picture->data,
                       input_picture->linesize, 0,
                       height,
                       picture->data, picture->linesize) < 0 )
            return false;
V
Vadim Pisarevsky 已提交
1730 1731
    }
    else{
P
Peter Rekdal Sunde 已提交
1732
        _opencv_ffmpeg_av_image_fill_arrays(picture, (uint8_t *) data,
J
jisli 已提交
1733
                       (AVPixelFormat)input_pix_fmt, width, height);
1734
        picture->linesize[0] = step;
V
Vadim Pisarevsky 已提交
1735
    }
1736

1737
    picture->pts = frame_idx;
1738
    bool ret = icv_av_write_frame_FFMPEG( oc, video_st, outbuf, outbuf_size, picture) >= 0;
1739
    frame_idx++;
1740

V
Vadim Pisarevsky 已提交
1741
    return ret;
1742 1743 1744 1745 1746
}

/// close video output stream and free associated memory
void CvVideoWriter_FFMPEG::close()
{
V
Vadim Pisarevsky 已提交
1747 1748 1749
    // nothing to do if already released
    if ( !picture )
        return;
1750

V
Vadim Pisarevsky 已提交
1751 1752 1753 1754
    /* no more frame to compress. The codec has a latency of a few
       frames if using B frames, so we get the last frames by
       passing the same picture again */
    // TODO -- do we need to account for latency here?
1755

V
Vadim Pisarevsky 已提交
1756 1757 1758 1759 1760 1761 1762 1763 1764 1765 1766 1767 1768 1769
    /* write the trailer, if any */
    if(ok && oc)
    {
        if( (oc->oformat->flags & AVFMT_RAWPICTURE) == 0 )
        {
            for(;;)
            {
                int ret = icv_av_write_frame_FFMPEG( oc, video_st, outbuf, outbuf_size, NULL);
                if( ret == OPENCV_NO_FRAMES_WRITTEN_CODE || ret < 0 )
                    break;
            }
        }
        av_write_trailer(oc);
    }
1770

V
Vadim Pisarevsky 已提交
1771 1772 1773 1774 1775
    if( img_convert_ctx )
    {
        sws_freeContext(img_convert_ctx);
        img_convert_ctx = 0;
    }
1776

V
Vadim Pisarevsky 已提交
1777
    // free pictures
1778
#if LIBAVFORMAT_BUILD > 4628
V
Vadim Pisarevsky 已提交
1779
    if( video_st->codec->pix_fmt != input_pix_fmt)
1780
#else
V
Vadim Pisarevsky 已提交
1781
    if( video_st->codec.pix_fmt != input_pix_fmt)
1782
#endif
V
Vadim Pisarevsky 已提交
1783 1784 1785 1786 1787 1788
    {
        if(picture->data[0])
            free(picture->data[0]);
        picture->data[0] = 0;
    }
    av_free(picture);
1789

V
Vadim Pisarevsky 已提交
1790 1791
    if (input_picture)
        av_free(input_picture);
1792

V
Vadim Pisarevsky 已提交
1793
    /* close codec */
1794
#if LIBAVFORMAT_BUILD > 4628
V
Vadim Pisarevsky 已提交
1795
    avcodec_close(video_st->codec);
1796
#else
V
Vadim Pisarevsky 已提交
1797
    avcodec_close(&(video_st->codec));
1798 1799
#endif

V
Vadim Pisarevsky 已提交
1800
    av_free(outbuf);
1801

1802
    if (oc)
V
Vadim Pisarevsky 已提交
1803
    {
1804 1805 1806
        if (!(fmt->flags & AVFMT_NOFILE))
        {
            /* close the output file */
1807

V
Vadim Pisarevsky 已提交
1808
#if LIBAVCODEC_VERSION_INT < ((52<<16)+(123<<8)+0)
1809
#if LIBAVCODEC_VERSION_INT >= ((51<<16)+(49<<8)+0)
1810
            url_fclose(oc->pb);
1811
#else
1812
            url_fclose(&oc->pb);
V
Vadim Pisarevsky 已提交
1813 1814
#endif
#else
1815
            avio_close(oc->pb);
1816 1817
#endif

1818
        }
1819

1820 1821 1822
        /* free the stream */
        avformat_free_context(oc);
    }
1823

1824
    av_freep(&aligned_input);
1825

V
Vadim Pisarevsky 已提交
1826 1827
    init();
}
1828

1829 1830 1831
// Substitute '?' for values below 32 so the character can be printed.
#define CV_PRINTABLE_CHAR(ch) ((ch) < 32 ? '?' : (ch))
// Expand a 32-bit tag into four character arguments, lowest byte first.
#define CV_TAG_TO_PRINTABLE_CHAR4(tag) \
    CV_PRINTABLE_CHAR((tag) & 255), \
    CV_PRINTABLE_CHAR(((tag) >> 8) & 255), \
    CV_PRINTABLE_CHAR(((tag) >> 16) & 255), \
    CV_PRINTABLE_CHAR(((tag) >> 24) & 255)

1832
static inline bool cv_ff_codec_tag_match(const AVCodecTag *tags, CV_CODEC_ID id, unsigned int tag)
1833 1834 1835 1836 1837 1838 1839 1840 1841
{
    while (tags->id != AV_CODEC_ID_NONE)
    {
        if (tags->id == id && tags->tag == tag)
            return true;
        tags++;
    }
    return false;
}
1842
static inline bool cv_ff_codec_tag_list_match(const AVCodecTag *const *tags, CV_CODEC_ID id, unsigned int tag)
1843 1844 1845 1846 1847 1848 1849 1850 1851 1852
{
    int i;
    for (i = 0; tags && tags[i]; i++) {
        bool res = cv_ff_codec_tag_match(tags[i], id, tag);
        if (res)
            return res;
    }
    return false;
}

V
Vadim Pisarevsky 已提交
1853 1854 1855 1856
/// Create a video writer object that uses FFMPEG
bool CvVideoWriter_FFMPEG::open( const char * filename, int fourcc,
                                 double fps, int width, int height, bool is_color )
{
1857
    CV_CODEC_ID codec_id = CV_CODEC(CODEC_ID_NONE);
V
Vadim Pisarevsky 已提交
1858 1859
    int err, codec_pix_fmt;
    double bitrate_scale = 1;
1860

V
Vadim Pisarevsky 已提交
1861
    close();
1862

V
Vadim Pisarevsky 已提交
1863 1864 1865 1866 1867
    // check arguments
    if( !filename )
        return false;
    if(fps <= 0)
        return false;
1868

V
Vadim Pisarevsky 已提交
1869 1870 1871 1872 1873 1874 1875
    // we allow frames of odd width or height, but in this case we truncate
    // the rightmost column/the bottom row. Probably, this should be handled more elegantly,
    // but some internal functions inside FFMPEG swscale require even width/height.
    width &= -2;
    height &= -2;
    if( width <= 0 || height <= 0 )
        return false;
1876

V
Vadim Pisarevsky 已提交
1877
    /* auto detect the output format from the name and fourcc code. */
1878

1879
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
V
Vadim Pisarevsky 已提交
1880
    fmt = av_guess_format(NULL, filename, NULL);
1881
#else
V
Vadim Pisarevsky 已提交
1882
    fmt = guess_format(NULL, filename, NULL);
1883
#endif
1884

V
Vadim Pisarevsky 已提交
1885 1886
    if (!fmt)
        return false;
1887

V
Vadim Pisarevsky 已提交
1888 1889
    /* determine optimal pixel format */
    if (is_color) {
J
jisli 已提交
1890
        input_pix_fmt = AV_PIX_FMT_BGR24;
V
Vadim Pisarevsky 已提交
1891 1892
    }
    else {
J
jisli 已提交
1893
        input_pix_fmt = AV_PIX_FMT_GRAY8;
V
Vadim Pisarevsky 已提交
1894
    }
1895

V
Vadim Pisarevsky 已提交
1896
    /* Lookup codec_id for given fourcc */
1897
#if LIBAVCODEC_VERSION_INT<((51<<16)+(49<<8)+0)
1898
    if( (codec_id = codec_get_bmp_id( fourcc )) == CV_CODEC(CODEC_ID_NONE) )
V
Vadim Pisarevsky 已提交
1899
        return false;
1900
#else
1901 1902 1903
    if( (codec_id = av_codec_get_id(fmt->codec_tag, fourcc)) == CV_CODEC(CODEC_ID_NONE) )
    {
        const struct AVCodecTag * fallback_tags[] = {
1904 1905 1906 1907
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(54, 1, 0)
// APIchanges:
// 2012-01-31 - dd6d3b0 - lavf 54.01.0
//   Add avformat_get_riff_video_tags() and avformat_get_riff_audio_tags().
1908
                avformat_get_riff_video_tags(),
1909 1910
#endif
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(55, 25, 100) && defined LIBAVFORMAT_VERSION_MICRO && LIBAVFORMAT_VERSION_MICRO >= 100
1911 1912 1913
// APIchanges: ffmpeg only
// 2014-01-19 - 1a193c4 - lavf 55.25.100 - avformat.h
//   Add avformat_get_mov_video_tags() and avformat_get_mov_audio_tags().
1914
                avformat_get_mov_video_tags(),
1915
#endif
1916 1917
                codec_bmp_tags, // fallback for avformat < 54.1
                NULL };
1918 1919 1920 1921 1922 1923 1924 1925 1926 1927 1928 1929 1930 1931 1932 1933 1934 1935 1936 1937 1938 1939 1940 1941
        if( (codec_id = av_codec_get_id(fallback_tags, fourcc)) == CV_CODEC(CODEC_ID_NONE) )
        {
            fflush(stdout);
            fprintf(stderr, "OpenCV: FFMPEG: tag 0x%08x/'%c%c%c%c' is not found (format '%s / %s')'\n",
                    fourcc, CV_TAG_TO_PRINTABLE_CHAR4(fourcc),
                    fmt->name, fmt->long_name);
            return false;
        }
    }
    // validate tag
    if (cv_ff_codec_tag_list_match(fmt->codec_tag, codec_id, fourcc) == false)
    {
        fflush(stdout);
        fprintf(stderr, "OpenCV: FFMPEG: tag 0x%08x/'%c%c%c%c' is not supported with codec id %d and format '%s / %s'\n",
                fourcc, CV_TAG_TO_PRINTABLE_CHAR4(fourcc),
                codec_id, fmt->name, fmt->long_name);
        int supported_tag;
        if( (supported_tag = av_codec_get_tag(fmt->codec_tag, codec_id)) != 0 )
        {
            fprintf(stderr, "OpenCV: FFMPEG: fallback to use tag 0x%08x/'%c%c%c%c'\n",
                    supported_tag, CV_TAG_TO_PRINTABLE_CHAR4(supported_tag));
            fourcc = supported_tag;
        }
    }
1942 1943
#endif

V
Vadim Pisarevsky 已提交
1944
    // alloc memory for context
1945
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
V
Vadim Pisarevsky 已提交
1946
    oc = avformat_alloc_context();
1947
#else
V
Vadim Pisarevsky 已提交
1948
    oc = av_alloc_format_context();
1949
#endif
V
Vadim Pisarevsky 已提交
1950
    assert (oc);
1951

V
Vadim Pisarevsky 已提交
1952 1953 1954
    /* set file name */
    oc->oformat = fmt;
    snprintf(oc->filename, sizeof(oc->filename), "%s", filename);
1955

V
Vadim Pisarevsky 已提交
1956 1957
    /* set some options */
    oc->max_delay = (int)(0.7*AV_TIME_BASE);  /* This reduces buffer underrun warnings with MPEG */
1958

V
Vadim Pisarevsky 已提交
1959 1960
    // set a few optimal pixel formats for lossless codecs of interest..
    switch (codec_id) {
1961
#if LIBAVCODEC_VERSION_INT>((50<<16)+(1<<8)+0)
1962
    case CV_CODEC(CODEC_ID_JPEGLS):
V
Vadim Pisarevsky 已提交
1963 1964 1965
        // BGR24 or GRAY8 depending on is_color...
        codec_pix_fmt = input_pix_fmt;
        break;
1966
#endif
1967
    case CV_CODEC(CODEC_ID_HUFFYUV):
J
jisli 已提交
1968
        codec_pix_fmt = AV_PIX_FMT_YUV422P;
V
Vadim Pisarevsky 已提交
1969
        break;
1970 1971
    case CV_CODEC(CODEC_ID_MJPEG):
    case CV_CODEC(CODEC_ID_LJPEG):
J
jisli 已提交
1972
        codec_pix_fmt = AV_PIX_FMT_YUVJ420P;
V
Vadim Pisarevsky 已提交
1973 1974
        bitrate_scale = 3;
        break;
1975
    case CV_CODEC(CODEC_ID_RAWVIDEO):
J
jisli 已提交
1976 1977 1978
        codec_pix_fmt = input_pix_fmt == AV_PIX_FMT_GRAY8 ||
                        input_pix_fmt == AV_PIX_FMT_GRAY16LE ||
                        input_pix_fmt == AV_PIX_FMT_GRAY16BE ? input_pix_fmt : AV_PIX_FMT_YUV420P;
V
Vadim Pisarevsky 已提交
1979 1980 1981
        break;
    default:
        // good for lossy formats, MPEG, etc.
J
jisli 已提交
1982
        codec_pix_fmt = AV_PIX_FMT_YUV420P;
V
Vadim Pisarevsky 已提交
1983 1984
        break;
    }
1985

V
Vadim Pisarevsky 已提交
1986
    double bitrate = MIN(bitrate_scale*fps*width*height, (double)INT_MAX/2);
1987

V
Vadim Pisarevsky 已提交
1988 1989 1990 1991
    // TODO -- safe to ignore output audio stream?
    video_st = icv_add_video_stream_FFMPEG(oc, codec_id,
                                           width, height, (int)(bitrate + 0.5),
                                           fps, codec_pix_fmt);
1992

V
Vadim Pisarevsky 已提交
1993 1994 1995 1996 1997 1998 1999
    /* set the output parameters (must be done even if no
   parameters). */
#if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 2, 0)
    if (av_set_parameters(oc, NULL) < 0) {
        return false;
    }
#endif
2000

V
Vadim Pisarevsky 已提交
2001 2002 2003
#if 0
#if FF_API_DUMP_FORMAT
    dump_format(oc, 0, filename, 1);
2004
#else
V
Vadim Pisarevsky 已提交
2005 2006
    av_dump_format(oc, 0, filename, 1);
#endif
2007 2008
#endif

V
Vadim Pisarevsky 已提交
2009 2010 2011 2012
    /* now that all the parameters are set, we can open the audio and
     video codecs and allocate the necessary encode buffers */
    if (!video_st){
        return false;
2013
    }
2014

V
Vadim Pisarevsky 已提交
2015 2016
    AVCodec *codec;
    AVCodecContext *c;
2017

V
Vadim Pisarevsky 已提交
2018 2019 2020 2021 2022
#if LIBAVFORMAT_BUILD > 4628
    c = (video_st->codec);
#else
    c = &(video_st->codec);
#endif
2023

V
Vadim Pisarevsky 已提交
2024 2025 2026 2027
    c->codec_tag = fourcc;
    /* find the video encoder */
    codec = avcodec_find_encoder(c->codec_id);
    if (!codec) {
2028
        fprintf(stderr, "Could not find encoder for codec id %d: %s\n", c->codec_id, icvFFMPEGErrStr(
V
Vadim Pisarevsky 已提交
2029 2030 2031 2032 2033 2034 2035
        #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
                AVERROR_ENCODER_NOT_FOUND
        #else
                -1
        #endif
                ));
        return false;
2036
    }
2037

V
Vadim Pisarevsky 已提交
2038 2039 2040 2041 2042
    int64_t lbit_rate = (int64_t)c->bit_rate;
    lbit_rate += (bitrate / 2);
    lbit_rate = std::min(lbit_rate, (int64_t)INT_MAX);
    c->bit_rate_tolerance = (int)lbit_rate;
    c->bit_rate = (int)lbit_rate;
2043

V
Vadim Pisarevsky 已提交
2044 2045 2046 2047 2048 2049 2050 2051
    /* open the codec */
    if ((err=
#if LIBAVCODEC_VERSION_INT >= ((53<<16)+(8<<8)+0)
         avcodec_open2(c, codec, NULL)
#else
         avcodec_open(c, codec)
#endif
         ) < 0) {
2052
        fprintf(stderr, "Could not open codec '%s': %s\n", codec->name, icvFFMPEGErrStr(err));
V
Vadim Pisarevsky 已提交
2053
        return false;
2054
    }
2055

V
Vadim Pisarevsky 已提交
2056
    outbuf = NULL;
2057

V
Vadim Pisarevsky 已提交
2058 2059 2060 2061 2062
    if (!(oc->oformat->flags & AVFMT_RAWPICTURE)) {
        /* allocate output buffer */
        /* assume we will never get codec output with more than 4 bytes per pixel... */
        outbuf_size = width*height*4;
        outbuf = (uint8_t *) av_malloc(outbuf_size);
2063
    }
2064

V
Vadim Pisarevsky 已提交
2065 2066
    bool need_color_convert;
    need_color_convert = (c->pix_fmt != input_pix_fmt);
2067

V
Vadim Pisarevsky 已提交
2068 2069 2070 2071
    /* allocate the encoded raw picture */
    picture = icv_alloc_picture_FFMPEG(c->pix_fmt, c->width, c->height, need_color_convert);
    if (!picture) {
        return false;
2072
    }
2073

V
Vadim Pisarevsky 已提交
2074 2075 2076 2077 2078 2079 2080 2081
    /* if the output format is not our input format, then a temporary
   picture of the input format is needed too. It is then converted
   to the required output format */
    input_picture = NULL;
    if ( need_color_convert ) {
        input_picture = icv_alloc_picture_FFMPEG(input_pix_fmt, c->width, c->height, false);
        if (!input_picture) {
            return false;
2082
        }
2083 2084
    }

V
Vadim Pisarevsky 已提交
2085 2086 2087 2088 2089 2090 2091 2092 2093 2094
    /* open the output file, if needed */
    if (!(fmt->flags & AVFMT_NOFILE)) {
#if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 2, 0)
        if (url_fopen(&oc->pb, filename, URL_WRONLY) < 0)
#else
            if (avio_open(&oc->pb, filename, AVIO_FLAG_WRITE) < 0)
#endif
            {
            return false;
        }
2095
    }
2096

V
Vadim Pisarevsky 已提交
2097 2098 2099 2100 2101
#if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(52, 111, 0)
    /* write the stream header, if any */
    err=avformat_write_header(oc, NULL);
#else
    err=av_write_header( oc );
2102 2103
#endif

V
Vadim Pisarevsky 已提交
2104
    if(err < 0)
V
Vladislav Vinogradov 已提交
2105
    {
V
Vadim Pisarevsky 已提交
2106 2107 2108
        close();
        remove(filename);
        return false;
V
Vladislav Vinogradov 已提交
2109
    }
V
Vadim Pisarevsky 已提交
2110 2111
    frame_width = width;
    frame_height = height;
2112
    frame_idx = 0;
V
Vadim Pisarevsky 已提交
2113
    ok = true;
I
Ilya Lavrenov 已提交
2114

V
Vadim Pisarevsky 已提交
2115
    return true;
V
Vladislav Vinogradov 已提交
2116 2117 2118 2119
}



V
Vadim Pisarevsky 已提交
2120
// Allocates a CvCapture_FFMPEG with malloc(), initializes it and opens
// `filename`. Returns the capture on success; returns 0 if the allocation or
// open() fails (the object is closed and freed in the latter case).
CvCapture_FFMPEG* cvCreateFileCapture_FFMPEG( const char* filename )
{
    void* storage = malloc(sizeof(CvCapture_FFMPEG));
    if (storage == NULL)
        return 0;

    CvCapture_FFMPEG* capture = (CvCapture_FFMPEG*)storage;
    capture->init();
    if (!capture->open(filename))
    {
        capture->close();
        free(capture);
        capture = 0;
    }
    return capture;
}

V
Vadim Pisarevsky 已提交
2134 2135

// Closes and frees the capture referenced by `capture` and resets the caller's
// pointer to 0. A NULL `capture` or NULL `*capture` is ignored.
void cvReleaseCapture_FFMPEG(CvCapture_FFMPEG** capture)
{
    if (!capture || !*capture)
        return;

    CvCapture_FFMPEG* instance = *capture;
    instance->close();
    free(instance);
    *capture = 0;
}

V
Vadim Pisarevsky 已提交
2145
// C-style entry point: forwards to CvCapture_FFMPEG::setProperty() and returns
// its result converted to int. `capture` is dereferenced unconditionally.
int cvSetCaptureProperty_FFMPEG(CvCapture_FFMPEG* capture, int prop_id, double value)
{
    const int status = capture->setProperty(prop_id, value);
    return status;
}

V
Vadim Pisarevsky 已提交
2150
// C-style entry point: forwards to CvCapture_FFMPEG::getProperty() and returns
// its result as double. `capture` is dereferenced unconditionally.
double cvGetCaptureProperty_FFMPEG(CvCapture_FFMPEG* capture, int prop_id)
{
    const double property_value = capture->getProperty(prop_id);
    return property_value;
}

V
Vadim Pisarevsky 已提交
2155
// C-style entry point: forwards to CvCapture_FFMPEG::grabFrame() and returns
// its result converted to int. `capture` is dereferenced unconditionally.
int cvGrabFrame_FFMPEG(CvCapture_FFMPEG* capture)
{
    const int grabbed = capture->grabFrame();
    return grabbed;
}
V
Vladislav Vinogradov 已提交
2159

V
Vadim Pisarevsky 已提交
2160
// C-style entry point: forwards to CvCapture_FFMPEG::retrieveFrame() with 0 as
// its first argument and returns the result converted to int. The output
// pointers are passed through untouched.
int cvRetrieveFrame_FFMPEG(CvCapture_FFMPEG* capture, unsigned char** data, int* step, int* width, int* height, int* cn)
{
    const int retrieved = capture->retrieveFrame(0, data, step, width, height, cn);
    return retrieved;
}

V
Vadim Pisarevsky 已提交
2165 2166
// Allocates a CvVideoWriter_FFMPEG with malloc(), initializes it and opens the
// output described by the arguments (any non-zero `isColor` means color).
// Returns the writer on success; returns 0 if the allocation or open() fails
// (the object is closed and freed in the latter case).
CvVideoWriter_FFMPEG* cvCreateVideoWriter_FFMPEG( const char* filename, int fourcc, double fps,
                                                  int width, int height, int isColor )
{
    void* storage = malloc(sizeof(CvVideoWriter_FFMPEG));
    if (storage == NULL)
        return 0;

    CvVideoWriter_FFMPEG* writer = (CvVideoWriter_FFMPEG*)storage;
    writer->init();

    const bool color = (isColor != 0);
    if (!writer->open(filename, fourcc, fps, width, height, color))
    {
        writer->close();
        free(writer);
        writer = 0;
    }
    return writer;
}

V
Vadim Pisarevsky 已提交
2179 2180 2181
// Closes and frees the writer referenced by `writer` and resets the caller's
// pointer to 0. A NULL `writer` or NULL `*writer` is ignored.
void cvReleaseVideoWriter_FFMPEG( CvVideoWriter_FFMPEG** writer )
{
    if (!writer || !*writer)
        return;

    CvVideoWriter_FFMPEG* instance = *writer;
    instance->close();
    free(instance);
    *writer = 0;
}


V
Vadim Pisarevsky 已提交
2190 2191 2192
// C-style entry point: forwards all arguments to
// CvVideoWriter_FFMPEG::writeFrame() and returns its result converted to int.
// `writer` is dereferenced unconditionally.
int cvWriteFrame_FFMPEG( CvVideoWriter_FFMPEG* writer,
                         const unsigned char* data, int step,
                         int width, int height, int cn, int origin)
{
    const int written = writer->writeFrame(data, step, width, height, cn, origin);
    return written;
}

2197 2198 2199 2200 2201 2202 2203 2204 2205 2206


/*
 * For CUDA encoder
 */

struct OutputMediaStream_FFMPEG
{
    bool open(const char* fileName, int width, int height, double fps);
    void close();
2207

2208 2209 2210
    void write(unsigned char* data, int size, int keyFrame);

    // add a video output stream to the container
J
jisli 已提交
2211
    static AVStream* addVideoStream(AVFormatContext *oc, CV_CODEC_ID codec_id, int w, int h, int bitrate, double fps, AVPixelFormat pixel_format);
2212 2213 2214 2215 2216 2217 2218 2219 2220 2221 2222 2223 2224 2225 2226 2227 2228 2229 2230 2231 2232 2233 2234 2235 2236 2237 2238 2239 2240 2241 2242 2243 2244 2245 2246 2247 2248 2249 2250 2251 2252 2253 2254 2255 2256 2257

    AVOutputFormat* fmt_;
    AVFormatContext* oc_;
    AVStream* video_st_;
};

void OutputMediaStream_FFMPEG::close()
{
    // no more frame to compress. The codec has a latency of a few
    // frames if using B frames, so we get the last frames by
    // passing the same picture again

    // TODO -- do we need to account for latency here?

    if (oc_)
    {
        // write the trailer, if any
        av_write_trailer(oc_);

        // free the streams
        for (unsigned int i = 0; i < oc_->nb_streams; ++i)
        {
            av_freep(&oc_->streams[i]->codec);
            av_freep(&oc_->streams[i]);
        }

        if (!(fmt_->flags & AVFMT_NOFILE) && oc_->pb)
        {
            // close the output file

            #if LIBAVCODEC_VERSION_INT < ((52<<16)+(123<<8)+0)
                #if LIBAVCODEC_VERSION_INT >= ((51<<16)+(49<<8)+0)
                    url_fclose(oc_->pb);
                #else
                    url_fclose(&oc_->pb);
                #endif
            #else
                avio_close(oc_->pb);
            #endif
        }

        // free the stream
        av_free(oc_);
    }
}

J
jisli 已提交
2258
// Adds a video stream to the container `oc` and fills in its codec context.
//
//   oc            output format context receiving the new stream
//   codec_id      encoder to look up; NULL is returned if none is registered
//   w, h          frame size stored in the codec context
//   bitrate       stored in the codec context unchanged
//   fps           frame rate; converted to a rational time base
//   pixel_format  pixel format stored in the codec context
//
// Returns the new stream, or NULL/0 if the encoder is unknown, the stream
// cannot be created, or no supported frame rate could be selected.
AVStream* OutputMediaStream_FFMPEG::addVideoStream(AVFormatContext *oc, CV_CODEC_ID codec_id, int w, int h, int bitrate, double fps, AVPixelFormat pixel_format)
{
    AVCodec* codec = avcodec_find_encoder(codec_id);
    if (!codec)
    {
        fprintf(stderr, "Could not find encoder for codec id %d\n", codec_id);
        return NULL;
    }

    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 10, 0)
        AVStream* st = avformat_new_stream(oc, 0);
    #else
        AVStream* st = av_new_stream(oc, 0);
    #endif
    if (!st)
        return 0;

    #if LIBAVFORMAT_BUILD > 4628
        AVCodecContext* c = st->codec;
    #else
        AVCodecContext* c = &(st->codec);
    #endif

    c->codec_id = codec_id;
    c->codec_type = AVMEDIA_TYPE_VIDEO;

    // put sample parameters
    // NOTE(review): this function used to compute a bitrate padded by 25% but
    // never used it; the dead computation was removed and the requested
    // bitrate is still stored unchanged. Confirm whether padding was intended.
    c->bit_rate = bitrate;

    // took advice from
    // http://ffmpeg-users.933282.n4.nabble.com/warning-clipping-1-dct-coefficients-to-127-127-td934297.html
    c->qmin = 3;

    // resolution must be a multiple of two
    c->width = w;
    c->height = h;

    // time base: this is the fundamental unit of time (in seconds) in terms
    // of which frame timestamps are represented. for fixed-fps content,
    // timebase should be 1/framerate and timestamp increments should be
    // identically 1

    // Refine frame_rate/frame_rate_base until it is within 0.001 of fps.
    // fabs() has to wrap the whole difference: taken over the ratio alone the
    // loop never ran when rounding went down (29.4 fps ended up as 29/1).
    // A base of 1000 always meets the tolerance for finite fps, so the bound
    // only guarantees termination for non-finite input.
    int frame_rate = static_cast<int>(fps+0.5);
    int frame_rate_base = 1;
    while (frame_rate_base < 1000 &&
           fabs(static_cast<double>(frame_rate)/frame_rate_base - fps) > 0.001)
    {
        frame_rate_base *= 10;
        frame_rate = static_cast<int>(fps*frame_rate_base + 0.5);
    }
    c->time_base.den = frame_rate;
    c->time_base.num = frame_rate_base;

    #if LIBAVFORMAT_BUILD > 4752
        // adjust time base for supported framerates
        if (codec && codec->supported_framerates)
        {
            AVRational req = {frame_rate, frame_rate_base};
            const AVRational* best = NULL;
            AVRational best_error = {INT_MAX, 1};

            // pick the supported rate with the smallest absolute distance to the request
            for (const AVRational* p = codec->supported_framerates; p->den!=0; ++p)
            {
                AVRational error = av_sub_q(req, *p);

                if (error.num < 0)
                    error.num *= -1;

                if (av_cmp_q(error, best_error) < 0)
                {
                    best_error= error;
                    best= p;
                }
            }

            if (best == NULL)
                return NULL;
            // time base is the inverse of the frame rate
            c->time_base.den= best->num;
            c->time_base.num= best->den;
        }
    #endif

    c->gop_size = 12; // emit one intra frame every twelve frames at most
    c->pix_fmt = pixel_format;

    if (c->codec_id == CV_CODEC(CODEC_ID_MPEG2VIDEO))
        c->max_b_frames = 2;

    if (c->codec_id == CV_CODEC(CODEC_ID_MPEG1VIDEO) || c->codec_id == CV_CODEC(CODEC_ID_MSMPEG4V3))
    {
        // needed to avoid using macroblocks in which some coeffs overflow
        // this doesnt happen with normal video, it just happens here as the
        // motion of the chroma plane doesnt match the luma plane

        // avoid FFMPEG warning 'clipping 1 dct coefficients...'

        c->mb_decision = 2;
    }

    #if LIBAVCODEC_VERSION_INT > 0x000409
        // some formats want stream headers to be separate
        if (oc->oformat->flags & AVFMT_GLOBALHEADER)
        {
            c->flags |= CODEC_FLAG_GLOBAL_HEADER;
        }
    #endif

    return st;
}

bool OutputMediaStream_FFMPEG::open(const char* fileName, int width, int height, double fps)
{
    fmt_ = 0;
    oc_ = 0;
    video_st_ = 0;

    // auto detect the output format from the name and fourcc code
    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
        fmt_ = av_guess_format(NULL, fileName, NULL);
    #else
        fmt_ = guess_format(NULL, fileName, NULL);
    #endif
    if (!fmt_)
        return false;

2385
    CV_CODEC_ID codec_id = CV_CODEC(CODEC_ID_H264);
2386 2387 2388 2389 2390 2391 2392 2393 2394 2395 2396 2397 2398 2399 2400 2401 2402

    // alloc memory for context
    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 2, 0)
        oc_ = avformat_alloc_context();
    #else
        oc_ = av_alloc_format_context();
    #endif
    if (!oc_)
        return false;

    // set some options
    oc_->oformat = fmt_;
    snprintf(oc_->filename, sizeof(oc_->filename), "%s", fileName);

    oc_->max_delay = (int)(0.7 * AV_TIME_BASE); // This reduces buffer underrun warnings with MPEG

    // set a few optimal pixel formats for lossless codecs of interest..
J
jisli 已提交
2403
    AVPixelFormat codec_pix_fmt = AV_PIX_FMT_YUV420P;
2404 2405 2406 2407 2408 2409 2410 2411 2412 2413 2414 2415 2416 2417 2418 2419 2420 2421 2422 2423 2424 2425 2426 2427 2428 2429 2430 2431 2432 2433 2434 2435 2436 2437 2438 2439 2440 2441 2442
    int bitrate_scale = 64;

    // TODO -- safe to ignore output audio stream?
    video_st_ = addVideoStream(oc_, codec_id, width, height, width * height * bitrate_scale, fps, codec_pix_fmt);
    if (!video_st_)
        return false;

    // set the output parameters (must be done even if no parameters)
    #if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 2, 0)
        if (av_set_parameters(oc_, NULL) < 0)
            return false;
    #endif

    // now that all the parameters are set, we can open the audio and
    // video codecs and allocate the necessary encode buffers

    #if LIBAVFORMAT_BUILD > 4628
        AVCodecContext* c = (video_st_->codec);
    #else
        AVCodecContext* c = &(video_st_->codec);
    #endif

    c->codec_tag = MKTAG('H', '2', '6', '4');
    c->bit_rate_tolerance = c->bit_rate;

    // open the output file, if needed
    if (!(fmt_->flags & AVFMT_NOFILE))
    {
        #if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 2, 0)
            int err = url_fopen(&oc_->pb, fileName, URL_WRONLY);
        #else
            int err = avio_open(&oc_->pb, fileName, AVIO_FLAG_WRITE);
        #endif

        if (err != 0)
            return false;
    }

    // write the stream header, if any
A
Alexander Alekhin 已提交
2443
    int header_err =
2444 2445 2446 2447 2448
    #if LIBAVFORMAT_BUILD < CALC_FFMPEG_VERSION(53, 2, 0)
        av_write_header(oc_);
    #else
        avformat_write_header(oc_, NULL);
    #endif
A
Alexander Alekhin 已提交
2449 2450
    if (header_err != 0)
        return false;
2451 2452 2453 2454 2455 2456 2457

    return true;
}

void OutputMediaStream_FFMPEG::write(unsigned char* data, int size, int keyFrame)
{
    // if zero size, it means the image was buffered
2458
    if (size > 0)
2459 2460 2461 2462 2463 2464 2465 2466 2467 2468 2469 2470 2471 2472 2473 2474 2475 2476 2477
    {
        AVPacket pkt;
        av_init_packet(&pkt);

        if (keyFrame)
            pkt.flags |= PKT_FLAG_KEY;

        pkt.stream_index = video_st_->index;
        pkt.data = data;
        pkt.size = size;

        // write the compressed frame in the media file
        av_write_frame(oc_, &pkt);
    }
}

// Allocates an OutputMediaStream_FFMPEG with malloc() and opens it. Returns
// the stream on success; returns 0 if the allocation or open() fails (the
// stream is closed and freed in the latter case).
struct OutputMediaStream_FFMPEG* create_OutputMediaStream_FFMPEG(const char* fileName, int width, int height, double fps)
{
    void* storage = malloc(sizeof(OutputMediaStream_FFMPEG));
    if (storage == NULL)
        return 0;

    OutputMediaStream_FFMPEG* stream = (OutputMediaStream_FFMPEG*) storage;
    if (!stream->open(fileName, width, height, fps))
    {
        stream->close();
        free(stream);
        stream = 0;
    }

    return stream;
}

// Closes the stream and frees its storage. A NULL `stream` is ignored, in
// line with cvReleaseCapture_FFMPEG() / cvReleaseVideoWriter_FFMPEG().
void release_OutputMediaStream_FFMPEG(struct OutputMediaStream_FFMPEG* stream)
{
    if (!stream)
        return;

    stream->close();
    free(stream);
}

// C-style entry point: forwards the packet to OutputMediaStream_FFMPEG::write().
// `stream` is dereferenced unconditionally.
void write_OutputMediaStream_FFMPEG(struct OutputMediaStream_FFMPEG* stream, unsigned char* data, int size, int keyFrame)
{
    stream->write(data, size, keyFrame);
}

/*
 * For CUDA decoder
 */

// Codec identifiers reported by InputMediaStream_FFMPEG::open(). Compressed
// codecs are numbered from 0; the uncompressed YUV layouts use a four-character
// code packed with the first character in the most significant byte.
enum
{
    VideoCodec_MPEG1    = 0,
    VideoCodec_MPEG2    = 1,
    VideoCodec_MPEG4    = 2,
    VideoCodec_VC1      = 3,
    VideoCodec_H264     = 4,
    VideoCodec_JPEG     = 5,
    VideoCodec_H264_SVC = 6,
    VideoCodec_H264_MVC = 7,

    // Uncompressed YUV
    VideoCodec_YUV420 = (('I' << 24) | ('Y' << 16) | ('U' << 8) | 'V'),   // Y,U,V (4:2:0)
    VideoCodec_YV12   = (('Y' << 24) | ('V' << 16) | ('1' << 8) | '2'),   // Y,V,U (4:2:0)
    VideoCodec_NV12   = (('N' << 24) | ('V' << 16) | ('1' << 8) | '2'),   // Y,UV  (4:2:0)
    VideoCodec_YUYV   = (('Y' << 24) | ('U' << 16) | ('Y' << 8) | 'V'),   // YUYV/YUY2 (4:2:2)
    VideoCodec_UYVY   = (('U' << 24) | ('Y' << 16) | ('V' << 8) | 'Y')    // UYVY (4:2:2)
};

// Chroma subsampling identifiers reported by InputMediaStream_FFMPEG::open().
enum
{
    VideoChromaFormat_Monochrome = 0,
    VideoChromaFormat_YUV420     = 1,
    VideoChromaFormat_YUV422     = 2,
    VideoChromaFormat_YUV444     = 3
};

// Demuxer-only input stream: read() hands out the compressed packets of the
// first video stream found by open(). Instances are created with malloc(), so
// open() is responsible for initializing the members.
struct InputMediaStream_FFMPEG
{
public:
    // open fileName and report codec, chroma format and coded frame size
    bool open(const char* fileName, int* codec, int* chroma_format, int* width, int* height);

    // close the input and release the last packet
    void close();

    // fetch the next packet of the video stream
    bool read(unsigned char** data, int* size, int* endOfFile);

private:
    // not copyable: declared but not defined here
    InputMediaStream_FFMPEG(const InputMediaStream_FFMPEG&);
    InputMediaStream_FFMPEG& operator =(const InputMediaStream_FFMPEG&);

    AVFormatContext* ctx_;      // demuxer context, 0 when closed
    int video_stream_id_;       // index of the selected video stream, -1 if none
    AVPacket pkt_;              // last packet returned by read()

#if USE_AV_INTERRUPT_CALLBACK
    AVInterruptCallbackMetadata interrupt_metadata;   // timeout state handed to the interrupt callback
#endif
};

bool InputMediaStream_FFMPEG::open(const char* fileName, int* codec, int* chroma_format, int* width, int* height)
{
    int err;

    ctx_ = 0;
    video_stream_id_ = -1;
    memset(&pkt_, 0, sizeof(AVPacket));

2561
#if USE_AV_INTERRUPT_CALLBACK
2562
    /* interrupt callback */
2563
    interrupt_metadata.timeout_after_ms = LIBAVFORMAT_INTERRUPT_OPEN_TIMEOUT_MS;
2564 2565 2566 2567 2568
    get_monotonic_time(&interrupt_metadata.value);

    ctx_ = avformat_alloc_context();
    ctx_->interrupt_callback.callback = _opencv_ffmpeg_interrupt_callback;
    ctx_->interrupt_callback.opaque = &interrupt_metadata;
2569
#endif
2570

2571 2572 2573 2574 2575 2576 2577 2578 2579 2580 2581 2582
    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 13, 0)
        avformat_network_init();
    #endif

    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 6, 0)
        err = avformat_open_input(&ctx_, fileName, 0, 0);
    #else
        err = av_open_input_file(&ctx_, fileName, 0, 0, 0);
    #endif
    if (err < 0)
        return false;

R
Roman Donchenko 已提交
2583
    #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 6, 0)
2584 2585 2586 2587 2588 2589 2590 2591 2592 2593 2594 2595 2596 2597 2598 2599 2600 2601 2602 2603 2604
        err = avformat_find_stream_info(ctx_, 0);
    #else
        err = av_find_stream_info(ctx_);
    #endif
    if (err < 0)
        return false;

    for (unsigned int i = 0; i < ctx_->nb_streams; ++i)
    {
        #if LIBAVFORMAT_BUILD > 4628
            AVCodecContext *enc = ctx_->streams[i]->codec;
        #else
            AVCodecContext *enc = &ctx_->streams[i]->codec;
        #endif

        if (enc->codec_type == AVMEDIA_TYPE_VIDEO)
        {
            video_stream_id_ = static_cast<int>(i);

            switch (enc->codec_id)
            {
2605
            case CV_CODEC(CODEC_ID_MPEG1VIDEO):
2606 2607 2608
                *codec = ::VideoCodec_MPEG1;
                break;

2609
            case CV_CODEC(CODEC_ID_MPEG2VIDEO):
2610 2611 2612
                *codec = ::VideoCodec_MPEG2;
                break;

2613
            case CV_CODEC(CODEC_ID_MPEG4):
2614 2615 2616
                *codec = ::VideoCodec_MPEG4;
                break;

2617
            case CV_CODEC(CODEC_ID_VC1):
2618 2619 2620
                *codec = ::VideoCodec_VC1;
                break;

2621
            case CV_CODEC(CODEC_ID_H264):
2622 2623 2624 2625 2626 2627 2628 2629 2630
                *codec = ::VideoCodec_H264;
                break;

            default:
                return false;
            };

            switch (enc->pix_fmt)
            {
J
jisli 已提交
2631
            case AV_PIX_FMT_YUV420P:
2632 2633 2634
                *chroma_format = ::VideoChromaFormat_YUV420;
                break;

J
jisli 已提交
2635
            case AV_PIX_FMT_YUV422P:
2636 2637 2638
                *chroma_format = ::VideoChromaFormat_YUV422;
                break;

J
jisli 已提交
2639
            case AV_PIX_FMT_YUV444P:
2640 2641 2642 2643 2644 2645 2646 2647 2648 2649 2650 2651 2652 2653 2654 2655 2656 2657 2658
                *chroma_format = ::VideoChromaFormat_YUV444;
                break;

            default:
                return false;
            }

            *width = enc->coded_width;
            *height = enc->coded_height;

            break;
        }
    }

    if (video_stream_id_ < 0)
        return false;

    av_init_packet(&pkt_);

2659 2660 2661 2662 2663
#if USE_AV_INTERRUPT_CALLBACK
    // deactivate interrupt callback
    interrupt_metadata.timeout_after_ms = 0;
#endif

2664 2665 2666 2667 2668 2669 2670 2671 2672 2673 2674 2675 2676 2677 2678 2679
    return true;
}

void InputMediaStream_FFMPEG::close()
{
    if (ctx_)
    {
        #if LIBAVFORMAT_BUILD >= CALC_FFMPEG_VERSION(53, 24, 2)
            avformat_close_input(&ctx_);
        #else
            av_close_input_file(ctx_);
        #endif
    }

    // free last packet if exist
    if (pkt_.data)
P
Peter Rekdal Sunde 已提交
2680
        _opencv_ffmpeg_av_packet_unref(&pkt_);
2681 2682 2683 2684
}

bool InputMediaStream_FFMPEG::read(unsigned char** data, int* size, int* endOfFile)
{
2685 2686 2687 2688 2689 2690 2691 2692
    bool result = false;

#if USE_AV_INTERRUPT_CALLBACK
    // activate interrupt callback
    get_monotonic_time(&interrupt_metadata.value);
    interrupt_metadata.timeout_after_ms = LIBAVFORMAT_INTERRUPT_READ_TIMEOUT_MS;
#endif

2693 2694
    // free last packet if exist
    if (pkt_.data)
P
Peter Rekdal Sunde 已提交
2695
        _opencv_ffmpeg_av_packet_unref(&pkt_);
2696 2697 2698 2699

    // get the next frame
    for (;;)
    {
2700
#if USE_AV_INTERRUPT_CALLBACK
2701 2702 2703 2704
        if(interrupt_metadata.timeout)
        {
            break;
        }
2705
#endif
2706

2707 2708 2709 2710 2711 2712 2713
        int ret = av_read_frame(ctx_, &pkt_);

        if (ret == AVERROR(EAGAIN))
            continue;

        if (ret < 0)
        {
A
Andrey Kamaev 已提交
2714
            if (ret == (int)AVERROR_EOF)
2715
                *endOfFile = true;
2716
            break;
2717 2718 2719 2720
        }

        if (pkt_.stream_index != video_stream_id_)
        {
P
Peter Rekdal Sunde 已提交
2721
            _opencv_ffmpeg_av_packet_unref(&pkt_);
2722 2723 2724
            continue;
        }

2725
        result = true;
2726 2727 2728
        break;
    }

2729 2730 2731 2732 2733 2734 2735 2736 2737 2738 2739
#if USE_AV_INTERRUPT_CALLBACK
    // deactivate interrupt callback
    interrupt_metadata.timeout_after_ms = 0;
#endif

    if (result)
    {
        *data = pkt_.data;
        *size = pkt_.size;
        *endOfFile = false;
    }
2740

2741
    return result;
2742 2743 2744 2745 2746
}

// Allocates an InputMediaStream_FFMPEG with malloc() and opens `fileName`; the
// output parameters are filled in by open(). Returns the stream on success;
// returns 0 if the allocation or open() fails (the stream is closed and freed
// in the latter case).
InputMediaStream_FFMPEG* create_InputMediaStream_FFMPEG(const char* fileName, int* codec, int* chroma_format, int* width, int* height)
{
    void* storage = malloc(sizeof(InputMediaStream_FFMPEG));
    if (storage == NULL)
        return 0;

    InputMediaStream_FFMPEG* stream = (InputMediaStream_FFMPEG*) storage;
    if (!stream->open(fileName, codec, chroma_format, width, height))
    {
        stream->close();
        free(stream);
        stream = 0;
    }

    return stream;
}

// Closes the stream and frees its storage. A NULL `stream` is ignored, in
// line with cvReleaseCapture_FFMPEG() / cvReleaseVideoWriter_FFMPEG().
void release_InputMediaStream_FFMPEG(InputMediaStream_FFMPEG* stream)
{
    if (!stream)
        return;

    stream->close();
    free(stream);
}

// C-style entry point: forwards to InputMediaStream_FFMPEG::read() and returns
// its bool result converted to int. `stream` is dereferenced unconditionally.
int read_InputMediaStream_FFMPEG(InputMediaStream_FFMPEG* stream, unsigned char** data, int* size, int* endOfFile)
{
    return stream->read(data, size, endOfFile);
}