mov.c 72.2 KB
Newer Older
1
/*
2
 * MOV demuxer
3
 * Copyright (c) 2001 Fabrice Bellard
4
 * Copyright (c) 2009 Baptiste Coudurier <baptiste dot coudurier at gmail dot com>
5
 *
6 7 8
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
F
Fabrice Bellard 已提交
9 10
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
11
 * version 2.1 of the License, or (at your option) any later version.
12
 *
13
 * FFmpeg is distributed in the hope that it will be useful,
14
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
F
Fabrice Bellard 已提交
15 16
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
17
 *
F
Fabrice Bellard 已提交
18
 * You should have received a copy of the GNU Lesser General Public
19
 * License along with FFmpeg; if not, write to the Free Software
20
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21
 */
22 23

#include <limits.h>
24

B
Baptiste Coudurier 已提交
25
//#define DEBUG
26 27
//#define DEBUG_METADATA
//#define MOV_EXPORT_ALL_METADATA
28

29
#include "libavutil/intreadwrite.h"
30
#include "libavutil/avstring.h"
31
#include "avformat.h"
32
#include "riff.h"
33
#include "isom.h"
34 35
#include "libavcodec/mpeg4audio.h"
#include "libavcodec/mpegaudiodata.h"
36
#include "libavcodec/bitstream.h"
37

38
#if CONFIG_ZLIB
39 40 41
#include <zlib.h>
#endif

42 43
/*
 * First version by Francois Revol revol@free.fr
44
 * Seek function by Gael Chardon gael.dev@4now.net
45
 *
46
 * Features and limitations:
47
 * - reads most of the QT files I have (at least the structure),
48 49
 *   Sample QuickTime files with mp3 audio can be found at: http://www.3ivx.com/showcase.html
 * - the code is quite ugly... maybe I won't do it recursive next time :-)
50
 *
51 52
 * Funny I didn't know about http://sourceforge.net/projects/qt-ffmpeg/
 * when coding this :) (it's a writer anyway)
53
 *
54 55 56
 * Reference documents:
 * http://www.geocities.com/xhelmboyx/quicktime/formats/qtm-layout.txt
 * Apple:
G
Gael Chardon 已提交
57
 *  http://developer.apple.com/documentation/QuickTime/QTFF/
58
 *  http://developer.apple.com/documentation/QuickTime/QTFF/qtff.pdf
59 60 61
 * QuickTime is a trademark of Apple (AFAIK :))
 */

62 63
#include "qtpalette.h"

G
Gael Chardon 已提交
64

65 66 67
#undef NDEBUG
#include <assert.h>

68 69 70 71
/* XXX: it's the first time I make a recursive parser I think... sorry if it's ugly :P */

/* those functions parse an atom */
/* return code:
B
Baptiste Coudurier 已提交
72
  0: continue to parse next atom
D
Diego Biurrun 已提交
73
 <0: error occurred, exit
B
Baptiste Coudurier 已提交
74
*/
75 76
/* links atom IDs to parse functions */
typedef struct MOVParseTableEntry {
77
    uint32_t type;
78
    int (*parse)(MOVContext *ctx, ByteIOContext *pb, MOVAtom atom);
79 80
} MOVParseTableEntry;

81 82
/* Forward declaration: mov_read_default() scans this table to find the handler for each atom. */
static const MOVParseTableEntry mov_default_parse_table[];

B
Baptiste Coudurier 已提交
83 84 85 86 87 88 89 90 91 92 93 94 95
/**
 * Read a 'trkn' payload and store the track number as "track" metadata.
 *
 * Three 16-bit fields are consumed: an unknown value, the track number and
 * the total number of tracks; only the track number is exported.
 * len is part of the metadata-parser signature but is not used here.
 *
 * @return always 0
 */
static int mov_metadata_trkn(MOVContext *c, ByteIOContext *pb, unsigned len)
{
    char number[16];
    int track;

    get_be16(pb); // unknown
    track = get_be16(pb);
    snprintf(number, sizeof(number), "%d", track);
    av_metadata_set(&c->fc->metadata, "track", number);

    get_be16(pb); // total tracks

    return 0;
}

96 97 98 99 100 101 102 103
/**
 * Parse one metadata atom found inside a 'udta' or 'ilst' container and
 * export its value with av_metadata_set().
 *
 * Known atom types are mapped to metadata keys; 'trkn' is decoded by
 * mov_metadata_trkn() instead of being read as a string. In iTunes mode the
 * value is wrapped in a 'data' atom with a 16-byte header; otherwise, for
 * known keys, the payload starts with a 16-bit string length followed by a
 * 16-bit language code. When a language other than "und" is present the
 * value is also stored under "<key>-<language>".
 *
 * @param c    demuxer context; metadata is stored in c->fc->metadata
 * @param pb   input positioned at the start of the atom payload
 * @param atom atom being parsed (type and payload size)
 * @return 0 on success or when the atom is ignored, -1 if the remaining
 *         atom size is negative
 */
static int mov_read_udta_string(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
#ifdef MOV_EXPORT_ALL_METADATA
    char tmp_key[5];
#endif
    char str[1024], key2[16], language[4] = {0};
    const char *key = NULL;
    uint16_t str_size;
    int (*parse)(MOVContext*, ByteIOContext*, unsigned) = NULL;

    /* str is not filled when a custom parser handles the atom; keep it a
     * valid empty string so the DEBUG_METADATA log never reads garbage */
    str[0] = 0;

    switch (atom.type) {
    case MKTAG(0xa9,'n','a','m'): key = "title";     break;
    case MKTAG(0xa9,'a','u','t'):
    case MKTAG(0xa9,'A','R','T'):
    case MKTAG(0xa9,'w','r','t'): key = "author";    break;
    case MKTAG(0xa9,'c','p','y'): key = "copyright"; break;
    case MKTAG(0xa9,'c','m','t'):
    case MKTAG(0xa9,'i','n','f'): key = "comment";   break;
    case MKTAG(0xa9,'a','l','b'): key = "album";     break;
    case MKTAG(0xa9,'d','a','y'): key = "year";      break;
    case MKTAG(0xa9,'g','e','n'): key = "genre";     break;
    case MKTAG(0xa9,'t','o','o'):
    case MKTAG(0xa9,'e','n','c'): key = "muxer";     break;
    case MKTAG( 't','r','k','n'): key = "track";
        parse = mov_metadata_trkn; break;
    }

    if (c->itunes_metadata && atom.size > 8) {
        int data_size = get_be32(pb);
        int tag = get_le32(pb);
        if (tag == MKTAG('d','a','t','a')) {
            get_be32(pb); // type
            get_be32(pb); // unknown
            /* a 'data' atom smaller than its own 16-byte header is broken;
             * data_size - 16 would wrap in the 16-bit length below */
            if (data_size < 16)
                return 0;
            str_size = data_size - 16;
            atom.size -= 16;
        } else return 0;
    } else if (atom.size > 4 && key && !c->itunes_metadata) {
        str_size = get_be16(pb); // string length
        ff_mov_lang_to_iso639(get_be16(pb), language);
        atom.size -= 4;
    } else
        str_size = atom.size;

#ifdef MOV_EXPORT_ALL_METADATA
    if (!key) {
        snprintf(tmp_key, 5, "%.4s", (char*)&atom.type);
        key = tmp_key;
    }
#endif

    if (!key)
        return 0;
    if (atom.size < 0)
        return -1;

    /* never read more than the buffer holds or the atom contains */
    str_size = FFMIN3(sizeof(str)-1, str_size, atom.size);

    if (parse)
        parse(c, pb, str_size);
    else {
        get_buffer(pb, str, str_size);
        str[str_size] = 0;
        av_metadata_set(&c->fc->metadata, key, str);
        if (*language && strcmp(language, "und")) {
            snprintf(key2, sizeof(key2), "%s-%s", key, language);
            av_metadata_set(&c->fc->metadata, key2, str);
        }
    }
#ifdef DEBUG_METADATA
    av_log(c->fc, AV_LOG_DEBUG, "lang \"%3s\" ", language);
    av_log(c->fc, AV_LOG_DEBUG, "tag \"%s\" value \"%s\" atom \"%.4s\" %d %"PRId64"\n",
           key, str, (char*)&atom.type, str_size, atom.size);
#endif

    return 0;
}
172

173
/**
 * Walk the child atoms of a container atom and dispatch each to its parser.
 *
 * For every child the 8-byte header (32-bit size, 32-bit type) is read; a
 * size of 1 selects the 64-bit extended size and a size of 0 means "up to
 * the end of the parent". Handlers are looked up in mov_default_parse_table;
 * unknown children of 'udta' and 'ilst' go to mov_read_udta_string(), any
 * other unknown child is skipped. Bytes a handler leaves unread are skipped.
 *
 * @param c    demuxer context
 * @param pb   input positioned at the first child atom
 * @param atom container atom; a negative size is treated as INT64_MAX
 * @return 0 on success, otherwise the error returned by a child parser
 */
static int mov_read_default(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    int64_t consumed = 0;   /* bytes of the container accounted for so far */
    MOVAtom child;
    int ret = 0;

    child.offset = atom.offset;

    if (atom.size < 0)
        atom.size = INT64_MAX;

    while (consumed + 8 < atom.size && !url_feof(pb) && !ret) {
        int (*handler)(MOVContext*, ByteIOContext*, MOVAtom) = NULL;
        const MOVParseTableEntry *entry;

        child.size = atom.size;
        child.type = 0;
        if (atom.size >= 8) {
            child.size = get_be32(pb);
            child.type = get_le32(pb);
        }
        consumed     += 8;
        child.offset += 8;
        dprintf(c->fc, "type: %08x  %.4s  sz: %"PRIx64"  %"PRIx64"   %"PRIx64"\n",
                child.type, (char*)&child.type, child.size, atom.size, consumed);

        if (child.size == 1) { /* 64 bit extended size */
            child.size    = get_be64(pb) - 8;
            child.offset += 8;
            consumed     += 8;
        }
        if (child.size == 0) { /* child extends to the end of its parent */
            child.size = atom.size - consumed;
            if (child.size <= 8)
                break;
        }

        /* from here on child.size is the payload size, header excluded */
        child.size -= 8;
        if (child.size < 0)
            break;
        child.size = FFMIN(child.size, atom.size - consumed);

        for (entry = mov_default_parse_table; entry->type; entry++) {
            if (entry->type == child.type) {
                handler = entry->parse;
                break;
            }
        }

        // container is user data
        if (!handler && (atom.type == MKTAG('u','d','t','a') ||
                         atom.type == MKTAG('i','l','s','t')))
            handler = mov_read_udta_string;

        if (handler) {
            int64_t start_pos = url_ftell(pb);
            int64_t left;

            ret = handler(c, pb, child);
            /* on streamed input stop once both moov and mdat have been seen */
            if (url_is_streamed(pb) && c->found_moov && c->found_mdat)
                break;
            left = child.size - url_ftell(pb) + start_pos;
            if (left > 0) /* skip garbage at atom end */
                url_fskip(pb, left);
        } else {
            /* skip leaf atoms data */
            url_fskip(pb, child.size);
        }

        child.offset += child.size;
        consumed     += child.size;
    }

    if (!ret && consumed < atom.size && atom.size < 0x7ffff)
        url_fskip(pb, atom.size - consumed);

    return ret;
}

245
/**
 * Parse the data reference atom of the most recently added stream.
 *
 * Allocates sc->drefs with one entry per reference. For 'alis' entries
 * larger than 150 bytes the Macintosh alias record is scanned for an
 * absolute path (record type 2); the volume name prefix is removed from it
 * and ':' separators are turned into '/'.
 *
 * @param c    demuxer context
 * @param pb   input positioned at the start of the atom payload
 * @param atom atom being parsed (unused)
 * @return 0 on success or when no stream exists yet, -1 on an implausible
 *         entry count, AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_dref(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    int entries, i, j;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_be32(pb); // version + flags
    entries = get_be32(pb);
    if (entries >= UINT_MAX / sizeof(*sc->drefs))
        return -1;
    sc->drefs = av_mallocz(entries * sizeof(*sc->drefs));
    if (!sc->drefs)
        return AVERROR(ENOMEM);
    sc->drefs_count = entries;

    for (i = 0; i < sc->drefs_count; i++) {
        MOVDref *dref = &sc->drefs[i];
        uint32_t size = get_be32(pb);
        int64_t next = url_ftell(pb) + size - 4;

        dref->type = get_le32(pb);
        get_be32(pb); // version + flags
        dprintf(c->fc, "type %.4s size %d\n", (char*)&dref->type, size);

        if (dref->type == MKTAG('a','l','i','s') && size > 150) {
            /* macintosh alias record */
            uint16_t volume_len;
            int len; /* wider than 16 bits so padding 65535 to even cannot wrap to 0 */
            char volume[28] = {0};
            int16_t type;

            url_fskip(pb, 10);

            volume_len = get_byte(pb);
            volume_len = FFMIN(volume_len, 27);
            get_buffer(pb, volume, 27);
            volume[volume_len] = 0;
            av_log(c->fc, AV_LOG_DEBUG, "volume %s, len %d\n", volume, volume_len);

            url_fskip(pb, 112);

            /* stop at end of input: on a truncated file the position no
             * longer advances and the loop would otherwise never end */
            for (type = 0; type != -1 && url_ftell(pb) < next && !url_feof(pb); ) {
                type = get_be16(pb);
                len = get_be16(pb);
                av_log(c->fc, AV_LOG_DEBUG, "type %d, len %d\n", type, len);
                if (len&1)
                    len += 1;
                if (type == 2) { // absolute path
                    av_free(dref->path);
                    dref->path = av_mallocz(len+1);
                    if (!dref->path)
                        return AVERROR(ENOMEM);
                    get_buffer(pb, dref->path, len);
                    if (len > volume_len && !strncmp(dref->path, volume, volume_len)) {
                        len -= volume_len;
                        memmove(dref->path, dref->path+volume_len, len);
                        dref->path[len] = 0;
                    }
                    for (j = 0; j < len; j++)
                        if (dref->path[j] == ':')
                            dref->path[j] = '/';
                    av_log(c->fc, AV_LOG_DEBUG, "path %s\n", dref->path);
                } else
                    url_fskip(pb, len);
            }
        }
        url_fseek(pb, next, SEEK_SET);
    }
    return 0;
}

315
/**
 * Parse a handler reference atom and derive the codec type of the most
 * recently added stream from the component subtype.
 *
 * 'vide', 'soun' and 'subp' select video, audio and subtitle; 'm1a ' sets
 * the codec id to MP2. Bytes left in the atom after the fixed fields are
 * skipped.
 *
 * @return always 0 (also when no stream exists yet)
 */
static int mov_read_hdlr(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    uint32_t subtype;
    uint32_t ctype;

    if (c->fc->nb_streams < 1) // meta before first trak
        return 0;

    st = c->fc->streams[c->fc->nb_streams-1];

    get_byte(pb); /* version */
    get_be24(pb); /* flags */

    ctype   = get_le32(pb); /* component type */
    subtype = get_le32(pb); /* component subtype */

    dprintf(c->fc, "ctype= %.4s (0x%08x)\n", (char*)&ctype, ctype);
    dprintf(c->fc, "stype= %.4s\n", (char*)&subtype);

    switch (subtype) {
    case MKTAG('v','i','d','e'):
        st->codec->codec_type = CODEC_TYPE_VIDEO;
        break;
    case MKTAG('s','o','u','n'):
        st->codec->codec_type = CODEC_TYPE_AUDIO;
        break;
    case MKTAG('m','1','a',' '):
        st->codec->codec_id = CODEC_ID_MP2;
        break;
    case MKTAG('s','u','b','p'):
        st->codec->codec_type = CODEC_TYPE_SUBTITLE;
        break;
    default:
        break;
    }

    get_be32(pb); /* component  manufacture */
    get_be32(pb); /* component flags */
    get_be32(pb); /* component flags mask */

    /* anything beyond the 24 bytes of fixed fields is skipped */
    if (atom.size > 24)
        url_fskip(pb, atom.size - (url_ftell(pb) - atom.offset));

    return 0;
}

B
Baptiste Coudurier 已提交
356
/**
 * Read a variable-length descriptor size.
 *
 * Each byte contributes its low 7 bits, most significant group first; a
 * clear top bit ends the value. At most 4 bytes are consumed.
 *
 * @return the decoded length
 */
static int mp4_read_descr_len(ByteIOContext *pb)
{
    int value = 0;
    int i;

    for (i = 0; i < 4; i++) {
        int byte = get_byte(pb);

        value = (value << 7) | (byte & 0x7f);
        if (!(byte & 0x80)) /* continuation bit clear: last byte */
            break;
    }
    return value;
}

B
Baptiste Coudurier 已提交
369
/**
 * Read a descriptor header: a one-byte tag followed by a variable-length size.
 *
 * @param c   demuxer context, used for debug logging only
 * @param pb  input positioned at the descriptor tag
 * @param tag receives the descriptor tag
 * @return the descriptor length as decoded by mp4_read_descr_len()
 */
static int mp4_read_descr(MOVContext *c, ByteIOContext *pb, int *tag)
{
    int size;

    *tag = get_byte(pb);
    size = mp4_read_descr_len(pb);
    dprintf(c->fc, "MPEG4 description: tag=0x%02x len=%d\n", *tag, size);

    return size;
}

378 379 380 381
/* Descriptor tag values that mov_read_esds() compares against the tag
 * returned by mp4_read_descr(). */
#define MP4ESDescrTag                   0x03
#define MP4DecConfigDescrTag            0x04
#define MP4DecSpecificDescrTag          0x05

382
static const AVCodecTag mp4_audio_types[] = {
383 384 385 386 387
    { CODEC_ID_MP3ON4, AOT_PS   }, /* old mp3on4 draft */
    { CODEC_ID_MP3ON4, AOT_L1   }, /* layer 1 */
    { CODEC_ID_MP3ON4, AOT_L2   }, /* layer 2 */
    { CODEC_ID_MP3ON4, AOT_L3   }, /* layer 3 */
    { CODEC_ID_NONE,   AOT_NULL },
388 389
};

390
/**
 * Parse an 'esds' atom: walk the ES, decoder-config and decoder-specific
 * descriptors and configure the most recently added stream from them.
 *
 * The object type id selects the codec id; the decoder-specific descriptor
 * becomes the codec extradata. For AAC the audio config is additionally
 * decoded to set channel count and sample rate, and the codec id is switched
 * to MP3-on-MP4 for the object types listed in mp4_audio_types.
 *
 * @return 0 on success or when no stream exists yet, -1 on an oversized
 *         descriptor or unsupported channel configuration,
 *         AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_esds(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    int tag, len;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    get_be32(pb); /* version + flags */
    len = mp4_read_descr(c, pb, &tag);
    if (tag == MP4ESDescrTag) {
        get_be16(pb); /* ID */
        get_byte(pb); /* priority */
    } else
        get_be16(pb); /* ID */

    len = mp4_read_descr(c, pb, &tag);
    if (tag == MP4DecConfigDescrTag) {
        int object_type_id = get_byte(pb);
        get_byte(pb); /* stream type */
        get_be24(pb); /* buffer size db */
        get_be32(pb); /* max bitrate */
        get_be32(pb); /* avg bitrate */

        st->codec->codec_id= codec_get_id(ff_mp4_obj_type, object_type_id);
        dprintf(c->fc, "esds object type id %d\n", object_type_id);
        len = mp4_read_descr(c, pb, &tag);
        if (tag == MP4DecSpecificDescrTag) {
            dprintf(c->fc, "Specific MPEG4 header len=%d\n", len);
            if((uint64_t)len > (1<<30))
                return -1;
            /* release extradata set by an earlier atom, as smi/wave/glbl do,
             * and keep the size consistent if the allocation fails */
            av_free(st->codec->extradata);
            st->codec->extradata_size = 0;
            st->codec->extradata = av_mallocz(len + FF_INPUT_BUFFER_PADDING_SIZE);
            if (!st->codec->extradata)
                return AVERROR(ENOMEM);
            get_buffer(pb, st->codec->extradata, len);
            st->codec->extradata_size = len;
            if (st->codec->codec_id == CODEC_ID_AAC) {
                MPEG4AudioConfig cfg;
                ff_mpeg4audio_get_config(&cfg, st->codec->extradata,
                                         st->codec->extradata_size);
                /* chan_config indexes ff_mpeg4audio_channels below */
                if (cfg.chan_config > 7)
                    return -1;
                st->codec->channels = ff_mpeg4audio_channels[cfg.chan_config];
                if (cfg.object_type == 29 && cfg.sampling_index < 3) // old mp3on4
                    st->codec->sample_rate = ff_mpa_freq_tab[cfg.sampling_index];
                else
                    st->codec->sample_rate = cfg.sample_rate; // ext sample rate ?
                dprintf(c->fc, "mp4a config channels %d obj %d ext obj %d "
                        "sample rate %d ext sample rate %d\n", st->codec->channels,
                        cfg.object_type, cfg.ext_object_type,
                        cfg.sample_rate, cfg.ext_sample_rate);
                /* fall back to AAC when the object type is not in the table */
                if (!(st->codec->codec_id = codec_get_id(mp4_audio_types,
                                                         cfg.object_type)))
                    st->codec->codec_id = CODEC_ID_AAC;
            }
        }
    }
    return 0;
}

447 448 449 450 451 452
/**
 * Parse a 'pasp' atom and set the sample aspect ratio of the most recently
 * added stream.
 *
 * A zero denominator leaves the stream untouched. A warning is logged when
 * the stream already carries a different, non-default ratio.
 *
 * @return always 0
 */
static int mov_read_pasp(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    const int num = get_be32(pb);
    const int den = get_be32(pb);
    AVStream *st;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if (den != 0) {
        if ((st->sample_aspect_ratio.den != 1 || st->sample_aspect_ratio.num) && // default
            (den != st->sample_aspect_ratio.den || num != st->sample_aspect_ratio.num))
            av_log(c->fc, AV_LOG_WARNING,
                   "sample aspect ratio already set to %d:%d, overriding by 'pasp' atom\n",
                   st->sample_aspect_ratio.num, st->sample_aspect_ratio.den);
        st->sample_aspect_ratio.num = num;
        st->sample_aspect_ratio.den = den;
    }
    return 0;
}

464
/* this atom contains actual media data */
465
static int mov_read_mdat(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
466
{
467 468 469 470 471 472
    if(atom.size == 0) /* wrong one (MP4) */
        return 0;
    c->found_mdat=1;
    return 0; /* now go for moov */
}

473
/**
 * Parse the file type atom.
 *
 * Any major brand other than 'qt  ' marks the file as ISO media (c->isom).
 * The minor version is read and ignored and the rest of the atom is skipped.
 *
 * @return always 0
 */
static int mov_read_ftyp(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    uint32_t major_brand = get_le32(pb);
    const int is_quicktime = major_brand == MKTAG('q','t',' ',' ');

    if (!is_quicktime)
        c->isom = 1;

    av_log(c->fc, AV_LOG_DEBUG, "ISO: File Type Major Brand: %.4s\n",(char *)&major_brand);

    get_be32(pb); /* minor version */
    url_fskip(pb, atom.size - 8); /* 8 bytes (brand + version) already consumed */

    return 0;
}

485
/* this atom should contain all header atoms */
486
static int mov_read_moov(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
487
{
488 489
    if (mov_read_default(c, pb, atom) < 0)
        return -1;
490 491 492 493 494 495
    /* we parsed the 'moov' atom, we can terminate the parsing as soon as we find the 'mdat' */
    /* so we don't parse the whole file if over a network */
    c->found_moov=1;
    return 0; /* now go for mdat */
}

496
/**
 * Parse a movie fragment atom: record where the 'moof' starts, then parse
 * its children with mov_read_default().
 *
 * @return the result of mov_read_default()
 */
static int mov_read_moof(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    int ret;

    /* the 8-byte atom header has already been consumed */
    c->fragment.moof_offset = url_ftell(pb) - 8;
    dprintf(c->fc, "moof offset %llx\n", c->fragment.moof_offset);

    ret = mov_read_default(c, pb, atom);
    return ret;
}
502

503
/**
 * Parse the media header atom of the most recently added stream.
 *
 * Stores the media time scale in the stream context and the duration in the
 * stream, and exports the language as "language" metadata when
 * ff_mov_lang_to_iso639() can convert it. Version 1 atoms use 64-bit time
 * and duration fields, version 0 atoms 32-bit ones.
 *
 * @return 0 on success or when no stream exists yet, -1 for an unsupported
 *         version
 */
static int mov_read_mdhd(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    int version;
    char language[4] = {0};
    unsigned lang;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    version = get_byte(pb);
    if (version > 1)
        return -1; /* unsupported */

    get_be24(pb); /* flags */
    if (version == 1) {
        get_be64(pb); /* creation time */
        get_be64(pb); /* modification time */
    } else {
        get_be32(pb); /* creation time */
        get_be32(pb); /* modification time */
    }

    sc->time_scale = get_be32(pb);
    st->duration = (version == 1) ? get_be64(pb) : get_be32(pb); /* duration */

    lang = get_be16(pb); /* language */
    if (ff_mov_lang_to_iso639(lang, language))
        av_metadata_set(&st->metadata, "language", language);
    get_be16(pb); /* quality */

    return 0;
}

534
/**
 * Parse the movie header atom.
 *
 * Only the movie time scale and duration are kept (in c->time_scale and
 * c->duration); every other field is read or skipped and discarded.
 * Version 1 atoms use 64-bit time and duration fields.
 *
 * @return always 0
 */
static int mov_read_mvhd(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    const int version = get_byte(pb); /* version */
    const int wide    = version == 1; /* 64-bit times and duration */
    int i;

    get_be24(pb); /* flags */

    if (wide) {
        get_be64(pb); /* creation time */
        get_be64(pb); /* modification time */
    } else {
        get_be32(pb); /* creation time */
        get_be32(pb); /* modification time */
    }

    c->time_scale = get_be32(pb); /* time scale */
    dprintf(c->fc, "time scale = %i\n", c->time_scale);

    if (wide)
        c->duration = get_be64(pb); /* duration */
    else
        c->duration = get_be32(pb); /* duration */

    get_be32(pb); /* preferred scale */
    get_be16(pb); /* preferred volume */

    url_fskip(pb, 10); /* reserved */
    url_fskip(pb, 36); /* display matrix */

    /* preview time, preview duration, poster time, selection time,
     * selection duration, current time, next track ID */
    for (i = 0; i < 7; i++)
        get_be32(pb);

    return 0;
}

570
/**
 * Parse an SMI atom into the extradata of the most recently added stream.
 *
 * The SVQ3 decoder currently expects a full STSD header, so one is faked:
 * the atom payload is stored at offset 0x5a of a zeroed buffer that starts
 * with "SVQ3". This should be fixed so that only the SMI header is passed.
 *
 * @return 0 on success or when no stream exists yet, -1 on an implausible
 *         atom size, AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_smi(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if((uint64_t)atom.size > (1<<30))
        return -1;

    av_free(st->codec->extradata);
    st->codec->extradata_size = 0; /* stays consistent if the allocation fails */
    st->codec->extradata = av_mallocz(atom.size + 0x5a + FF_INPUT_BUFFER_PADDING_SIZE);
    if (!st->codec->extradata)
        return AVERROR(ENOMEM);
    st->codec->extradata_size = 0x5a + atom.size;
    memcpy(st->codec->extradata, "SVQ3", 4); // fake
    get_buffer(pb, st->codec->extradata + 0x5a, atom.size);
    dprintf(c->fc, "Reading SMI %"PRId64"  %s\n", atom.size, st->codec->extradata + 0x5a);
    return 0;
}
589

590
/**
 * Parse an 'enda' atom: when it carries the value 1, switch the
 * big-endian PCM codec id of the most recently added stream to its
 * little-endian counterpart (S24, S32, F32 and F64 only).
 *
 * @return always 0
 */
static int mov_read_enda(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    int little_endian;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    little_endian = get_be16(pb);
    dprintf(c->fc, "enda %d\n", little_endian);
    if (little_endian == 1) {
        switch (st->codec->codec_id) {
        case CODEC_ID_PCM_S24BE:
            st->codec->codec_id = CODEC_ID_PCM_S24LE;
            break;
        case CODEC_ID_PCM_S32BE:
            st->codec->codec_id = CODEC_ID_PCM_S32LE;
            break;
        case CODEC_ID_PCM_F32BE:
            st->codec->codec_id = CODEC_ID_PCM_F32LE;
            break;
        case CODEC_ID_PCM_F64BE:
            st->codec->codec_id = CODEC_ID_PCM_F64LE;
            break;
        default:
            break;
        }
    }
    return 0;
}

617
/* FIXME modify qdm2/svq3/h264 decoders to take full atom as extradata */
618
static int mov_read_extradata(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
619
{
620 621
    AVStream *st;
    uint64_t size;
622
    uint8_t *buf;
623 624 625 626 627

    if (c->fc->nb_streams < 1) // will happen with jp2 files
        return 0;
    st= c->fc->streams[c->fc->nb_streams-1];
    size= (uint64_t)st->codec->extradata_size + atom.size + 8 + FF_INPUT_BUFFER_PADDING_SIZE;
628
    if(size > INT_MAX || (uint64_t)atom.size > INT_MAX)
629
        return -1;
630 631 632 633 634 635 636 637 638
    buf= av_realloc(st->codec->extradata, size);
    if(!buf)
        return -1;
    st->codec->extradata= buf;
    buf+= st->codec->extradata_size;
    st->codec->extradata_size= size - FF_INPUT_BUFFER_PADDING_SIZE;
    AV_WB32(       buf    , atom.size + 8);
    AV_WL32(       buf + 4, atom.type);
    get_buffer(pb, buf + 8, atom.size);
639 640 641
    return 0;
}

642
/**
 * Parse a 'wave' atom of the most recently added stream.
 *
 * For QDM2 the complete atom payload becomes the codec extradata (the
 * decoder needs all of it). For other codecs, atoms larger than 8 bytes are
 * parsed as containers (to reach frma, esds, ...) and smaller ones are skipped.
 *
 * @return 0 on success or when no stream exists yet, -1 on an implausible
 *         atom size or a failure in a child atom, AVERROR(ENOMEM) on
 *         allocation failure
 */
static int mov_read_wave(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if((uint64_t)atom.size > (1<<30))
        return -1;

    if (st->codec->codec_id == CODEC_ID_QDM2) {
        // pass all frma atom to codec, needed at least for QDM2
        av_free(st->codec->extradata);
        st->codec->extradata_size = 0; /* stays consistent if the allocation fails */
        st->codec->extradata = av_mallocz(atom.size + FF_INPUT_BUFFER_PADDING_SIZE);
        if (!st->codec->extradata)
            return AVERROR(ENOMEM);
        st->codec->extradata_size = atom.size;
        get_buffer(pb, st->codec->extradata, atom.size);
    } else if (atom.size > 8) { /* to read frma, esds atoms */
        if (mov_read_default(c, pb, atom) < 0)
            return -1;
    } else
        url_fskip(pb, atom.size);
    return 0;
}

665 666 667 668
/**
 * This function reads atom content and puts data in extradata without tag
 * nor size unlike mov_read_extradata.
 */
669
static int mov_read_glbl(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
670 671 672
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];

673 674 675
    if((uint64_t)atom.size > (1<<30))
        return -1;

676
    av_free(st->codec->extradata);
677 678 679
    st->codec->extradata = av_mallocz(atom.size + FF_INPUT_BUFFER_PADDING_SIZE);
    if (!st->codec->extradata)
        return AVERROR(ENOMEM);
680
    st->codec->extradata_size = atom.size;
681
    get_buffer(pb, st->codec->extradata, atom.size);
682 683 684
    return 0;
}

685
/**
 * Parse a chunk offset atom ('stco' with 32-bit offsets or 'co64' with
 * 64-bit offsets) into sc->chunk_offsets of the most recently added stream.
 *
 * The atom type is validated before anything is allocated so that
 * chunk_count never describes an uninitialised table.
 *
 * @return 0 on success or when no stream exists yet, -1 on an unsupported
 *         atom type or implausible entry count, AVERROR(ENOMEM) on
 *         allocation failure
 */
static int mov_read_stco(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries;

    /* same guard as mov_read_hdlr(): without a stream, streams[-1] would be read */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    if (atom.type != MKTAG('s','t','c','o') &&
        atom.type != MKTAG('c','o','6','4'))
        return -1;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */

    entries = get_be32(pb);

    /* keep entries * sizeof(int64_t) from overflowing */
    if(entries >= UINT_MAX/sizeof(int64_t))
        return -1;

    sc->chunk_offsets = av_malloc(entries * sizeof(int64_t));
    if (!sc->chunk_offsets)
        return AVERROR(ENOMEM);
    sc->chunk_count = entries;

    if (atom.type == MKTAG('s','t','c','o'))
        for(i=0; i<entries; i++)
            sc->chunk_offsets[i] = get_be32(pb);
    else
        for(i=0; i<entries; i++)
            sc->chunk_offsets[i] = get_be64(pb);

    return 0;
}

716 717 718 719
/**
 * Compute codec id for 'lpcm' tag.
 * See CoreAudioTypes and AudioStreamBasicDescription at Apple.
 */
D
Diego Pettenò 已提交
720
static enum CodecID mov_get_lpcm_codec_id(int bps, int flags)
721 722 723 724
{
    if (flags & 1) { // floating point
        if (flags & 2) { // big endian
            if      (bps == 32) return CODEC_ID_PCM_F32BE;
725
            else if (bps == 64) return CODEC_ID_PCM_F64BE;
726
        } else {
727 728
            if      (bps == 32) return CODEC_ID_PCM_F32LE;
            else if (bps == 64) return CODEC_ID_PCM_F64LE;
729 730 731 732 733 734 735 736 737 738 739 740 741 742
        }
    } else {
        if (flags & 2) {
            if      (bps == 8)
                // signed integer
                if (flags & 4)  return CODEC_ID_PCM_S8;
                else            return CODEC_ID_PCM_U8;
            else if (bps == 16) return CODEC_ID_PCM_S16BE;
            else if (bps == 24) return CODEC_ID_PCM_S24BE;
            else if (bps == 32) return CODEC_ID_PCM_S32BE;
        } else {
            if      (bps == 8)
                if (flags & 4)  return CODEC_ID_PCM_S8;
                else            return CODEC_ID_PCM_U8;
B
Baptiste Coudurier 已提交
743
            else if (bps == 16) return CODEC_ID_PCM_S16LE;
744 745 746 747
            else if (bps == 24) return CODEC_ID_PCM_S24LE;
            else if (bps == 32) return CODEC_ID_PCM_S32LE;
        }
    }
D
Diego Pettenò 已提交
748
    return CODEC_ID_NONE;
749 750
}

751
/**
 * Parse the sample description ('stsd') atom of the most recently
 * created stream.
 *
 * For every entry the common header (size, format fourcc, data reference
 * index) is read, the codec id and codec type are derived from the
 * fourcc, and the type specific part (video, audio or subtitle) is
 * parsed. Any bytes left in the entry are handed to mov_read_default()
 * so that extension atoms get parsed too. After the loop a few codec
 * specific parameters are fixed up.
 *
 * @return 0 on success or when there is no stream to describe,
 *         AVERROR(ENOMEM) if the palette cannot be allocated,
 *         -1 on other errors
 */
static int mov_read_stsd(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    int j, entries, pseudo_stream_id;

    /* without a stream there is nothing to describe and
     * streams[nb_streams-1] would be an out of bounds access */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */

    entries = get_be32(pb);

    for(pseudo_stream_id=0; pseudo_stream_id<entries; pseudo_stream_id++) {
        //Parsing Sample description table
        enum CodecID id;
        int dref_id;
        MOVAtom a = { 0, 0, 0 };
        int64_t start_pos = url_ftell(pb);
        int size = get_be32(pb); /* size */
        uint32_t format = get_le32(pb); /* data format */

        get_be32(pb); /* reserved */
        get_be16(pb); /* reserved */
        dref_id = get_be16(pb);

        if (st->codec->codec_tag &&
            st->codec->codec_tag != format &&
            (c->fc->video_codec_id ? codec_get_id(codec_movvideo_tags, format) != c->fc->video_codec_id
                                   : st->codec->codec_tag != MKTAG('j','p','e','g'))
           ){
            /* Multiple fourcc, we skip JPEG. This is not correct, we should
             * export it as a separate AVStream but this needs a few changes
             * in the MOV demuxer, patch welcome. */
            av_log(c->fc, AV_LOG_WARNING, "multiple fourcc not supported\n");
            url_fskip(pb, size - (url_ftell(pb) - start_pos));
            continue;
        }
        /* -1 when a previous entry already set the codec tag */
        sc->pseudo_stream_id = st->codec->codec_tag ? -1 : pseudo_stream_id;
        sc->dref_id= dref_id;

        st->codec->codec_tag = format;
        id = codec_get_id(codec_movaudio_tags, format);
        /* fourcc starting with "ms": the remaining bytes are looked up
         * in the wav tag table */
        if (id<=0 && (format&0xFFFF) == 'm'+('s'<<8))
            id = codec_get_id(codec_wav_tags, bswap_32(format)&0xFFFF);

        if (st->codec->codec_type != CODEC_TYPE_VIDEO && id > 0) {
            st->codec->codec_type = CODEC_TYPE_AUDIO;
        } else if (st->codec->codec_type != CODEC_TYPE_AUDIO && /* do not overwrite codec type */
                   format && format != MKTAG('m','p','4','s')) { /* skip old asf mpeg4 tag */
            id = codec_get_id(codec_movvideo_tags, format);
            if (id <= 0)
                id = codec_get_id(codec_bmp_tags, format);
            if (id > 0)
                st->codec->codec_type = CODEC_TYPE_VIDEO;
            else if(st->codec->codec_type == CODEC_TYPE_DATA){
                id = codec_get_id(ff_codec_movsubtitle_tags, format);
                if(id > 0)
                    st->codec->codec_type = CODEC_TYPE_SUBTITLE;
            }
        }

        dprintf(c->fc, "size=%d 4CC= %c%c%c%c codec_type=%d\n", size,
                (format >> 0) & 0xff, (format >> 8) & 0xff, (format >> 16) & 0xff,
                (format >> 24) & 0xff, st->codec->codec_type);

        if(st->codec->codec_type==CODEC_TYPE_VIDEO) {
            uint8_t codec_name[32];
            unsigned int color_depth;
            int color_greyscale;

            st->codec->codec_id = id;
            get_be16(pb); /* version */
            get_be16(pb); /* revision level */
            get_be32(pb); /* vendor */
            get_be32(pb); /* temporal quality */
            get_be32(pb); /* spatial quality */

            st->codec->width = get_be16(pb); /* width */
            st->codec->height = get_be16(pb); /* height */

            get_be32(pb); /* horiz resolution */
            get_be32(pb); /* vert resolution */
            get_be32(pb); /* data size, always 0 */
            get_be16(pb); /* frames per samples */

            get_buffer(pb, codec_name, 32); /* codec name, pascal string */
            if (codec_name[0] <= 31) {
                memcpy(st->codec->codec_name, &codec_name[1],codec_name[0]);
                st->codec->codec_name[codec_name[0]] = 0;
            }

            st->codec->bits_per_coded_sample = get_be16(pb); /* depth */
            st->codec->color_table_id = get_be16(pb); /* colortable id */
            dprintf(c->fc, "depth %d, ctab id %d\n",
                   st->codec->bits_per_coded_sample, st->codec->color_table_id);
            /* figure out the palette situation */
            color_depth = st->codec->bits_per_coded_sample & 0x1F;
            color_greyscale = st->codec->bits_per_coded_sample & 0x20;

            /* if the depth is 2, 4, or 8 bpp, file is palettized */
            if ((color_depth == 2) || (color_depth == 4) ||
                (color_depth == 8)) {
                /* for palette traversal */
                unsigned int color_start, color_count, color_end;
                unsigned char r, g, b;

                st->codec->palctrl = av_malloc(sizeof(*st->codec->palctrl));
                /* every branch below writes through palctrl */
                if (!st->codec->palctrl)
                    return AVERROR(ENOMEM);
                if (color_greyscale) {
                    int color_index, color_dec;
                    /* compute the greyscale palette */
                    st->codec->bits_per_coded_sample = color_depth;
                    color_count = 1 << color_depth;
                    color_index = 255;
                    color_dec = 256 / (color_count - 1);
                    for (j = 0; j < color_count; j++) {
                        r = g = b = color_index;
                        st->codec->palctrl->palette[j] =
                            (r << 16) | (g << 8) | (b);
                        color_index -= color_dec;
                        if (color_index < 0)
                            color_index = 0;
                    }
                } else if (st->codec->color_table_id) {
                    const uint8_t *color_table;
                    /* if flag bit 3 is set, use the default palette */
                    color_count = 1 << color_depth;
                    if (color_depth == 2)
                        color_table = ff_qt_default_palette_4;
                    else if (color_depth == 4)
                        color_table = ff_qt_default_palette_16;
                    else
                        color_table = ff_qt_default_palette_256;

                    for (j = 0; j < color_count; j++) {
                        r = color_table[j * 4 + 0];
                        g = color_table[j * 4 + 1];
                        b = color_table[j * 4 + 2];
                        st->codec->palctrl->palette[j] =
                            (r << 16) | (g << 8) | (b);
                    }
                } else {
                    /* load the palette from the file */
                    color_start = get_be32(pb);
                    color_count = get_be16(pb);
                    color_end = get_be16(pb);
                    if ((color_start <= 255) &&
                        (color_end <= 255)) {
                        for (j = color_start; j <= color_end; j++) {
                            /* each R, G, or B component is 16 bits;
                             * only use the top 8 bits; skip alpha bytes
                             * up front */
                            get_byte(pb);
                            get_byte(pb);
                            r = get_byte(pb);
                            get_byte(pb);
                            g = get_byte(pb);
                            get_byte(pb);
                            b = get_byte(pb);
                            get_byte(pb);
                            st->codec->palctrl->palette[j] =
                                (r << 16) | (g << 8) | (b);
                        }
                    }
                }
                st->codec->palctrl->palette_changed = 1;
            }
        } else if(st->codec->codec_type==CODEC_TYPE_AUDIO) {
            int bits_per_sample, flags;
            uint16_t version = get_be16(pb);

            st->codec->codec_id = id;
            get_be16(pb); /* revision level */
            get_be32(pb); /* vendor */

            st->codec->channels = get_be16(pb);             /* channel count */
            dprintf(c->fc, "audio channels %d\n", st->codec->channels);
            st->codec->bits_per_coded_sample = get_be16(pb);      /* sample size */

            sc->audio_cid = get_be16(pb);
            get_be16(pb); /* packet size = 0 */

            /* only the upper 16 bits of the 32 bit field are kept */
            st->codec->sample_rate = ((get_be32(pb) >> 16));

            //Read QT version 1 fields. In version 0 these do not exist.
            dprintf(c->fc, "version =%d, isom =%d\n",version,c->isom);
            if(!c->isom) {
                if(version==1) {
                    sc->samples_per_frame = get_be32(pb);
                    get_be32(pb); /* bytes per packet */
                    sc->bytes_per_frame = get_be32(pb);
                    get_be32(pb); /* bytes per sample */
                } else if(version==2) {
                    get_be32(pb); /* sizeof struct only */
                    st->codec->sample_rate = av_int2dbl(get_be64(pb)); /* float 64 */
                    st->codec->channels = get_be32(pb);
                    get_be32(pb); /* always 0x7F000000 */
                    st->codec->bits_per_coded_sample = get_be32(pb); /* bits per channel if sound is uncompressed */
                    flags = get_be32(pb); /* lpcm format specific flag */
                    sc->bytes_per_frame = get_be32(pb); /* bytes per audio packet if constant */
                    sc->samples_per_frame = get_be32(pb); /* lpcm frames per audio packet if constant */
                    if (format == MKTAG('l','p','c','m'))
                        st->codec->codec_id = mov_get_lpcm_codec_id(st->codec->bits_per_coded_sample, flags);
                }
            }

            /* reconcile the codec id with the declared sample size and
             * fill in frame geometry for fixed-frame codecs */
            switch (st->codec->codec_id) {
            case CODEC_ID_PCM_S8:
            case CODEC_ID_PCM_U8:
                if (st->codec->bits_per_coded_sample == 16)
                    st->codec->codec_id = CODEC_ID_PCM_S16BE;
                break;
            case CODEC_ID_PCM_S16LE:
            case CODEC_ID_PCM_S16BE:
                if (st->codec->bits_per_coded_sample == 8)
                    st->codec->codec_id = CODEC_ID_PCM_S8;
                else if (st->codec->bits_per_coded_sample == 24)
                    st->codec->codec_id =
                        st->codec->codec_id == CODEC_ID_PCM_S16BE ?
                        CODEC_ID_PCM_S24BE : CODEC_ID_PCM_S24LE;
                break;
            /* set values for old format before stsd version 1 appeared */
            case CODEC_ID_MACE3:
                sc->samples_per_frame = 6;
                sc->bytes_per_frame = 2*st->codec->channels;
                break;
            case CODEC_ID_MACE6:
                sc->samples_per_frame = 6;
                sc->bytes_per_frame = 1*st->codec->channels;
                break;
            case CODEC_ID_ADPCM_IMA_QT:
                sc->samples_per_frame = 64;
                sc->bytes_per_frame = 34*st->codec->channels;
                break;
            case CODEC_ID_GSM:
                sc->samples_per_frame = 160;
                sc->bytes_per_frame = 33;
                break;
            default:
                break;
            }

            bits_per_sample = av_get_bits_per_sample(st->codec->codec_id);
            if (bits_per_sample) {
                st->codec->bits_per_coded_sample = bits_per_sample;
                sc->sample_size = (bits_per_sample >> 3) * st->codec->channels;
            }
        } else if(st->codec->codec_type==CODEC_TYPE_SUBTITLE){
            // ttxt stsd contains display flags, justification, background
            // color, fonts, and default styles, so fake an atom to read it
            MOVAtom fake_atom = { .size = size - (url_ftell(pb) - start_pos) };
            mov_read_glbl(c, pb, fake_atom);
            st->codec->codec_id= id;
            st->codec->width = sc->width;
            st->codec->height = sc->height;
        } else {
            /* other codec type, just skip (rtp, mp4s, tmcd ...) */
            url_fskip(pb, size - (url_ftell(pb) - start_pos));
        }
        /* this will read extra atoms at the end (wave, alac, damr, avcC, SMI ...) */
        a.size = size - (url_ftell(pb) - start_pos);
        if (a.size > 8) {
            if (mov_read_default(c, pb, a) < 0)
                return -1;
        } else if (a.size > 0)
            url_fskip(pb, a.size);
    }

    /* fall back to the track time scale when no sample rate was read */
    if(st->codec->codec_type==CODEC_TYPE_AUDIO && st->codec->sample_rate==0 && sc->time_scale>1)
        st->codec->sample_rate= sc->time_scale;

    /* special codec parameters handling */
    switch (st->codec->codec_id) {
#if CONFIG_DV_DEMUXER
    case CODEC_ID_DVAUDIO:
        c->dv_fctx = avformat_alloc_context();
        c->dv_demux = dv_init_demux(c->dv_fctx);
        if (!c->dv_demux) {
            av_log(c->fc, AV_LOG_ERROR, "dv demux context init error\n");
            return -1;
        }
        sc->dv_audio_container = 1;
        st->codec->codec_id = CODEC_ID_PCM_S16LE;
        break;
#endif
    /* no ifdef since parameters are always those */
    case CODEC_ID_QCELP:
        st->codec->frame_size= 160;
        st->codec->channels= 1; /* really needed */
        break;
    case CODEC_ID_AMR_NB:
    case CODEC_ID_AMR_WB:
        st->codec->frame_size= sc->samples_per_frame;
        st->codec->channels= 1; /* really needed */
        /* force sample rate for amr, stsd in 3gp does not store sample rate */
        if (st->codec->codec_id == CODEC_ID_AMR_NB)
            st->codec->sample_rate = 8000;
        else if (st->codec->codec_id == CODEC_ID_AMR_WB)
            st->codec->sample_rate = 16000;
        break;
    case CODEC_ID_MP2:
    case CODEC_ID_MP3:
        st->codec->codec_type = CODEC_TYPE_AUDIO; /* force type after stsd for m1a hdlr */
        st->need_parsing = AVSTREAM_PARSE_FULL;
        break;
    case CODEC_ID_GSM:
    case CODEC_ID_ADPCM_MS:
    case CODEC_ID_ADPCM_IMA_WAV:
        st->codec->block_align = sc->bytes_per_frame;
        break;
    case CODEC_ID_ALAC:
        /* frame size and channel count are taken from the extradata
         * when it has the expected 36 byte size */
        if (st->codec->extradata_size == 36) {
            st->codec->frame_size = AV_RB32(st->codec->extradata+12);
            st->codec->channels   = AV_RB8 (st->codec->extradata+21);
        }
        break;
    default:
        break;
    }

    return 0;
}

1072
/**
 * Parse the sample-to-chunk ('stsc') atom of the most recently created
 * stream into sc->stsc_data / sc->stsc_count.
 *
 * Each entry consists of three big endian 32 bit values stored as
 * first, count and id.
 *
 * @return 0 on success (including an empty table or no stream to attach
 *         to), -1 if the entry count would overflow the allocation size,
 *         AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_stsc(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries;

    /* without a stream, streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */

    entries = get_be32(pb);

    dprintf(c->fc, "track[%i].stsc.entries = %i\n", c->fc->nb_streams-1, entries);

    /* an empty table needs no storage; a zero sized allocation could
     * return NULL and be mistaken for an out of memory condition */
    if (!entries)
        return 0;
    if(entries >= UINT_MAX / sizeof(*sc->stsc_data))
        return -1;
    sc->stsc_data = av_malloc(entries * sizeof(*sc->stsc_data));
    if (!sc->stsc_data)
        return AVERROR(ENOMEM);
    sc->stsc_count = entries;

    for(i=0; i<entries; i++) {
        sc->stsc_data[i].first = get_be32(pb);
        sc->stsc_data[i].count = get_be32(pb);
        sc->stsc_data[i].id = get_be32(pb);
    }
    return 0;
}

1100
/**
 * Parse the sync sample ('stss') atom of the most recently created
 * stream into sc->keyframes / sc->keyframe_count.
 *
 * Each entry is one big endian 32 bit value.
 *
 * @return 0 on success (including an empty table or no stream to attach
 *         to), -1 if the entry count would overflow the allocation size,
 *         AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_stss(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries;

    /* without a stream, streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */

    entries = get_be32(pb);

    dprintf(c->fc, "keyframe_count = %d\n", entries);

    /* an empty table needs no storage; a zero sized allocation could
     * return NULL and be mistaken for an out of memory condition */
    if (!entries)
        return 0;
    if(entries >= UINT_MAX / sizeof(int))
        return -1;
    sc->keyframes = av_malloc(entries * sizeof(int));
    if (!sc->keyframes)
        return AVERROR(ENOMEM);
    sc->keyframe_count = entries;

    for(i=0; i<entries; i++) {
        sc->keyframes[i] = get_be32(pb);
        //dprintf(c->fc, "keyframes[]=%d\n", sc->keyframes[i]);
    }
    return 0;
}

1127
/**
 * Parse a sample size atom of the most recently created stream.
 *
 * For 'stsz' the atom carries a constant sample size followed by the
 * sample count, and entries are 32 bits wide. For any other atom type
 * routed here (presumably the compact 'stz2' form) the entry width is
 * read from the atom and must be 4, 8, 16 or 32 bits.
 * When the atom declares a non-zero constant sample size, only
 * sc->sample_count is set; otherwise the per-sample table is read into
 * sc->sample_sizes.
 *
 * @return 0 on success (including an empty table or no stream to attach
 *         to), -1 on an invalid field size, an oversized entry count or
 *         a short read, AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_stsz(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries, sample_size, field_size, num_bytes;
    GetBitContext gb;
    unsigned char* buf;
    int ret;

    /* without a stream, streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */

    if (atom.type == MKTAG('s','t','s','z')) {
        sample_size = get_be32(pb);
        if (!sc->sample_size) /* do not overwrite value computed in stsd */
            sc->sample_size = sample_size;
        field_size = 32;
    } else {
        sample_size = 0;
        get_be24(pb); /* reserved */
        field_size = get_byte(pb);
    }
    entries = get_be32(pb);

    dprintf(c->fc, "sample_size = %d sample_count = %d\n", sc->sample_size, entries);

    sc->sample_count = entries;
    if (sample_size)
        return 0;

    if (field_size != 4 && field_size != 8 && field_size != 16 && field_size != 32) {
        av_log(c->fc, AV_LOG_ERROR, "Invalid sample field size %d\n", field_size);
        return -1;
    }

    /* nothing to read; also avoids zero sized allocations */
    if (!entries)
        return 0;
    /* the second bound keeps entries*field_size+4 below from wrapping
     * around, which would yield a buffer smaller than the table */
    if(entries >= UINT_MAX / sizeof(int) ||
       entries >= (UINT_MAX - 4) / field_size)
        return -1;
    sc->sample_sizes = av_malloc(entries * sizeof(int));
    if (!sc->sample_sizes)
        return AVERROR(ENOMEM);

    /* size of the packed table in bytes, rounded up for 4 bit fields */
    num_bytes = (entries*field_size+4)>>3;

    buf = av_malloc(num_bytes);
    if (!buf) {
        av_freep(&sc->sample_sizes);
        return AVERROR(ENOMEM);
    }

    /* test the sign first: compared directly against the unsigned
     * num_bytes, a negative result would look like a huge byte count */
    ret = get_buffer(pb, buf, num_bytes);
    if (ret < 0 || (unsigned int)ret < num_bytes) {
        av_freep(&sc->sample_sizes);
        av_free(buf);
        return -1;
    }

    init_get_bits(&gb, buf, 8*num_bytes);

    for(i=0; i<entries; i++)
        sc->sample_sizes[i] = get_bits_long(&gb, field_size);

    av_free(buf);
    return 0;
}

1190
/**
 * Parse the time-to-sample ('stts') atom of the most recently created
 * stream into sc->stts_data / sc->stts_count.
 *
 * Each entry is a (sample count, sample duration) pair. While reading,
 * sc->time_rate is updated to the gcd of itself and every duration, and
 * the total sample count and total duration are accumulated into
 * st->nb_frames and (when non-zero) st->duration.
 *
 * @return 0 on success (including an empty table or no stream to attach
 *         to), -1 if the entry count would overflow the allocation size,
 *         AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_stts(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries;
    int64_t duration=0;
    int64_t total_sample_count=0;

    /* without a stream, streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */
    entries = get_be32(pb);

    dprintf(c->fc, "track[%i].stts.entries = %i\n", c->fc->nb_streams-1, entries);

    /* an empty table needs no storage; a zero sized allocation could
     * return NULL and be mistaken for an out of memory condition */
    if (!entries)
        return 0;
    if(entries >= UINT_MAX / sizeof(*sc->stts_data))
        return -1;
    sc->stts_data = av_malloc(entries * sizeof(*sc->stts_data));
    if (!sc->stts_data)
        return AVERROR(ENOMEM);
    sc->stts_count = entries;

    for(i=0; i<entries; i++) {
        int sample_duration;
        int sample_count;

        sample_count=get_be32(pb);
        sample_duration = get_be32(pb);
        sc->stts_data[i].count= sample_count;
        sc->stts_data[i].duration= sample_duration;

        sc->time_rate= av_gcd(sc->time_rate, sample_duration);

        dprintf(c->fc, "sample_count=%d, sample_duration=%d\n",sample_count,sample_duration);

        /* widen before multiplying so the product cannot overflow int */
        duration+=(int64_t)sample_duration*sample_count;
        total_sample_count+=sample_count;
    }

    st->nb_frames= total_sample_count;
    if(duration)
        st->duration= duration;
    return 0;
}

1234
/**
 * Parse the composition offset ('ctts') atom of the most recently
 * created stream into sc->ctts_data / sc->ctts_count.
 *
 * Each entry is a (count, duration) pair. A negative duration sets
 * sc->wrong_dts and marks the codec as having B-frames. sc->time_rate is
 * updated to the gcd of itself and the absolute value of every duration.
 *
 * @return 0 on success (including an empty table or no stream to attach
 *         to), -1 if the entry count would overflow the allocation size,
 *         AVERROR(ENOMEM) on allocation failure
 */
static int mov_read_ctts(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries;

    /* without a stream, streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */
    entries = get_be32(pb);

    dprintf(c->fc, "track[%i].ctts.entries = %i\n", c->fc->nb_streams-1, entries);

    /* an empty table needs no storage; a zero sized allocation could
     * return NULL and be mistaken for an out of memory condition */
    if (!entries)
        return 0;
    if(entries >= UINT_MAX / sizeof(*sc->ctts_data))
        return -1;
    sc->ctts_data = av_malloc(entries * sizeof(*sc->ctts_data));
    if (!sc->ctts_data)
        return AVERROR(ENOMEM);
    sc->ctts_count = entries;

    for(i=0; i<entries; i++) {
        int count    =get_be32(pb);
        int duration =get_be32(pb);

        if (duration < 0) {
            sc->wrong_dts = 1;
            st->codec->has_b_frames = 1;
        }
        sc->ctts_data[i].count   = count;
        sc->ctts_data[i].duration= duration;

        sc->time_rate= av_gcd(sc->time_rate, FFABS(duration));
    }
    return 0;
}

1269 1270 1271
/**
 * Build the index of a stream from its parsed sample tables.
 *
 * Two modes exist. The general mode walks every sample of every chunk
 * and adds one index entry per sample, with offsets derived from the
 * chunk offset and sample sizes, timestamps from the stts table and the
 * keyframe flag from the stss table. The second mode is used for audio
 * whose stts table is a single entry of duration 1; it adds entries per
 * chunk (or per fixed-size frame inside a chunk) instead.
 *
 * Timestamps are expressed in units of sc->time_rate, which must be
 * non-zero on entry.
 */
static void mov_build_index(MOVContext *mov, AVStream *st)
{
    MOVStreamContext *sc = st->priv_data;
    int64_t current_offset;
    int64_t current_dts = 0;
    unsigned int stts_index = 0;
    unsigned int stsc_index = 0;
    unsigned int stss_index = 0;
    unsigned int i, j;

    /* adjust first dts according to edit list */
    if (sc->time_offset) {
        int rescaled = sc->time_offset < 0 ? av_rescale(sc->time_offset, sc->time_scale, mov->time_scale) : sc->time_offset;
        assert(sc->time_offset % sc->time_rate == 0);
        current_dts = - (rescaled / sc->time_rate);
    }

    /* only use old uncompressed audio chunk demuxing when stts specifies it */
    if (!(st->codec->codec_type == CODEC_TYPE_AUDIO &&
          sc->stts_count == 1 && sc->stts_data[0].duration == 1)) {
        unsigned int current_sample = 0;
        unsigned int stts_sample = 0;
        unsigned int keyframe, sample_size;
        unsigned int distance = 0;
        /* keyframes[0] may only be read when the table has an entry;
         * key_off compensates for tables whose first entry is 1 */
        int key_off = sc->keyframes && sc->keyframe_count && sc->keyframes[0] == 1;

        st->nb_frames = sc->sample_count;
        for (i = 0; i < sc->chunk_count; i++) {
            current_offset = sc->chunk_offsets[i];
            /* stsc 'first' values are compared against i + 1 */
            if (stsc_index + 1 < sc->stsc_count &&
                i + 1 == sc->stsc_data[stsc_index + 1].first)
                stsc_index++;
            for (j = 0; j < sc->stsc_data[stsc_index].count; j++) {
                if (current_sample >= sc->sample_count) {
                    av_log(mov->fc, AV_LOG_ERROR, "wrong sample count\n");
                    return;
                }
                /* without an stss table every sample is a keyframe */
                keyframe = !sc->keyframe_count || current_sample+key_off == sc->keyframes[stss_index];
                if (keyframe) {
                    distance = 0;
                    if (stss_index + 1 < sc->keyframe_count)
                        stss_index++;
                }
                sample_size = sc->sample_size > 0 ? sc->sample_size : sc->sample_sizes[current_sample];
                /* only index samples of the selected sample description */
                if(sc->pseudo_stream_id == -1 ||
                   sc->stsc_data[stsc_index].id - 1 == sc->pseudo_stream_id) {
                    av_add_index_entry(st, current_offset, current_dts, sample_size, distance,
                                    keyframe ? AVINDEX_KEYFRAME : 0);
                    dprintf(mov->fc, "AVIndex stream %d, sample %d, offset %"PRIx64", dts %"PRId64", "
                            "size %d, distance %d, keyframe %d\n", st->index, current_sample,
                            current_offset, current_dts, sample_size, distance, keyframe);
                }

                current_offset += sample_size;
                assert(sc->stts_data[stts_index].duration % sc->time_rate == 0);
                current_dts += sc->stts_data[stts_index].duration / sc->time_rate;
                distance++;
                stts_sample++;
                current_sample++;
                if (stts_index + 1 < sc->stts_count && stts_sample == sc->stts_data[stts_index].count) {
                    stts_sample = 0;
                    stts_index++;
                }
            }
        }
    } else { /* read whole chunk */
        unsigned int chunk_samples, chunk_size, chunk_duration;
        unsigned int frames = 1;
        for (i = 0; i < sc->chunk_count; i++) {
            current_offset = sc->chunk_offsets[i];
            if (stsc_index + 1 < sc->stsc_count &&
                i + 1 == sc->stsc_data[stsc_index + 1].first)
                stsc_index++;
            chunk_samples = sc->stsc_data[stsc_index].count;
            /* get chunk size, beware of alaw/ulaw/mace */
            if (sc->samples_per_frame > 0 &&
                (chunk_samples * sc->bytes_per_frame % sc->samples_per_frame == 0)) {
                if (sc->samples_per_frame < 160)
                    chunk_size = chunk_samples * sc->bytes_per_frame / sc->samples_per_frame;
                else {
                    /* split the chunk into individual frames */
                    chunk_size = sc->bytes_per_frame;
                    frames = chunk_samples / sc->samples_per_frame;
                    chunk_samples = sc->samples_per_frame;
                }
            } else
                chunk_size = chunk_samples * sc->sample_size;
            for (j = 0; j < frames; j++) {
                av_add_index_entry(st, current_offset, current_dts, chunk_size, 0, AVINDEX_KEYFRAME);
                /* get chunk duration */
                chunk_duration = 0;
                while (chunk_samples > 0) {
                    if (chunk_samples < sc->stts_data[stts_index].count) {
                        chunk_duration += sc->stts_data[stts_index].duration * chunk_samples;
                        sc->stts_data[stts_index].count -= chunk_samples;
                        break;
                    } else {
                        chunk_duration += sc->stts_data[stts_index].duration * chunk_samples;
                        chunk_samples -= sc->stts_data[stts_index].count;
                        if (stts_index + 1 < sc->stts_count)
                            stts_index++;
                        else if (!sc->stts_data[stts_index].count)
                            /* a final run of zero samples can never
                             * consume the remainder; stop instead of
                             * looping forever */
                            break;
                    }
                }
                current_offset += sc->bytes_per_frame;
                dprintf(mov->fc, "AVIndex stream %d, chunk %d, offset %"PRIx64", dts %"PRId64", "
                        "size %d, duration %d\n", st->index, i, current_offset, current_dts,
                        chunk_size, chunk_duration);
                assert(chunk_duration % sc->time_rate == 0);
                current_dts += chunk_duration / sc->time_rate;
            }
        }
    }
}
1381

1382
/**
 * Parse a 'trak' atom: create a new stream with its private
 * MOVStreamContext, parse all child atoms, then finish the stream setup
 * (time base, audio frame size, duration, index, data reference) from
 * the tables the children filled in.
 *
 * The sample tables that are only needed to build the index are released
 * before returning, on every path taken after the children were parsed.
 *
 * @return 0 on success or when the track header is found to be broken,
 *         AVERROR(ENOMEM) on allocation failure, otherwise the negative
 *         value returned by mov_read_default()
 */
static int mov_read_trak(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    int ret;

    st = av_new_stream(c->fc, c->fc->nb_streams);
    if (!st) return AVERROR(ENOMEM);
    sc = av_mallocz(sizeof(MOVStreamContext));
    if (!sc) return AVERROR(ENOMEM);

    st->priv_data = sc;
    st->codec->codec_type = CODEC_TYPE_DATA;
    sc->ffindex = st->index;

    if ((ret = mov_read_default(c, pb, atom)) < 0)
        goto free_tables;
    ret = 0;

    /* sanity checks */
    if (sc->chunk_count && (!sc->stts_count || !sc->stsc_count ||
                            (!sc->sample_size && !sc->sample_count))) {
        av_log(c->fc, AV_LOG_ERROR, "stream %d, missing mandatory atoms, broken header\n",
               st->index);
        goto free_tables;
    }

    if (!sc->time_rate)
        sc->time_rate = 1;
    if (!sc->time_scale)
        sc->time_scale = c->time_scale;

    av_set_pts_info(st, 64, sc->time_rate, sc->time_scale);

    /* derive the audio frame size from a single-entry stts table */
    if (st->codec->codec_type == CODEC_TYPE_AUDIO &&
        !st->codec->frame_size && sc->stts_count == 1) {
        st->codec->frame_size = av_rescale(sc->stts_data[0].duration,
                                           st->codec->sample_rate, sc->time_scale);
        dprintf(c->fc, "frame size %d\n", st->codec->frame_size);
    }

    /* the duration is kept in units of time_rate, like the time base */
    if (st->duration != AV_NOPTS_VALUE) {
        assert(st->duration % sc->time_rate == 0);
        st->duration /= sc->time_rate;
    }

    mov_build_index(c, st);

    /* read from the referenced file when the data reference has a path,
     * otherwise from the main input */
    if (sc->dref_id-1 < sc->drefs_count && sc->drefs[sc->dref_id-1].path) {
        if (url_fopen(&sc->pb, sc->drefs[sc->dref_id-1].path, URL_RDONLY) < 0)
            av_log(c->fc, AV_LOG_ERROR, "stream %d, error opening file %s: %s\n",
                   st->index, sc->drefs[sc->dref_id-1].path, strerror(errno));
    } else
        sc->pb = c->fc->pb;

    switch (st->codec->codec_id) {
#if CONFIG_H261_DECODER
    case CODEC_ID_H261:
#endif
#if CONFIG_H263_DECODER
    case CODEC_ID_H263:
#endif
#if CONFIG_MPEG4_DECODER
    case CODEC_ID_MPEG4:
#endif
        st->codec->width = 0; /* let decoder init width/height */
        st->codec->height= 0;
        break;
    }

free_tables:
    /* Do not need those anymore. Also reached on the error and broken
     * header paths so the tables are not left allocated there. */
    av_freep(&sc->chunk_offsets);
    av_freep(&sc->stsc_data);
    av_freep(&sc->sample_sizes);
    av_freep(&sc->keyframes);
    av_freep(&sc->stts_data);

    return ret;
}

1461
/**
 * Parse an 'ilst' atom.
 * The children are read through mov_read_default() with
 * c->itunes_metadata set to 1; the flag is cleared again afterwards,
 * whatever the outcome.
 *
 * @return the value returned by mov_read_default()
 */
static int mov_read_ilst(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    int status;

    c->itunes_metadata = 1;
    status = mov_read_default(c, pb, atom);
    c->itunes_metadata = 0;

    return status;
}

1470
/*
 * Handler for the 'meta' atom.
 *
 * Scans the payload 32 bits at a time looking for the 'hdlr' tag. When it is
 * found, the stream is rewound by 8 bytes (the tag plus the 4 bytes in front
 * of it) and the rest of the atom is handed to mov_read_default().
 *
 * Returns the result of mov_read_default() when 'hdlr' was found, 0 otherwise.
 */
static int mov_read_meta(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    while (atom.size > 8) {
        uint32_t tag;

        /* atom.size comes from the file; on a truncated file keep from
           spinning over the whole declared size once the data has run out */
        if (url_feof(pb))
            break;

        tag = get_le32(pb);
        atom.size -= 4;
        if (tag == MKTAG('h','d','l','r')) {
            /* step back over the tag and the 4 bytes preceding it */
            url_fseek(pb, -8, SEEK_CUR);
            atom.size += 8;
            return mov_read_default(c, pb, atom);
        }
    }
    return 0;
}

1484
/*
 * Handler for the 'tkhd' (track header) atom.
 *
 * Stores the track id in st->id and the integer part of the track
 * width/height in the stream context of the most recently added stream.
 * When the display matrix is not the identity, the sample aspect ratio of the
 * stream is derived from the transformed width/height.
 *
 * Returns 0; a 'tkhd' encountered before any stream exists is ignored.
 */
static int mov_read_tkhd(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    int i;
    int width;
    int height;
    int64_t disp_transform[2];
    int display_matrix[3][2];
    AVStream *st;
    MOVStreamContext *sc;
    int version;

    /* a track header outside of any track has no stream to describe;
       indexing streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    version = get_byte(pb);
    get_be24(pb); /* flags */
    /*
    MOV_TRACK_ENABLED 0x0001
    MOV_TRACK_IN_MOVIE 0x0002
    MOV_TRACK_IN_PREVIEW 0x0004
    MOV_TRACK_IN_POSTER 0x0008
    */

    if (version == 1) {
        get_be64(pb); /* creation time */
        get_be64(pb); /* modification time */
    } else {
        get_be32(pb); /* creation time */
        get_be32(pb); /* modification time */
    }
    st->id = (int)get_be32(pb); /* track id (NOT 0 !)*/
    get_be32(pb); /* reserved */

    /* highlevel (considering edits) duration in movie timebase */
    if (version == 1)
        get_be64(pb);
    else
        get_be32(pb);
    get_be32(pb); /* reserved */
    get_be32(pb); /* reserved */

    get_be16(pb); /* layer */
    get_be16(pb); /* alternate group */
    get_be16(pb); /* volume */
    get_be16(pb); /* reserved */

    //read in the display matrix (outlined in ISO 14496-12, Section 6.2.2)
    // they're kept in fixed point format through all calculations
    // ignore u,v,z b/c we don't need the scale factor to calc aspect ratio
    for (i = 0; i < 3; i++) {
        display_matrix[i][0] = get_be32(pb);   // 16.16 fixed point
        display_matrix[i][1] = get_be32(pb);   // 16.16 fixed point
        get_be32(pb);           // 2.30 fixed point (not used)
    }

    width = get_be32(pb);       // 16.16 fixed point track width
    height = get_be32(pb);      // 16.16 fixed point track height
    sc->width = width >> 16;
    sc->height = height >> 16;

    //transform the display width/height according to the matrix
    // skip this if the display matrix is the default identity matrix
    // to keep the same scale, use [width height 1<<16]
    if (width && height &&
        (display_matrix[0][0] != 65536 || display_matrix[0][1]           ||
        display_matrix[1][0]           || display_matrix[1][1] != 65536  ||
        display_matrix[2][0]           || display_matrix[2][1])) {
        for (i = 0; i < 2; i++)
            disp_transform[i] =
                (int64_t)  width  * display_matrix[0][i] +
                (int64_t)  height * display_matrix[1][i] +
                ((int64_t) display_matrix[2][i] << 16);

        //sample aspect ratio is new width/height divided by old width/height
        // a degenerate matrix can make the transformed height zero; leave the
        // aspect ratio untouched rather than dividing by zero
        if (disp_transform[1])
            st->sample_aspect_ratio = av_d2q(
                ((double) disp_transform[0] * height) /
                ((double) disp_transform[1] * width), INT_MAX);
    }
    return 0;
}

1558
/*
 * Handler for the 'tfhd' (track fragment header) atom.
 *
 * Records the fragment's track id in c->fragment and fills the fragment's
 * base data offset, stsd id, duration, size and flags. Each value is read
 * from the atom when its bit is set in the header flags, otherwise it is
 * taken from the fragment's moof offset (base data offset) or from the
 * matching 'trex' entry (everything else).
 *
 * Returns 0 on success, -1 if the track id is 0 or no 'trex' entry matches.
 */
static int mov_read_tfhd(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    MOVFragment *frag = &c->fragment;
    MOVTrackExt *defaults = NULL;
    int tf_flags, id, n;

    get_byte(pb); /* version */
    tf_flags = get_be24(pb);

    id = get_be32(pb);
    if (!id)
        return -1;
    frag->track_id = id;

    /* locate the defaults declared for this track */
    for (n = 0; n < c->trex_count && !defaults; n++)
        if (c->trex_data[n].track_id == frag->track_id)
            defaults = &c->trex_data[n];

    if (!defaults) {
        av_log(c->fc, AV_LOG_ERROR, "could not find corresponding trex\n");
        return -1;
    }

    /* optional fields appear in the atom in exactly this order */
    if (tf_flags & 0x01)
        frag->base_data_offset = get_be64(pb);
    else
        frag->base_data_offset = frag->moof_offset;

    if (tf_flags & 0x02)
        frag->stsd_id = get_be32(pb);
    else
        frag->stsd_id = defaults->stsd_id;

    if (tf_flags & 0x08)
        frag->duration = get_be32(pb);
    else
        frag->duration = defaults->duration;

    if (tf_flags & 0x10)
        frag->size = get_be32(pb);
    else
        frag->size = defaults->size;

    if (tf_flags & 0x20)
        frag->flags = get_be32(pb);
    else
        frag->flags = defaults->flags;

    dprintf(c->fc, "frag flags 0x%x\n", frag->flags);
    return 0;
}

1593
/*
 * Handler for the 'trex' (track extends) atom.
 *
 * Grows c->trex_data by one element and fills it with the track id, stsd id,
 * duration, size and flags read from the atom.
 *
 * Returns 0 on success, -1 if the grown array size would be too large,
 * AVERROR(ENOMEM) if the reallocation fails (the old array stays valid).
 */
static int mov_read_trex(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    MOVTrackExt *grown;
    MOVTrackExt *entry;

    if ((uint64_t)c->trex_count+1 >= UINT_MAX / sizeof(*c->trex_data))
        return -1;

    grown = av_realloc(c->trex_data, (c->trex_count+1)*sizeof(*c->trex_data));
    if (!grown)
        return AVERROR(ENOMEM);
    c->trex_data = grown;

    entry = &c->trex_data[c->trex_count++];

    get_byte(pb); /* version */
    get_be24(pb); /* flags */
    entry->track_id = get_be32(pb);
    entry->stsd_id  = get_be32(pb);
    entry->duration = get_be32(pb);
    entry->size     = get_be32(pb);
    entry->flags    = get_be32(pb);

    return 0;
}

1614
/*
 * Handler for the 'trun' (track fragment run) atom.
 *
 * Finds the stream whose id equals the current fragment's track id and adds
 * one index entry per sample of the run. Sample duration, size and flags
 * default to the values stored in c->fragment and are overridden per sample
 * when the corresponding bit (0x100, 0x200, 0x400) is set in the atom flags;
 * bit 0x800 adds one ctts entry per sample.
 * On exit frag->moof_offset holds the offset just past the last sample and
 * st->duration holds the dts following the last sample.
 *
 * Returns 0 on success (also when the run belongs to another sample
 * description and is ignored), -1 if no stream matches or the ctts array
 * would get too large, AVERROR(ENOMEM) on allocation failure.
 */
static int mov_read_trun(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    MOVFragment *frag = &c->fragment;
    AVStream *st = NULL;
    MOVStreamContext *sc;
    uint64_t offset;
    int64_t dts;
    int data_offset = 0;
    unsigned entries, first_sample_flags = frag->flags;
    int flags, distance, i;

    for (i = 0; i < c->fc->nb_streams; i++) {
        if (c->fc->streams[i]->id == frag->track_id) {
            st = c->fc->streams[i];
            break;
        }
    }
    if (!st) {
        av_log(c->fc, AV_LOG_ERROR, "could not find corresponding track id %d\n", frag->track_id);
        return -1;
    }
    sc = st->priv_data;
    /* runs that refer to a different sample description are skipped */
    if (sc->pseudo_stream_id+1 != frag->stsd_id)
        return 0;
    get_byte(pb); /* version */
    flags = get_be24(pb);
    entries = get_be32(pb);
    dprintf(c->fc, "flags 0x%x entries %d\n", flags, entries);
    if (flags & 0x001) data_offset        = get_be32(pb);
    if (flags & 0x004) first_sample_flags = get_be32(pb);
    if (flags & 0x800) {
        /* make room for one ctts entry per sample of this run */
        MOVStts *ctts_data;
        if ((uint64_t)entries+sc->ctts_count >= UINT_MAX/sizeof(*sc->ctts_data))
            return -1;
        ctts_data = av_realloc(sc->ctts_data,
                               (entries+sc->ctts_count)*sizeof(*sc->ctts_data));
        if (!ctts_data)
            return AVERROR(ENOMEM);
        sc->ctts_data = ctts_data;
    }
    dts = st->duration;
    offset = frag->base_data_offset + data_offset;
    distance = 0;
    dprintf(c->fc, "first sample flags 0x%x\n", first_sample_flags);
    /* the entry count comes straight from the file: stop as soon as the input
       is exhausted instead of indexing samples made of zero bytes */
    for (i = 0; i < entries && !url_feof(pb); i++) {
        unsigned sample_size = frag->size;
        int sample_flags = i ? frag->flags : first_sample_flags;
        unsigned sample_duration = frag->duration;
        int keyframe;

        if (flags & 0x100) sample_duration = get_be32(pb);
        if (flags & 0x200) sample_size     = get_be32(pb);
        if (flags & 0x400) sample_flags    = get_be32(pb);
        if (flags & 0x800) {
            sc->ctts_data[sc->ctts_count].count = 1;
            sc->ctts_data[sc->ctts_count].duration = get_be32(pb);
            sc->ctts_count++;
        }
        /* distance counts samples since the last keyframe */
        if ((keyframe = st->codec->codec_type == CODEC_TYPE_AUDIO ||
             (flags & 0x004 && !i && !sample_flags) || sample_flags & 0x2000000))
            distance = 0;
        av_add_index_entry(st, offset, dts, sample_size, distance,
                           keyframe ? AVINDEX_KEYFRAME : 0);
        dprintf(c->fc, "AVIndex stream %d, sample %d, offset %"PRIx64", dts %"PRId64", "
                "size %d, distance %d, keyframe %d\n", st->index, sc->sample_count+i,
                offset, dts, sample_size, distance, keyframe);
        distance++;
        assert(sample_duration % sc->time_rate == 0);
        dts += sample_duration / sc->time_rate;
        offset += sample_size;
    }
    frag->moof_offset = offset;
    st->duration = dts;
    return 0;
}

1690 1691 1692
/* this atom should be null (from specs), but some buggy files put the 'moov' atom inside it... */
/* like the files created with Adobe Premiere 5.0, for samples see */
/* http://graphics.tudelft.nl/~wouter/publications/soundtests/ */
1693
/*
 * Handler for the 'wide' atom.
 *
 * If the atom is at least 8 bytes and starts with a 32-bit zero, the next
 * 32 bits are taken as the type of an embedded atom. An embedded 'mdat' is
 * passed to mov_read_mdat() with the remaining size; anything else is skipped.
 *
 * Returns 0, or the result of mov_read_mdat() for an embedded 'mdat'.
 */
static int mov_read_wide(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    if (atom.size < 8)
        return 0; /* continue */

    if (get_be32(pb) != 0) { /* 0 sized mdat atom... use the 'wide' atom size */
        url_fskip(pb, atom.size - 4);
        return 0;
    }

    /* account for the 8 header bytes consumed so far */
    atom.type    = get_le32(pb);
    atom.offset += 8;
    atom.size   -= 8;

    if (atom.type == MKTAG('m','d','a','t'))
        return mov_read_mdat(c, pb, atom);

    url_fskip(pb, atom.size);
    return 0;
}

1714
/*
 * Handler for the 'cmov' (compressed movie header) atom.
 *
 * Expects a 'dcom' atom announcing 'zlib' compression followed by a 'cmvd'
 * atom that carries the uncompressed size and the compressed data. The data
 * is inflated into a temporary buffer which is then parsed as a 'moov' atom
 * through mov_read_default().
 *
 * Returns the result of mov_read_default() on success, AVERROR(ENOMEM) on
 * allocation failure and -1 on malformed input, decompression failure or when
 * zlib support is not compiled in.
 */
static int mov_read_cmov(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
#if CONFIG_ZLIB
    ByteIOContext ctx;
    uint8_t *cmov_data;
    uint8_t *moov_data; /* uncompressed data */
    int64_t cmov_len;
    uLongf moov_len;
    int bytes_read;
    int ret = -1;

    get_be32(pb); /* dcom atom */
    if (get_le32(pb) != MKTAG('d','c','o','m'))
        return -1;
    if (get_le32(pb) != MKTAG('z','l','i','b')) {
        av_log(c->fc, AV_LOG_ERROR, "unknown compression for cmov atom !\n");
        return -1;
    }
    get_be32(pb); /* cmvd atom */
    if (get_le32(pb) != MKTAG('c','m','v','d'))
        return -1;
    moov_len = get_be32(pb); /* uncompressed size */
    cmov_len = atom.size - 6 * 4;

    /* both lengths are later narrowed to int-sized arguments; reject values
       that would be truncated so that the allocation, the read and the
       decompressor all agree on the buffer sizes */
    if (cmov_len <= 0 || cmov_len > INT_MAX || moov_len > INT_MAX)
        return -1;

    cmov_data = av_malloc(cmov_len);
    if (!cmov_data)
        return AVERROR(ENOMEM);
    moov_data = av_malloc(moov_len);
    if (!moov_data) {
        av_free(cmov_data);
        return AVERROR(ENOMEM);
    }
    /* hand zlib only the bytes that were really read, never the
       uninitialized remainder of the buffer after a short read */
    bytes_read = get_buffer(pb, cmov_data, cmov_len);
    if (bytes_read <= 0)
        goto free_and_return;
    if(uncompress (moov_data, &moov_len, (const Bytef *)cmov_data, bytes_read) != Z_OK)
        goto free_and_return;
    if(init_put_byte(&ctx, moov_data, moov_len, 0, NULL, NULL, NULL, NULL) != 0)
        goto free_and_return;
    /* parse the inflated buffer as if it were a regular 'moov' atom */
    atom.type = MKTAG('m','o','o','v');
    atom.offset = 0;
    atom.size = moov_len;
    ret = mov_read_default(c, &ctx, atom);
free_and_return:
    av_free(moov_data);
    av_free(cmov_data);
    return ret;
#else
    av_log(c->fc, AV_LOG_ERROR, "this file requires zlib support compiled in\n");
    return -1;
#endif
}
1765

G
Gael Chardon 已提交
1766
/* edit list atom */
1767
/*
 * Handler for the 'elst' (edit list) atom.
 *
 * Only the first entry is used: when its media time is >= -1 the stream's
 * time_offset is set to the media time, or to the negated track duration when
 * the media time is -1, and time_rate is reduced to the gcd of its previous
 * value and |time_offset|. More than one entry triggers a warning.
 *
 * Returns 0; an 'elst' encountered before any stream exists is ignored.
 */
static int mov_read_elst(MOVContext *c, ByteIOContext *pb, MOVAtom atom)
{
    MOVStreamContext *sc;
    int i, edit_count;

    /* an edit list outside of any track has no stream to apply to;
       indexing streams[nb_streams-1] would be out of bounds */
    if (c->fc->nb_streams < 1)
        return 0;
    sc = c->fc->streams[c->fc->nb_streams-1]->priv_data;

    get_byte(pb); /* version */
    get_be24(pb); /* flags */
    edit_count = get_be32(pb); /* entries */

    /* the entry count comes from the file: stop once the input is exhausted */
    for(i=0; i<edit_count && !url_feof(pb); i++){
        int time;
        int duration = get_be32(pb); /* Track duration */
        time = get_be32(pb); /* Media time */
        get_be32(pb); /* Media rate */
        if (i == 0 && time >= -1) {
            sc->time_offset = time != -1 ? time : -duration;
            sc->time_rate = av_gcd(sc->time_rate, FFABS(sc->time_offset));
        }
    }

    if(edit_count > 1)
        av_log(c->fc, AV_LOG_WARNING, "multiple edit list entries, "
               "a/v desync might occur, patch welcome\n");

    dprintf(c->fc, "track[%i].edit_count = %i\n", c->fc->nb_streams-1, edit_count);
    return 0;
}

1795
static const MOVParseTableEntry mov_default_parse_table[] = {
1796
{ MKTAG('a','v','s','s'), mov_read_extradata },
1797 1798 1799 1800 1801 1802 1803 1804 1805 1806 1807
{ MKTAG('c','o','6','4'), mov_read_stco },
{ MKTAG('c','t','t','s'), mov_read_ctts }, /* composition time to sample */
{ MKTAG('d','i','n','f'), mov_read_default },
{ MKTAG('d','r','e','f'), mov_read_dref },
{ MKTAG('e','d','t','s'), mov_read_default },
{ MKTAG('e','l','s','t'), mov_read_elst },
{ MKTAG('e','n','d','a'), mov_read_enda },
{ MKTAG('f','i','e','l'), mov_read_extradata },
{ MKTAG('f','t','y','p'), mov_read_ftyp },
{ MKTAG('g','l','b','l'), mov_read_glbl },
{ MKTAG('h','d','l','r'), mov_read_hdlr },
1808
{ MKTAG('i','l','s','t'), mov_read_ilst },
1809 1810 1811 1812
{ MKTAG('j','p','2','h'), mov_read_extradata },
{ MKTAG('m','d','a','t'), mov_read_mdat },
{ MKTAG('m','d','h','d'), mov_read_mdhd },
{ MKTAG('m','d','i','a'), mov_read_default },
1813
{ MKTAG('m','e','t','a'), mov_read_meta },
1814 1815 1816 1817 1818 1819 1820 1821
{ MKTAG('m','i','n','f'), mov_read_default },
{ MKTAG('m','o','o','f'), mov_read_moof },
{ MKTAG('m','o','o','v'), mov_read_moov },
{ MKTAG('m','v','e','x'), mov_read_default },
{ MKTAG('m','v','h','d'), mov_read_mvhd },
{ MKTAG('S','M','I',' '), mov_read_smi }, /* Sorenson extension ??? */
{ MKTAG('a','l','a','c'), mov_read_extradata }, /* alac specific atom */
{ MKTAG('a','v','c','C'), mov_read_glbl },
1822
{ MKTAG('p','a','s','p'), mov_read_pasp },
1823 1824 1825 1826 1827 1828 1829
{ MKTAG('s','t','b','l'), mov_read_default },
{ MKTAG('s','t','c','o'), mov_read_stco },
{ MKTAG('s','t','s','c'), mov_read_stsc },
{ MKTAG('s','t','s','d'), mov_read_stsd }, /* sample description */
{ MKTAG('s','t','s','s'), mov_read_stss }, /* sync sample */
{ MKTAG('s','t','s','z'), mov_read_stsz }, /* sample size */
{ MKTAG('s','t','t','s'), mov_read_stts },
1830
{ MKTAG('s','t','z','2'), mov_read_stsz }, /* compact sample size */
1831 1832 1833 1834 1835 1836
{ MKTAG('t','k','h','d'), mov_read_tkhd }, /* track header */
{ MKTAG('t','f','h','d'), mov_read_tfhd }, /* track fragment header */
{ MKTAG('t','r','a','k'), mov_read_trak },
{ MKTAG('t','r','a','f'), mov_read_default },
{ MKTAG('t','r','e','x'), mov_read_trex },
{ MKTAG('t','r','u','n'), mov_read_trun },
B
Baptiste Coudurier 已提交
1837
{ MKTAG('u','d','t','a'), mov_read_default },
1838 1839 1840 1841
{ MKTAG('w','a','v','e'), mov_read_wave },
{ MKTAG('e','s','d','s'), mov_read_esds },
{ MKTAG('w','i','d','e'), mov_read_wide }, /* place holder */
{ MKTAG('c','m','o','v'), mov_read_cmov },
B
Baptiste Coudurier 已提交
1842
{ 0, NULL }
1843 1844
};

F
Fabrice Bellard 已提交
1845 1846
/*
 * Probe callback: rate how likely the buffer is the start of a MOV/MP4 file.
 *
 * Walks the atoms at the start of the probe buffer. Well-known tags return a
 * score immediately; a few skippable atoms are stepped over using their
 * 32-bit size and only yield a reduced score if nothing better follows.
 *
 * Returns AVPROBE_SCORE_MAX, AVPROBE_SCORE_MAX - 5, AVPROBE_SCORE_MAX - 50
 * or 0.
 */
static int mov_probe(AVProbeData *p)
{
    const unsigned int buf_size = p->buf_size;
    unsigned int offset = 0;
    int score = 0;

    /* check file header */
    /* an atom header is 8 bytes (size + tag); offset never exceeds buf_size,
       so the subtraction below cannot wrap */
    while (buf_size - offset >= 8) {
        unsigned int size = AV_RB32(p->buf + offset);
        uint32_t tag      = AV_RL32(p->buf + offset + 4);

        switch(tag) {
        /* check for obvious tags */
        case MKTAG('j','P',' ',' '): /* jpeg 2000 signature */
        case MKTAG('m','o','o','v'):
        case MKTAG('m','d','a','t'):
        case MKTAG('p','n','o','t'): /* detect movs with preview pics like ew.mov and april.mov */
        case MKTAG('u','d','t','a'): /* Packet Video PVAuthor adds this and a lot of more junk */
        case MKTAG('f','t','y','p'):
            return AVPROBE_SCORE_MAX;
        /* those are more common words, so rate them a bit less */
        case MKTAG('e','d','i','w'): /* xdcam files have reverted first tags */
        case MKTAG('w','i','d','e'):
        case MKTAG('f','r','e','e'):
        case MKTAG('j','u','n','k'):
        case MKTAG('p','i','c','t'):
            return AVPROBE_SCORE_MAX - 5;
        case MKTAG(0x82,0x82,0x7f,0x7d):
        case MKTAG('s','k','i','p'):
        case MKTAG('u','u','i','d'):
        case MKTAG('p','r','f','l'):
            /* if we only find those cause probedata is too small at least rate them */
            score = AVPROBE_SCORE_MAX - 50;
            /* a size smaller than the header would stall (0) or misalign the
               walk, and one reaching past the buffer leaves nothing more to
               inspect; checking against the remaining bytes also keeps
               offset from wrapping around */
            if (size < 8 || size > buf_size - offset)
                return score;
            offset += size;
            break;
        default:
            /* unrecognized tag */
            return score;
        }
    }
    return score;
}

Z
Zdenek Kabelac 已提交
1890
/*
 * Read-header callback: parse the atoms of the file through
 * mov_read_default(), starting with a root atom that spans the whole file
 * (or INT64_MAX when the input is streamed).
 *
 * Returns 0 on success, the error from mov_read_default() if parsing fails,
 * or -1 if no 'moov' atom was found.
 */
static int mov_read_header(AVFormatContext *s, AVFormatParameters *ap)
{
    MOVContext *mov = s->priv_data;
    ByteIOContext *pb = s->pb;
    int err;
    MOVAtom atom = { 0, 0, 0 };

    mov->fc = s;
    /* .mov and .mp4 aren't streamable anyway (only progressive download if moov is before mdat) */
    if(!url_is_streamed(pb))
        atom.size = url_fsize(pb);
    else
        atom.size = INT64_MAX;

    /* check MOV header */
    if ((err = mov_read_default(mov, pb, atom)) < 0) {
        av_log(s, AV_LOG_ERROR, "error reading header: %d\n", err);
        return err;
    }
    if (!mov->found_moov) {
        av_log(s, AV_LOG_ERROR, "moov atom not found\n");
        return -1;
    }
    /* the file offset is 64 bits wide: print it with the matching macro */
    dprintf(mov->fc, "on_parse_exit_offset=%"PRId64"\n", url_ftell(pb));

    return 0;
}

Z
Zdenek Kabelac 已提交
1918
/*
 * Read-packet callback.
 *
 * Picks the next sample among all non-discarded streams that still have index
 * entries, reads it from that stream's I/O context and fills pkt with the
 * data, stream index, timestamps, key flag and file position. When no sample
 * is left and the input is streamed, further atoms are parsed through
 * mov_read_default() and the selection is retried.
 *
 * Returns 0 on success, -1 at end of data or on a seek/DV failure, or the
 * negative result of av_get_packet().
 */
static int mov_read_packet(AVFormatContext *s, AVPacket *pkt)
{
    MOVContext *mov = s->priv_data;
    MOVStreamContext *sc = NULL;
    AVIndexEntry *sample = NULL;
    int64_t best_dts = INT64_MAX;
    int i, ret;
 retry:
    for (i = 0; i < s->nb_streams; i++) {
        AVStream *st = s->streams[i];
        MOVStreamContext *msc = st->priv_data;
        if (st->discard != AVDISCARD_ALL && msc->pb && msc->current_sample < st->nb_index_entries) {
            AVIndexEntry *current_sample = &st->index_entries[msc->current_sample];
            /* candidate dts converted to AV_TIME_BASE units for comparison */
            int64_t dts = av_rescale(current_sample->timestamp * (int64_t)msc->time_rate,
                                     AV_TIME_BASE, msc->time_scale);
            dprintf(s, "stream %d, sample %d, dts %"PRId64"\n", i, msc->current_sample, dts);
            /* streamed input: lowest file position wins.
               seekable input: streams read from another file are ordered by
               dts; streams in the main file are ordered by file position when
               within one second of the current best, by dts otherwise */
            if (!sample || (url_is_streamed(s->pb) && current_sample->pos < sample->pos) ||
                (!url_is_streamed(s->pb) &&
                 ((msc->pb != s->pb && dts < best_dts) || (msc->pb == s->pb &&
                 ((FFABS(best_dts - dts) <= AV_TIME_BASE && current_sample->pos < sample->pos) ||
                  (FFABS(best_dts - dts) > AV_TIME_BASE && dts < best_dts)))))) {
                sample = current_sample;
                best_dts = dts;
                sc = msc;
            }
        }
    }
    if (!sample) {
        mov->found_mdat = 0;
        if (!url_is_streamed(s->pb) ||
            mov_read_default(mov, s->pb, (MOVAtom){ 0, 0, INT64_MAX }) < 0 ||
            url_feof(s->pb))
            return -1;
        dprintf(s, "read fragments, offset 0x%"PRIx64"\n", url_ftell(s->pb));
        goto retry;
    }
    /* must be done just before reading, to avoid infinite loop on sample */
    sc->current_sample++;
    if (url_fseek(sc->pb, sample->pos, SEEK_SET) != sample->pos) {
        av_log(mov->fc, AV_LOG_ERROR, "stream %d, offset 0x%"PRIx64": partial file\n",
               sc->ffindex, sample->pos);
        return -1;
    }
    ret = av_get_packet(sc->pb, pkt, sample->size);
    if (ret < 0)
        return ret;
#if CONFIG_DV_DEMUXER
    if (mov->dv_demux && sc->dv_audio_container) {
        /* feed the raw data to the DV demuxer and return what it produces */
        dv_produce_packet(mov->dv_demux, pkt, pkt->data, pkt->size);
        av_free(pkt->data);
        pkt->size = 0;
        if (dv_get_packet(mov->dv_demux, pkt) < 0)
            return -1;
    }
#endif
    pkt->stream_index = sc->ffindex;
    pkt->dts = sample->timestamp;
    /* the ctts table may describe fewer samples than the index holds; once it
       is exhausted fall back to pts == dts instead of reading past its end */
    if (sc->ctts_data && sc->ctts_index < sc->ctts_count) {
        assert(sc->ctts_data[sc->ctts_index].duration % sc->time_rate == 0);
        pkt->pts = pkt->dts + sc->ctts_data[sc->ctts_index].duration / sc->time_rate;
        /* update ctts context */
        sc->ctts_sample++;
        if (sc->ctts_data[sc->ctts_index].count == sc->ctts_sample) {
            sc->ctts_index++;
            sc->ctts_sample = 0;
        }
        if (sc->wrong_dts)
            pkt->dts = AV_NOPTS_VALUE;
    } else {
        AVStream *st = s->streams[sc->ffindex];
        /* duration runs up to the next sample, or to the stream end */
        int64_t next_dts = (sc->current_sample < st->nb_index_entries) ?
            st->index_entries[sc->current_sample].timestamp : st->duration;
        pkt->duration = next_dts - pkt->dts;
        pkt->pts = pkt->dts;
    }
    pkt->flags |= sample->flags & AVINDEX_KEYFRAME ? PKT_FLAG_KEY : 0;
    pkt->pos = sample->pos;
    dprintf(s, "stream %d, pts %"PRId64", dts %"PRId64", pos 0x%"PRIx64", duration %d\n",
            pkt->stream_index, pkt->pts, pkt->dts, pkt->pos, pkt->duration);
    return 0;
}
2000

2001 2002 2003 2004 2005
/*
 * Position one stream on the index entry found by
 * av_index_search_timestamp() for the given timestamp and flags, and bring
 * the ctts cursor (ctts_index / ctts_sample) in line with that sample.
 *
 * Returns the index of the sample, or -1 if the search found none.
 */
static int mov_seek_stream(AVStream *st, int64_t timestamp, int flags)
{
    MOVStreamContext *sc = st->priv_data;
    int sample;
    int run_start = 0;
    int k;

    sample = av_index_search_timestamp(st, timestamp, flags);
    dprintf(st->codec, "stream %d, timestamp %"PRId64", sample %d\n", st->index, timestamp, sample);
    if (sample < 0) /* not sure what to do */
        return -1;

    sc->current_sample = sample;
    dprintf(st->codec, "stream %d, found sample %d\n", st->index, sc->current_sample);

    if (!sc->ctts_data)
        return sample;

    /* adjust ctts index: find the run that contains the current sample */
    for (k = 0; k < sc->ctts_count; k++) {
        int run_end = run_start + sc->ctts_data[k].count;

        if (run_end > sc->current_sample) {
            sc->ctts_index  = k;
            sc->ctts_sample = sc->current_sample - run_start;
            break;
        }
        run_start = run_end;
    }
    return sample;
}

2029
/*
 * Read-seek callback.
 *
 * Seeks the requested stream first (negative timestamps are clamped to 0),
 * then seeks every other non-discarded stream to the timestamp of the sample
 * that was found, rescaled to that stream's time base.
 *
 * Returns 0 on success, -1 if the stream index is out of range or no sample
 * was found in the requested stream.
 */
static int mov_read_seek(AVFormatContext *s, int stream_index, int64_t sample_time, int flags)
{
    AVStream *ref;
    int64_t found_ts;
    int hit;
    int n;

    if (stream_index >= s->nb_streams)
        return -1;
    if (sample_time < 0)
        sample_time = 0;

    ref = s->streams[stream_index];
    hit = mov_seek_stream(ref, sample_time, flags);
    if (hit < 0)
        return -1;

    /* adjust seek timestamp to found sample timestamp */
    found_ts = ref->index_entries[hit].timestamp;

    for (n = 0; n < s->nb_streams; n++) {
        AVStream *other = s->streams[n];
        int64_t other_ts;

        if (stream_index == n || other->discard == AVDISCARD_ALL)
            continue;

        other_ts = av_rescale_q(found_ts, s->streams[stream_index]->time_base, other->time_base);
        mov_seek_stream(other, other_ts, flags);
    }
    return 0;
}

Z
Zdenek Kabelac 已提交
2060
/*
 * Read-close callback: release what the demuxer still holds.
 *
 * Per stream: the ctts table, the data reference paths and array, the
 * stream's own I/O context when it differs from the main one, and the codec
 * palette control. Globally: the DV demuxer with its format context and
 * streams, and the 'trex' table.
 *
 * Always returns 0.
 */
static int mov_read_close(AVFormatContext *s)
{
    MOVContext *mov = s->priv_data;
    int n, k;

    for (n = 0; n < s->nb_streams; n++) {
        AVStream *stream = s->streams[n];
        MOVStreamContext *msc = stream->priv_data;

        av_freep(&msc->ctts_data);

        for (k = 0; k < msc->drefs_count; k++)
            av_freep(&msc->drefs[k].path);
        av_freep(&msc->drefs);

        /* the main I/O context is not ours to close */
        if (msc->pb && msc->pb != s->pb)
            url_fclose(msc->pb);

        av_freep(&stream->codec->palctrl);
    }

    if (mov->dv_demux) {
        for (n = 0; n < mov->dv_fctx->nb_streams; n++) {
            av_freep(&mov->dv_fctx->streams[n]->codec);
            av_freep(&mov->dv_fctx->streams[n]);
        }
        av_freep(&mov->dv_fctx);
        av_freep(&mov->dv_demux);
    }

    av_freep(&mov->trex_data);

    return 0;
}

2093
AVInputFormat mov_demuxer = {
2094
    "mov,mp4,m4a,3gp,3g2,mj2",
2095
    NULL_IF_CONFIG_SMALL("QuickTime/MPEG-4/Motion JPEG 2000 format"),
F
Fabrice Bellard 已提交
2096 2097
    sizeof(MOVContext),
    mov_probe,
2098 2099 2100
    mov_read_header,
    mov_read_packet,
    mov_read_close,
G
Gael Chardon 已提交
2101
    mov_read_seek,
2102
};