/*
 * MOV decoder.
 * Copyright (c) 2001 Fabrice Bellard.
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
19 20

#include <limits.h>
21

B
Baptiste Coudurier 已提交
22
//#define DEBUG
23

24
#include "avformat.h"
25
#include "riff.h"
26
#include "isom.h"
27
#include "dv.h"
28

29 30 31 32
#ifdef CONFIG_ZLIB
#include <zlib.h>
#endif

33 34
/*
 * First version by Francois Revol revol@free.fr
 * Seek function by Gael Chardon gael.dev@4now.net
 *
 * Features and limitations:
 * - reads most of the QT files I have (at least the structure),
 *   the exceptions are .mov with zlib compressed headers ('cmov' section). It shouldn't be hard to implement.
 *   FIXED, Francois Revol, 07/17/2002
 * - ffmpeg has almost none of the usual QuickTime codecs,
 *   although I successfully dumped raw and mp3 audio tracks off .mov files.
 *   Sample QuickTime files with mp3 audio can be found at: http://www.3ivx.com/showcase.html
 * - .mp4 parsing is still hazardous, although the format really is QuickTime with some minor changes
 *   (to make .mov parser crash maybe ?), despite what they say in the MPEG FAQ at
 *   http://mpeg.telecomitalialab.com/faq.htm
 * - the code is quite ugly... maybe I won't do it recursive next time :-)
 * - seek is not supported with files that contain an edit list
 *
 * Funny I didn't know about http://sourceforge.net/projects/qt-ffmpeg/
 * when coding this :) (it's a writer anyway)
 *
 * Reference documents:
 * http://www.geocities.com/xhelmboyx/quicktime/formats/qtm-layout.txt
 * Apple:
 *  http://developer.apple.com/documentation/QuickTime/QTFF/
 *  http://developer.apple.com/documentation/QuickTime/QTFF/qtff.pdf
 * QuickTime is a trademark of Apple (AFAIK :))
 */

61 62
#include "qtpalette.h"

G
Gael Chardon 已提交
63

64 65 66
#undef NDEBUG
#include <assert.h>

Z
Zdenek Kabelac 已提交
67
static const CodecTag mov_video_tags[] = {
68
/*  { CODEC_ID_, MKTAG('c', 'v', 'i', 'd') }, *//* Cinepak */
69 70
/*  { CODEC_ID_H263, MKTAG('r', 'a', 'w', ' ') }, *//* Uncompressed RGB */
/*  { CODEC_ID_H263, MKTAG('Y', 'u', 'v', '2') }, *//* Uncompressed YUV422 */
71
/*    { CODEC_ID_RAWVIDEO, MKTAG('A', 'V', 'U', 'I') }, *//* YUV with alpha-channel (AVID Uncompressed) */
72 73 74 75
/* Graphics */
/* Animation */
/* Apple video */
/* Kodak Photo CD */
76
    { CODEC_ID_MJPEG, MKTAG('j', 'p', 'e', 'g') }, /* PhotoJPEG */
77
    { CODEC_ID_MPEG1VIDEO, MKTAG('m', 'p', 'e', 'g') }, /* MPEG */
78
    { CODEC_ID_MJPEG, MKTAG('m', 'j', 'p', 'a') }, /* Motion-JPEG (format A) */
79
    { CODEC_ID_MJPEGB, MKTAG('m', 'j', 'p', 'b') }, /* Motion-JPEG (format B) */
80 81
    { CODEC_ID_MJPEG, MKTAG('A', 'V', 'D', 'J') }, /* MJPEG with alpha-channel (AVID JFIF meridien compressed) */
/*    { CODEC_ID_MJPEG, MKTAG('A', 'V', 'R', 'n') }, *//* MJPEG with alpha-channel (AVID ABVB/Truevision NuVista) */
82 83
/*    { CODEC_ID_GIF, MKTAG('g', 'i', 'f', ' ') }, *//* embedded gif files as frames (usually one "click to play movie" frame) */
/* Sorenson video */
84 85
    { CODEC_ID_SVQ1, MKTAG('S', 'V', 'Q', '1') }, /* Sorenson Video v1 */
    { CODEC_ID_SVQ1, MKTAG('s', 'v', 'q', '1') }, /* Sorenson Video v1 */
86
    { CODEC_ID_SVQ1, MKTAG('s', 'v', 'q', 'i') }, /* Sorenson Video v1 (from QT specs)*/
M
Michael Niedermayer 已提交
87
    { CODEC_ID_SVQ3, MKTAG('S', 'V', 'Q', '3') }, /* Sorenson Video v3 */
88
    { CODEC_ID_MPEG4, MKTAG('m', 'p', '4', 'v') },
89
    { CODEC_ID_MPEG4, MKTAG('D', 'I', 'V', 'X') }, /* OpenDiVX *//* sample files at http://heroinewarrior.com/xmovie.php3 use this tag */
90
    { CODEC_ID_MPEG4, MKTAG('X', 'V', 'I', 'D') },
91
    { CODEC_ID_MPEG4, MKTAG('3', 'I', 'V', '2') }, /* experimental: 3IVX files before ivx D4 4.5.1 */
92
/*    { CODEC_ID_, MKTAG('I', 'V', '5', '0') }, *//* Indeo 5.0 */
93
    { CODEC_ID_H263, MKTAG('h', '2', '6', '3') }, /* H263 */
94
    { CODEC_ID_H263, MKTAG('s', '2', '6', '3') }, /* H263 ?? works */
F
Fabrice Bellard 已提交
95 96
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', ' ') }, /* DV NTSC */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', 'p') }, /* DV PAL */
97
    { CODEC_ID_VP3, MKTAG('V', 'P', '3', '1') }, /* On2 VP3 */
98 99
    { CODEC_ID_RPZA, MKTAG('r', 'p', 'z', 'a') }, /* Apple Video (RPZA) */
    { CODEC_ID_CINEPAK, MKTAG('c', 'v', 'i', 'd') }, /* Cinepak */
R
Roberto Togni 已提交
100
    { CODEC_ID_8BPS, MKTAG('8', 'B', 'P', 'S') }, /* Planar RGB (8BPS) */
101
    { CODEC_ID_SMC, MKTAG('s', 'm', 'c', ' ') }, /* Apple Graphics (SMC) */
102
    { CODEC_ID_QTRLE, MKTAG('r', 'l', 'e', ' ') }, /* Apple Animation (RLE) */
103
    { CODEC_ID_QDRAW, MKTAG('q', 'd', 'r', 'w') }, /* QuickDraw */
104
    { CODEC_ID_H264, MKTAG('a', 'v', 'c', '1') }, /* AVC-1/H.264 */
105
    { CODEC_ID_MPEG2VIDEO, MKTAG('h', 'd', 'v', '2') }, /* MPEG2 produced by Sony HD camera */
106
    { CODEC_ID_MPEG2VIDEO, MKTAG('h', 'd', 'v', '3') }, /* HDV produced by FCP */
107 108 109 110 111 112 113 114 115
    { CODEC_ID_MPEG2VIDEO, MKTAG('m', 'x', '5', 'n') }, /* MPEG2 IMX NTSC 525/60 50mb/s produced by FCP */
    { CODEC_ID_MPEG2VIDEO, MKTAG('m', 'x', '5', 'p') }, /* MPEG2 IMX PAL 625/50 50mb/s produced by FCP */
    { CODEC_ID_MPEG2VIDEO, MKTAG('m', 'x', '3', 'n') }, /* MPEG2 IMX NTSC 525/60 30mb/s produced by FCP */
    { CODEC_ID_MPEG2VIDEO, MKTAG('m', 'x', '3', 'p') }, /* MPEG2 IMX PAL 625/50 30mb/s produced by FCP */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'p', 'p') }, /* DVCPRO PAL produced by FCP */
    //{ CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'h', '5') }, /* DVCPRO HD 50i produced by FCP */
    //{ CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'h', '6') }, /* DVCPRO HD 60i produced by FCP */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', '5', 'p') }, /* DVCPRO50 PAL produced by FCP */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', '5', 'n') }, /* DVCPRO50 NTSC produced by FCP */
B
Baptiste Coudurier 已提交
116
    { CODEC_ID_DVVIDEO, MKTAG('A', 'V', 'd', 'v') }, /* AVID DV */
117
    //{ CODEC_ID_JPEG2000, MKTAG('m', 'j', 'p', '2') }, /* JPEG 2000 produced by FCP */
118
    { CODEC_ID_RAWVIDEO, MKTAG('2', 'v', 'u', 'y') }, /* UNCOMPRESSED 8BIT 4:2:2 */
119
    { CODEC_ID_NONE, 0 },
120 121
};

Z
Zdenek Kabelac 已提交
122
static const CodecTag mov_audio_tags[] = {
123
    { CODEC_ID_PCM_S32BE, MKTAG('i', 'n', '3', '2') },
124
    { CODEC_ID_PCM_S24BE, MKTAG('i', 'n', '2', '4') },
B
Baptiste Coudurier 已提交
125
    { CODEC_ID_PCM_S16BE, MKTAG('N', 'O', 'N', 'E') }, /* uncompressed */
126
    { CODEC_ID_PCM_S16BE, MKTAG('t', 'w', 'o', 's') }, /* 16 bits */
127
    { CODEC_ID_PCM_U8, MKTAG('r', 'a', 'w', ' ') }, /* 8 bits unsigned */
128 129 130
    { CODEC_ID_PCM_S16LE, MKTAG('s', 'o', 'w', 't') }, /*  */
    { CODEC_ID_PCM_MULAW, MKTAG('u', 'l', 'a', 'w') }, /*  */
    { CODEC_ID_PCM_ALAW, MKTAG('a', 'l', 'a', 'w') }, /*  */
131
    { CODEC_ID_ADPCM_IMA_QT, MKTAG('i', 'm', 'a', '4') }, /* IMA-4 ADPCM */
B
Baptiste Coudurier 已提交
132
    { CODEC_ID_ADPCM_MS, MKTAG('m', 's', 0x00, 0x02) }, /* MS ADPCM */
133 134
    { CODEC_ID_MACE3, MKTAG('M', 'A', 'C', '3') }, /* Macintosh Audio Compression and Expansion 3:1 */
    { CODEC_ID_MACE6, MKTAG('M', 'A', 'C', '6') }, /* Macintosh Audio Compression and Expansion 6:1 */
135

136
    { CODEC_ID_MP3, MKTAG('.', 'm', 'p', '3') }, /* MPEG layer 3 */ /* sample files at http://www.3ivx.com/showcase.html use this tag */
137 138 139 140
    { CODEC_ID_MP2, 0x6D730055 }, /* MPEG layer 3 */
    { CODEC_ID_MP2, 0x5500736D }, /* MPEG layer 3 *//* XXX: check endianness */
/*    { CODEC_ID_OGG_VORBIS, MKTAG('O', 'g', 'g', 'S') }, *//* sample files at http://heroinewarrior.com/xmovie.php3 use this tag */
/* MP4 tags */
141
    { CODEC_ID_AAC, MKTAG('m', 'p', '4', 'a') }, /* MPEG-4 AAC */
142
    /* The standard for mpeg4 audio is still not normalised AFAIK anyway */
143
    { CODEC_ID_AMR_NB, MKTAG('s', 'a', 'm', 'r') }, /* AMR-NB 3gp */
144
    { CODEC_ID_AMR_WB, MKTAG('s', 'a', 'w', 'b') }, /* AMR-WB 3gp */
145
    { CODEC_ID_AC3, MKTAG('m', 's', 0x20, 0x00) }, /* Dolby AC-3 */
146
    { CODEC_ID_ALAC,MKTAG('a', 'l', 'a', 'c') }, /* Apple Lossless */
R
Roberto Togni 已提交
147
    { CODEC_ID_QDM2,MKTAG('Q', 'D', 'M', '2') }, /* QDM2 */
148 149
    { CODEC_ID_DVAUDIO, MKTAG('v', 'd', 'v', 'a') },
    { CODEC_ID_DVAUDIO, MKTAG('d', 'v', 'c', 'a') },
150
    { CODEC_ID_NONE, 0 },
151 152 153 154 155 156 157 158 159 160 161 162 163
};

/* the QuickTime file format is quite convoluted...
 * it has lots of index tables, each indexing something in another one...
 * Here we just use what is needed to read the chunks
 */

/*
 * One row of a track's sample-to-chunk index.
 * NOTE(review): the field names suggest the three values of an 'stsc' entry
 * (first chunk, samples per chunk, sample description id); the reader that
 * fills them is outside this part of the file -- confirm there.
 */
struct MOV_sample_to_chunk_tbl {
    long first;
    long count;
    long id;
};
typedef struct MOV_sample_to_chunk_tbl MOV_sample_to_chunk_tbl;

164 165 166 167 168 169 170 171 172 173 174 175 176
/* Header information of one atom, passed by value to the atom readers. */
typedef struct {
    uint32_t type;      /* atom fourcc as read with get_le32() */
    int64_t  offset;    /* stream position tracked by the container parser */
    int64_t  size;      /* total size (excluding the size and type fields) */
} MOV_atom_t;

/* Colour table ('ctab' atom) contents; currently never filled in, because
 * the 'ctab' reader just skips the atom. */
typedef struct {
    int   seed;
    int   flags;
    int   size;
    void *clrs;
} MOV_ctab_t;

177 178 179 180 181
/* Position and payload size of one 'mdat' atom, as recorded by the 'mdat'
 * reader for every media-data atom it meets. */
typedef struct MOV_mdat_atom_s {
    offset_t offset;    /* atom.offset of the mdat atom */
    int64_t  size;      /* atom.size of the mdat atom */
} MOV_mdat_atom_t;

182 183 184 185 186 187
/* MPEG-4 descriptor tags used while walking an 'esds' atom. */
#define MP4ODescrTag                    0x01
#define MP4IODescrTag                   0x02
#define MP4ESDescrTag                   0x03
#define MP4DecConfigDescrTag            0x04
#define MP4DecSpecificDescrTag          0x05
#define MP4SLConfigDescrTag             0x06
#define MP4ContentIdDescrTag            0x07
#define MP4SupplContentIdDescrTag       0x08
#define MP4IPIPtrDescrTag               0x09
#define MP4IPMPPtrDescrTag              0x0A
#define MP4IPMPDescrTag                 0x0B
#define MP4RegistrationDescrTag         0x0D
#define MP4ESIDIncDescrTag              0x0E
#define MP4ESIDRefDescrTag              0x0F
#define MP4FileIODescrTag               0x10
#define MP4FileODescrTag                0x11
#define MP4ExtProfileLevelDescrTag      0x13
#define MP4ExtDescrTagsStart            0x80
#define MP4ExtDescrTagsEnd              0xFE

/*
 * Fields of an elementary stream descriptor ('esds' atom), grouped by the
 * descriptor they come from. The 'esds' reader in this file fills in only the
 * DecConfigDescr members (object_type_id .. avg_bitrate).
 */
typedef struct {
    uint8_t  version;
    uint32_t flags; // 24bit

    /* 0x03 ESDescrTag */
    uint16_t es_id;
    uint8_t  stream_priority;

    /* 0x04 DecConfigDescrTag */
    uint8_t  object_type_id;
    uint8_t  stream_type;
    /* XXX: really streamType is
     * only 6bit, followed by:
     * 1bit  upStream
     * 1bit  reserved
     */
    uint32_t buffer_size_db; // 24
    uint32_t max_bitrate;
    uint32_t avg_bitrate;

    /* 0x05 DecSpecificDescrTag */
    uint8_t  decoder_cfg_len;
    uint8_t *decoder_cfg;

    /* 0x06 SLConfigDescrTag */
    uint8_t  sl_config_len;
    uint8_t *sl_config;
} MOV_esds_t;

230 231
struct MOVParseTableEntry;

232 233 234 235
typedef struct MOVStreamContext {
    int ffindex; /* the ffmpeg stream id */
    long next_chunk;
    long chunk_count;
236
    int64_t *chunk_offsets;
M
cleanup  
Michael Niedermayer 已提交
237 238
    int stts_count;
    Time2Sample *stts_data;
M
Michael Niedermayer 已提交
239 240
    int ctts_count;
    Time2Sample *ctts_data;
M
cleanup  
Michael Niedermayer 已提交
241
    int edit_count;             /* number of 'edit' (elst atom) */
242 243
    long sample_to_chunk_sz;
    MOV_sample_to_chunk_tbl *sample_to_chunk;
M
Michael Niedermayer 已提交
244 245
    int sample_to_ctime_index;
    int sample_to_ctime_sample;
246 247 248
    long sample_size;
    long sample_count;
    long *sample_sizes;
249 250
    long keyframe_count;
    long *keyframes;
251
    int time_scale;
252
    int time_rate;
253
    long current_sample;
254
    MOV_esds_t esds;
255
    AVRational sample_size_v1;
256
    int dv_audio_container;
257 258 259 260 261
} MOVStreamContext;

typedef struct MOVContext {
    int mp4; /* set to 1 as soon as we are sure that the file is an .mp4 file (even some header parsing depends on this) */
    AVFormatContext *fc;
262
    int time_scale;
B
Baptiste Coudurier 已提交
263
    int64_t duration; /* duration of the longest track */
264 265
    int found_moov; /* when both 'moov' and 'mdat' sections has been found */
    int found_mdat; /* we suppose we have enough data to read the file */
266 267
    int64_t mdat_size;
    int64_t mdat_offset;
268 269 270 271 272
    int total_streams;
    /* some streams listed here aren't presented to the ffmpeg API, since they aren't either video nor audio
     * but we need the info to be able to skip data from those streams in the 'mdat' section
     */
    MOVStreamContext *streams[MAX_STREAMS];
273

274 275
    int ctab_size;
    MOV_ctab_t **ctab;           /* color tables */
276 277
    const struct MOVParseTableEntry *parse_table; /* could be eventually used to change the table */
    /* NOTE: for recursion save to/ restore from local variable! */
278 279

    AVPaletteControl palette_control;
280 281
    MOV_mdat_atom_t *mdat_list;
    int mdat_count;
282 283
    DVDemuxContext *dv_demux;
    AVFormatContext *dv_fctx;
284 285 286 287 288 289 290 291 292 293 294
} MOVContext;


/* XXX: it's the first time I make a recursive parser I think... sorry if it's ugly :P */

/* those functions parse an atom */
/* return code:
 1: found what I wanted, exit
 0: continue to parse next atom
 -1: error occurred, exit
 */
295
typedef int (*mov_parse_function)(MOVContext *ctx, ByteIOContext *pb, MOV_atom_t atom);
296 297 298

/* links atom IDs to parse functions */
typedef struct MOVParseTableEntry {
299
    uint32_t type;
300 301 302
    mov_parse_function func;
} MOVParseTableEntry;

303
/**
 * Skip the payload of an atom whose content is not interpreted.
 *
 * @param c    demuxer context (unused)
 * @param pb   input stream, positioned at the atom payload
 * @param atom atom being skipped; payloads of size <= 1 are left untouched
 * @return always 0 (continue with the next atom)
 */
static int mov_read_leaf(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    if (atom.size > 1)
        url_fskip(pb, atom.size);
    return 0;
}

311
/**
 * Parse the child atoms of a container atom.
 *
 * Reads child headers one after another, dispatches each child whose type is
 * listed in c->parse_table to its reader and skips all others. Parsing stops
 * at end of file, when the container is exhausted, or as soon as a reader
 * returns non-zero.
 *
 * @param c    demuxer context providing the parse table
 * @param pb   input stream, positioned at the first child header
 * @param atom container atom; a negative size means "until end of file"
 * @return 0 to continue, otherwise the non-zero value returned by the child
 *         reader that stopped the loop (1: done, -1: error)
 */
static int mov_read_default(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    int64_t total_size = 0;
    MOV_atom_t a;
    int i;
    int err = 0;

    a.offset = atom.offset;

    if (atom.size < 0)
        atom.size = 0x7fffffffffffffffLL;
    while(((total_size + 8) < atom.size) && !url_feof(pb) && !err) {
        a.size = atom.size;
        a.type=0L;
        if(atom.size >= 8) {
            a.size = get_be32(pb);
            a.type = get_le32(pb);
        }
        total_size += 8;
        a.offset += 8;
        dprintf("type: %08x  %.4s  sz: %"PRIx64"  %"PRIx64"   %"PRIx64"\n", a.type, (char*)&a.type, a.size, atom.size, total_size);
        if (a.size == 1) { /* 64 bit extended size */
            a.size = get_be64(pb) - 8;
            a.offset += 8;
            total_size += 8;
        }
        if (a.size == 0) {
            /* size 0: the child extends to the end of its container */
            a.size = atom.size - total_size;
            if (a.size <= 8)
                break;
        }
        /* look the type up; i ends on the terminating entry if unknown */
        for (i = 0; c->parse_table[i].type != 0L
             && c->parse_table[i].type != a.type; i++)
            /* empty */;

        /* from here on a.size is the payload size (header removed) */
        a.size -= 8;

        if(a.size < 0)
            break;

        /* a child can never be larger than what is left of its container;
         * clamping keeps a corrupt size from dragging the parser (and the
         * offset arithmetic below) past the container's end */
        if (a.size > atom.size - total_size)
            a.size = atom.size - total_size;

        if (c->parse_table[i].type == 0) { /* skip leaf atoms data */
            url_fskip(pb, a.size);
        } else {
            offset_t start_pos = url_ftell(pb);
            int64_t left;
            err = (c->parse_table[i].func)(c, pb, a);
            left = a.size - url_ftell(pb) + start_pos;
            if (left > 0) /* skip garbage at atom end */
                url_fskip(pb, left);
        }

        a.offset += a.size;
        total_size += a.size;
    }

    /* skip trailing bytes of small containers that hold no further child */
    if (!err && total_size < atom.size && atom.size < 0x7ffff) {
        url_fskip(pb, atom.size - total_size);
    }

    return err;
}

373
/**
 * Reader for the 'ctab' (colour table) atom: the payload is skipped.
 *
 * The previous disabled implementation was removed instead of kept under
 * "#if 0": it grew c->ctab by an element count rather than a byte count,
 * indexed one element past the end of the array and wrote through a pointer
 * that was never allocated. A real implementation has to be written from
 * scratch.
 *
 * @return always 0 (continue with the next atom)
 */
static int mov_read_ctab(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    url_fskip(pb, atom.size); // for now

    return 0;
}

397
/**
 * Reader for the 'hdlr' (handler reference) atom.
 *
 * Uses the component type to decide between the .mov and .mp4 flavour
 * (c->mp4) and the component subtype to set the codec type of the most
 * recently created stream.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'hdlr' atom
 * @return always 0 (continue with the next atom)
 */
static int mov_read_hdlr(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = NULL;
    int len = 0;
    uint32_t type;
    uint32_t ctype;

    /* a 'hdlr' met before any stream exists must not index streams[-1] */
    if (c->fc->nb_streams >= 1)
        st = c->fc->streams[c->fc->nb_streams-1];

    get_byte(pb); /* version */
    get_byte(pb); get_byte(pb); get_byte(pb); /* flags */

    /* component type */
    ctype = get_le32(pb);
    type = get_le32(pb); /* component subtype */

    dprintf("ctype= %c%c%c%c (0x%08lx)\n", *((char *)&ctype), ((char *)&ctype)[1], ((char *)&ctype)[2], ((char *)&ctype)[3], (long) ctype);
    dprintf("stype= %c%c%c%c\n", *((char *)&type), ((char *)&type)[1], ((char *)&type)[2], ((char *)&type)[3]);
    if(ctype == MKTAG('m', 'h', 'l', 'r')) /* MOV */
        c->mp4 = 0;
    else if(ctype == 0)
        c->mp4 = 1;
    if (st) {
        if(type == MKTAG('v', 'i', 'd', 'e'))
            st->codec->codec_type = CODEC_TYPE_VIDEO;
        else if(type == MKTAG('s', 'o', 'u', 'n'))
            st->codec->codec_type = CODEC_TYPE_AUDIO;
    }
    get_be32(pb); /* component  manufacture */
    get_be32(pb); /* component flags */
    get_be32(pb); /* component flags mask */

    if(atom.size <= 24)
        return 0; /* nothing left to read */
    /* XXX: MP4 uses a C string, not a pascal one */
    /* component name */

    if(c->mp4) {
        /* .mp4: C string */
        while(get_byte(pb) && (++len < (atom.size - 24)));
    } else {
        /* .mov: PASCAL string */
        len = get_byte(pb);
        url_fskip(pb, len);
    }

    /* move to the end of the atom, whatever the name length was */
    url_fskip(pb, atom.size - (url_ftell(pb) - atom.offset));
    return 0;
}

443
/**
 * Read the variable-length size field of an MPEG-4 descriptor.
 *
 * Each byte contributes its low 7 bits, most significant group first; a set
 * top bit announces another byte. At most 4 bytes are consumed.
 *
 * @param pb input stream, positioned at the length field
 * @return the decoded length (at most 28 bits)
 */
static int mov_mp4_read_descr_len(ByteIOContext *pb)
{
    int len = 0;
    int count = 4;
    while (count--) {
        int c = get_byte(pb);
        len = (len << 7) | (c & 0x7f);
        if (!(c & 0x80))
            break;
    }
    return len;
}

456
/**
 * Read the header of an MPEG-4 descriptor: one tag byte followed by the
 * variable-length size.
 *
 * @param pb  input stream, positioned at the descriptor tag
 * @param tag receives the descriptor tag
 * @return the descriptor length
 */
static int mov_mp4_read_descr(ByteIOContext *pb, int *tag)
{
    int len;
    *tag = get_byte(pb);
    len = mov_mp4_read_descr_len(pb);
    dprintf("MPEG4 description: tag=0x%02x len=%d\n", *tag, len);
    return len;
}

465
/**
 * Reader for the 'esds' (elementary stream descriptor) atom.
 *
 * Walks ESDescr -> DecConfigDescr -> DecSpecificDescr, stores the decoder
 * configuration values in the stream context, derives the codec id from the
 * object type and keeps the decoder specific info as codec extradata.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'esds' atom
 * @return always 0 (continue with the next atom)
 */
static int mov_read_esds(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    int tag, len;

    /* an 'esds' met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    /* Well, broken but sufficient for some MP4 streams */
    get_be32(pb); /* version + flags */
    len = mov_mp4_read_descr(pb, &tag);
    if (tag == MP4ESDescrTag) {
        get_be16(pb); /* ID */
        get_byte(pb); /* priority */
    } else
        get_be16(pb); /* ID */

    len = mov_mp4_read_descr(pb, &tag);
    if (tag == MP4DecConfigDescrTag) {
        sc->esds.object_type_id = get_byte(pb);
        sc->esds.stream_type = get_byte(pb);
        sc->esds.buffer_size_db = get_be24(pb);
        sc->esds.max_bitrate = get_be32(pb);
        sc->esds.avg_bitrate = get_be32(pb);

        st->codec->codec_id= codec_get_id(ff_mov_obj_type, sc->esds.object_type_id);
        dprintf("esds object type id %d\n", sc->esds.object_type_id);
        len = mov_mp4_read_descr(pb, &tag);
        if (tag == MP4DecSpecificDescrTag) {
            dprintf("Specific MPEG4 header len=%d\n", len);
            /* drop extradata set by an earlier atom instead of leaking it,
             * as the other extradata readers in this file do */
            av_free(st->codec->extradata);
            st->codec->extradata_size = 0;
            st->codec->extradata = av_mallocz(len + FF_INPUT_BUFFER_PADDING_SIZE);
            if (st->codec->extradata) {
                get_buffer(pb, st->codec->extradata, len);
                st->codec->extradata_size = len;
                /* from mplayer */
                if ((*(uint8_t *)st->codec->extradata >> 3) == 29) {
                    st->codec->codec_id = CODEC_ID_MP3ON4;
                }
            }
        }
    }
    return 0;
}

507 508
/**
 * Reader for the 'mdat' atom, which contains the actual media data.
 *
 * Appends the atom's position and size to c->mdat_list and remembers them as
 * the current mdat. Zero-sized atoms are ignored.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'mdat' atom
 * @return 1 if 'moov' was already parsed (both found, stop), 0 to go on
 *         looking for 'moov', -1 if the mdat list cannot be grown
 */
static int mov_read_mdat(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    MOV_mdat_atom_t *list;

    if(atom.size == 0) /* wrong one (MP4) */
        return 0;
    /* grow through a temporary so a failed realloc neither loses the old
     * list nor gets dereferenced below */
    list = av_realloc(c->mdat_list, (c->mdat_count + 1) * sizeof(*c->mdat_list));
    if (!list)
        return -1;
    c->mdat_list = list;
    c->mdat_list[c->mdat_count].offset = atom.offset;
    c->mdat_list[c->mdat_count].size = atom.size;
    c->mdat_count++;
    c->found_mdat=1;
    c->mdat_offset = atom.offset;
    c->mdat_size = atom.size;
    if(c->found_moov)
        return 1; /* found both, just go */
    url_fskip(pb, atom.size);
    return 0; /* now go for moov */
}

525 526 527 528 529 530 531 532 533 534 535 536 537 538 539 540 541 542
/**
 * Reader for the 'ftyp' (file type) atom.
 *
 * Marks the file as .mp4 when the major brand is one of the known ISO media
 * brands, logs the brand, and skips the rest of the atom.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'ftyp' atom
 * @return always 0 (continue with the next atom)
 */
static int mov_read_ftyp(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    uint32_t type = get_le32(pb);

    /* from mplayer */
    switch (type) {
    case MKTAG('i', 's', 'o', 'm'):
    case MKTAG('m', 'p', '4', '1'):
    case MKTAG('m', 'p', '4', '2'):
    case MKTAG('3', 'g', 'p', '1'):
    case MKTAG('3', 'g', 'p', '2'):
    case MKTAG('3', 'g', '2', 'a'):
    case MKTAG('3', 'g', 'p', '3'):
    case MKTAG('3', 'g', 'p', '4'):
    case MKTAG('3', 'g', 'p', '5'):
    case MKTAG('m', 'm', 'p', '4'): /* Mobile MP4 */
    case MKTAG('M', '4', 'A', ' '): /* Apple iTunes AAC-LC Audio */
    case MKTAG('M', '4', 'P', ' '): /* Apple iTunes AAC-LC Protected Audio */
    case MKTAG('m', 'j', 'p', '2'): /* Motion Jpeg 2000 */
        c->mp4 = 1;
        /* fallthrough: the brand is logged for every file */
    case MKTAG('q', 't', ' ', ' '):
    default:
        av_log(c->fc, AV_LOG_DEBUG, "ISO: File Type Major Brand: %.4s\n",(char *)&type);
    }
    get_be32(pb); /* minor version */
    url_fskip(pb, atom.size - 8); /* compatible brands */
    return 0;
}

554 555 556 557
/**
 * Reader for the 'moov' atom, which should contain all header atoms.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'moov' atom
 * @return 1 if 'mdat' was already found (both found, stop), 0 to go on
 *         looking for 'mdat', or the negative error reported while parsing
 *         the children
 */
static int mov_read_moov(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    int err;

    err = mov_read_default(c, pb, atom);
    /* a failed header parse must not be reported as a usable 'moov' */
    if (err < 0)
        return err;
    /* we parsed the 'moov' atom, we can terminate the parsing as soon as we find the 'mdat' */
    /* so we don't parse the whole file if over a network */
    c->found_moov=1;
    if(c->found_mdat)
        return 1; /* found both, just go */
    return 0; /* now go for mdat */
}


/**
 * Reader for the 'mdhd' (media header) atom.
 *
 * Stores the media time scale in the stream context, the duration in the
 * stream, and converts the language code to the stream's language string.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'mdhd' atom
 * @return 0 to continue, -1 if the atom version is not supported
 */
static int mov_read_mdhd(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    int version;
    int lang;

    /* an 'mdhd' met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    version = get_byte(pb);
    if (version > 1)
        return -1; /* unsupported: an error, not "found what I wanted" */

    get_byte(pb); get_byte(pb);
    get_byte(pb); /* flags */

    /* version 1 stores the two timestamps as 64 bit values */
    if (version == 1) {
        get_be64(pb);
        get_be64(pb);
    } else {
        get_be32(pb); /* creation time */
        get_be32(pb); /* modification time */
    }

    sc->time_scale = get_be32(pb);
    st->duration = (version == 1) ? get_be64(pb) : get_be32(pb); /* duration */

    lang = get_be16(pb); /* language */
    ff_mov_lang_to_iso639(lang, st->language);
    get_be16(pb); /* quality */

    return 0;
}

/**
 * Reader for the 'mvhd' (movie header) atom.
 *
 * Stores the movie time scale and duration in the demuxer context; all other
 * fields are read and discarded.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'mvhd' atom
 * @return always 0 (continue with the next atom)
 */
static int mov_read_mvhd(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    int version = get_byte(pb); /* version */
    get_byte(pb); get_byte(pb); get_byte(pb); /* flags */

    /* version 1 stores the two timestamps as 64 bit values */
    if (version == 1) {
        get_be64(pb);
        get_be64(pb);
    } else {
        get_be32(pb); /* creation time */
        get_be32(pb); /* modification time */
    }
    c->time_scale = get_be32(pb); /* time scale */
#ifdef DEBUG
    av_log(NULL, AV_LOG_DEBUG, "time scale = %i\n", c->time_scale);
#endif
    c->duration = (version == 1) ? get_be64(pb) : get_be32(pb); /* duration */
    get_be32(pb); /* preferred scale */

    get_be16(pb); /* preferred volume */

    url_fskip(pb, 10); /* reserved */

    url_fskip(pb, 36); /* display matrix */

    get_be32(pb); /* preview time */
    get_be32(pb); /* preview duration */
    get_be32(pb); /* poster time */
    get_be32(pb); /* selection time */
    get_be32(pb); /* selection duration */
    get_be32(pb); /* current time */
    get_be32(pb); /* next track ID */

    return 0;
}

636 637 638 639
/**
 * Reader for the Sorenson 'SMI ' atom.
 *
 * Replaces the stream's extradata with a faked sample description: a 0x5a
 * byte header starting with "SVQ3", followed by the atom payload.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'SMI ' atom
 * @return 0 to continue, -1 if the atom is implausibly large
 */
static int mov_read_smi(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;

    /* an atom met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if((uint64_t)atom.size > (1<<30))
        return -1;

    // currently SVQ3 decoder expect full STSD header - so let's fake it
    // this should be fixed and just SMI header should be passed
    av_free(st->codec->extradata);
    /* the size is published only once the buffer exists, so a failed
     * allocation never leaves a non-zero size next to a NULL pointer */
    st->codec->extradata_size = 0;
    st->codec->extradata = av_mallocz(0x5a + atom.size + FF_INPUT_BUFFER_PADDING_SIZE);

    if (st->codec->extradata) {
        st->codec->extradata_size = 0x5a + atom.size;
        strcpy((char *)st->codec->extradata, "SVQ3"); // fake
        get_buffer(pb, st->codec->extradata + 0x5a, atom.size);
        dprintf("Reading SMI %"PRId64"  %s\n", atom.size, (char*)st->codec->extradata + 0x5a);
    } else
        url_fskip(pb, atom.size);

    return 0;
}
658

659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692
/**
 * Reader for the 'enda' (audio endianness) atom.
 *
 * When the atom flags little-endian samples, the big-endian 24 and 32 bit
 * PCM codec ids of the current stream are replaced by their little-endian
 * counterparts; other codec ids are left alone.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'enda' atom
 * @return always 0 (continue with the next atom)
 */
static int mov_read_enda(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;
    int little_endian;

    /* an 'enda' met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    little_endian = get_be16(pb);
    if (little_endian) {
        switch (st->codec->codec_id) {
        case CODEC_ID_PCM_S24BE:
            st->codec->codec_id = CODEC_ID_PCM_S24LE;
            break;
        case CODEC_ID_PCM_S32BE:
            st->codec->codec_id = CODEC_ID_PCM_S32LE;
            break;
        default:
            break;
        }
    }
    return 0;
}

/**
 * Reader for the 'alac' (Apple Lossless configuration) atom.
 *
 * Replaces the stream's extradata with a faked 36 byte atom: 4 zero bytes,
 * the tag "alac", then 28 bytes read from the stream.
 * NOTE(review): 28 bytes are read regardless of atom.size -- confirm that
 * shorter 'alac' atoms cannot occur or bound the read.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'alac' atom
 * @return always 0 (continue with the next atom)
 */
static int mov_read_alac(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;

    /* an atom met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    // currently ALAC decoder expect full atom header - so let's fake it
    // this should be fixed and just ALAC header should be passed

    av_free(st->codec->extradata);
    /* the size is published only once the buffer exists, so a failed
     * allocation never leaves a non-zero size next to a NULL pointer */
    st->codec->extradata_size = 0;
    st->codec->extradata = av_mallocz(36 + FF_INPUT_BUFFER_PADDING_SIZE);

    if (st->codec->extradata) {
        st->codec->extradata_size = 36;
        strcpy((char *)st->codec->extradata + 4, "alac"); // fake
        get_buffer(pb, st->codec->extradata + 8, 36 - 8);
        dprintf("Reading alac %d  %s\n", st->codec->extradata_size, (char*)st->codec->extradata);
    } else
        url_fskip(pb, atom.size);
    return 0;
}

R
Roberto Togni 已提交
699 700 701 702 703 704
/**
 * Reader for the 'wave' atom.
 *
 * For QDM2 streams the whole payload becomes the codec extradata; otherwise
 * the payload is parsed as a container (for its 'frma' / 'esds' children) or,
 * if too small to hold a child, skipped.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'wave' atom
 * @return 0 to continue, -1 if the atom is implausibly large or a child
 *         reader reported an error
 */
static int mov_read_wave(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;

    /* an atom met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if((uint64_t)atom.size > (1<<30))
        return -1;

    if (st->codec->codec_id == CODEC_ID_QDM2) {
        // pass all frma atom to codec, needed at least for QDM2
        av_free(st->codec->extradata);
        /* the size is published only once the buffer exists, so a failed
         * allocation never leaves a non-zero size next to a NULL pointer */
        st->codec->extradata_size = 0;
        st->codec->extradata = av_mallocz(atom.size + FF_INPUT_BUFFER_PADDING_SIZE);

        if (st->codec->extradata) {
            st->codec->extradata_size = atom.size;
            get_buffer(pb, st->codec->extradata, atom.size);
        } else
            url_fskip(pb, atom.size);
    } else if (atom.size > 8) { /* to read frma, esds atoms */
        /* errors of the nested readers are no longer dropped */
        if (mov_read_default(c, pb, atom) < 0)
            return -1;
    } else
        url_fskip(pb, atom.size);
    return 0;
}

723 724 725 726 727 728 729 730 731 732 733 734 735 736 737 738 739 740 741 742 743
/**
 * Reader for the 'jp2h' (JPEG 2000 header) atom.
 *
 * Replaces the stream's extradata with a rebuilt atom: 4 zero bytes, the tag
 * "jp2h", then the atom payload.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'jp2h' atom
 * @return 0 to continue, -1 if the atom is implausibly large
 */
static int mov_read_jp2h(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;

    /* an atom met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if((uint64_t)atom.size > (1<<30))
        return -1;

    av_free(st->codec->extradata);

    /* the size is published only once the buffer exists, so a failed
     * allocation never leaves a non-zero size next to a NULL pointer */
    st->codec->extradata_size = 0;
    st->codec->extradata = av_mallocz(atom.size + 8 + FF_INPUT_BUFFER_PADDING_SIZE);

    /* pass all jp2h atom to codec */
    if (st->codec->extradata) {
        st->codec->extradata_size = atom.size + 8;
        strcpy((char *)st->codec->extradata + 4, "jp2h");
        get_buffer(pb, st->codec->extradata + 8, atom.size);
    } else
        url_fskip(pb, atom.size);
    return 0;
}

744 745 746 747
/**
 * Reader for the 'avcC' (H.264 decoder configuration) atom.
 *
 * The atom payload replaces the stream's codec extradata verbatim.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'avcC' atom
 * @return 0 to continue, -1 if the atom is implausibly large
 */
static int mov_read_avcC(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;

    /* an atom met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];

    if((uint64_t)atom.size > (1<<30))
        return -1;

    av_free(st->codec->extradata);

    /* the size is published only once the buffer exists, so a failed
     * allocation never leaves a non-zero size next to a NULL pointer */
    st->codec->extradata_size = 0;
    st->codec->extradata = av_mallocz(atom.size + FF_INPUT_BUFFER_PADDING_SIZE);

    if (st->codec->extradata) {
        st->codec->extradata_size = atom.size;
        get_buffer(pb, st->codec->extradata, atom.size);
    } else
        url_fskip(pb, atom.size);

    return 0;
}

764 765 766 767
/**
 * Reader for the chunk offset atoms 'stco' (32 bit offsets) and 'co64'
 * (64 bit offsets).
 *
 * Fills sc->chunk_offsets / sc->chunk_count of the current stream. The count
 * is published only after the table has been allocated, so an error never
 * leaves a non-zero count next to a missing table.
 *
 * @param c    demuxer context
 * @param pb   input stream, positioned at the atom payload
 * @param atom the 'stco' or 'co64' atom
 * @return 0 to continue, -1 on an unexpected atom type, an implausible entry
 *         count or allocation failure
 */
static int mov_read_stco(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;
    MOVStreamContext *sc;
    unsigned int i, entries;
    int wide_offsets;

    /* an atom met before any stream exists must not index streams[-1];
     * the caller skips the unread payload */
    if (c->fc->nb_streams < 1)
        return 0;
    st = c->fc->streams[c->fc->nb_streams-1];
    sc = st->priv_data;

    /* reject unknown atom types before touching the stream context */
    if (atom.type == MKTAG('s', 't', 'c', 'o'))
        wide_offsets = 0;
    else if (atom.type == MKTAG('c', 'o', '6', '4'))
        wide_offsets = 1;
    else
        return -1;

    get_byte(pb); /* version */
    get_byte(pb); get_byte(pb); get_byte(pb); /* flags */

    entries = get_be32(pb);

    /* keep entries * sizeof(int64_t) from overflowing */
    if(entries >= UINT_MAX/sizeof(int64_t))
        return -1;

    /* an empty table needs no allocation */
    if (!entries) {
        sc->chunk_count = 0;
        return 0;
    }

    sc->chunk_offsets = av_malloc(entries * sizeof(int64_t));
    if (!sc->chunk_offsets) {
        sc->chunk_count = 0;
        return -1;
    }
    sc->chunk_count = entries;

    if (wide_offsets) {
        for(i=0; i<entries; i++)
            sc->chunk_offsets[i] = get_be64(pb);
    } else {
        for(i=0; i<entries; i++)
            sc->chunk_offsets[i] = get_be32(pb);
    }

    return 0;
}

/**
 * Parse the 'stsd' (sample description) atom of the current track.
 *
 * For the first description entry the codec tag is mapped to a codec id
 * (audio table first, then the video tables) and the video or audio specific
 * fields are read into st->codec; any further entries are skipped. For
 * 2/4/8 bit video a palette is built (greyscale ramp, built-in default
 * palette, or a palette stored in the file). Atoms trailing an entry are
 * handed to mov_read_default(). Finally a few codecs get their parameters
 * reset so the decoder can fill them in, and DV audio sets up the DV
 * demuxer.
 *
 * @return 0 on success, -1 if the DV demuxer cannot be set up.
 */
static int mov_read_stsd(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    MOVStreamContext *sc = (MOVStreamContext *)st->priv_data;
    int entries, frames_per_sample;
    uint32_t format;
    uint8_t codec_name[32];

    /* for palette traversal */
    int color_depth;
    unsigned int color_start;
    int color_count;
    unsigned int color_end;
    int color_index;
    int color_dec;
    int color_greyscale;
    unsigned char *color_table;
    int j;
    unsigned int k;
    unsigned char r, g, b;

    get_byte(pb); /* version */
    get_byte(pb); get_byte(pb); get_byte(pb); /* flags */

    entries = get_be32(pb);

    while(entries--) { //Parsing Sample description table
        enum CodecID id;
        MOV_atom_t a = { 0, 0, 0 };
        offset_t start_pos = url_ftell(pb);
        int size = get_be32(pb); /* size */
        format = get_le32(pb); /* data format */

        get_be32(pb); /* reserved */
        get_be16(pb); /* reserved */
        get_be16(pb); /* index */

        if (st->codec->codec_tag) {
            /* multiple fourcc, just skip for now */
            url_fskip(pb, size - (url_ftell(pb) - start_pos));
            continue;
        }

        st->codec->codec_tag = format;
        id = codec_get_id(mov_audio_tags, format);
        if (id > 0) {
            st->codec->codec_type = CODEC_TYPE_AUDIO;
        } else if (format && format != MKTAG('m', 'p', '4', 's')) { /* skip old asf mpeg4 tag */
            id = codec_get_id(mov_video_tags, format);
            if (id <= 0)
                id = codec_get_id(codec_bmp_tags, format);
            if (id > 0)
                st->codec->codec_type = CODEC_TYPE_VIDEO;
        }

        dprintf("size=%d 4CC= %c%c%c%c codec_type=%d\n",
                size,
                (format >> 0) & 0xff, (format >> 8) & 0xff, (format >> 16) & 0xff, (format >> 24) & 0xff,
                st->codec->codec_type);

        if(st->codec->codec_type==CODEC_TYPE_VIDEO) {
            st->codec->codec_id = id;
            get_be16(pb); /* version */
            get_be16(pb); /* revision level */
            get_be32(pb); /* vendor */
            get_be32(pb); /* temporal quality */
            get_be32(pb); /* spatial quality */

            st->codec->width = get_be16(pb); /* width */
            st->codec->height = get_be16(pb); /* height */

            get_be32(pb); /* horiz resolution */
            get_be32(pb); /* vert resolution */
            get_be32(pb); /* data size, always 0 */
            frames_per_sample = get_be16(pb); /* frames per samples */
#ifdef DEBUG
            av_log(NULL, AV_LOG_DEBUG, "frames/samples = %d\n", frames_per_sample);
#endif
            get_buffer(pb, codec_name, 32); /* codec name, pascal string (FIXME: true for mp4?) */
            /* first byte is the string length; only accept lengths that
             * fit in the remaining 31 bytes */
            if (codec_name[0] <= 31) {
                memcpy(st->codec->codec_name, &codec_name[1],codec_name[0]);
                st->codec->codec_name[codec_name[0]] = 0;
            }

            st->codec->bits_per_sample = get_be16(pb); /* depth */
            st->codec->color_table_id = get_be16(pb); /* colortable id */

            /* figure out the palette situation */
            color_depth = st->codec->bits_per_sample & 0x1F;
            color_greyscale = st->codec->bits_per_sample & 0x20;

            /* if the depth is 2, 4, or 8 bpp, file is palettized */
            if ((color_depth == 2) || (color_depth == 4) ||
                (color_depth == 8)) {

                if (color_greyscale) {

                    /* compute the greyscale palette */
                    color_count = 1 << color_depth;
                    color_index = 255;
                    color_dec = 256 / (color_count - 1);
                    for (j = 0; j < color_count; j++) {
                        r = g = b = color_index;
                        c->palette_control.palette[j] =
                            (r << 16) | (g << 8) | (b);
                        color_index -= color_dec;
                        if (color_index < 0)
                            color_index = 0;
                    }

                } else if (st->codec->color_table_id & 0x08) {

                    /* if flag bit 3 is set, use the default palette */
                    color_count = 1 << color_depth;
                    if (color_depth == 2)
                        color_table = ff_qt_default_palette_4;
                    else if (color_depth == 4)
                        color_table = ff_qt_default_palette_16;
                    else
                        color_table = ff_qt_default_palette_256;

                    for (j = 0; j < color_count; j++) {
                        r = color_table[j * 4 + 0];
                        g = color_table[j * 4 + 1];
                        b = color_table[j * 4 + 2];
                        c->palette_control.palette[j] =
                            (r << 16) | (g << 8) | (b);
                    }

                } else {

                    /* load the palette from the file */
                    color_start = get_be32(pb);
                    color_count = get_be16(pb);
                    color_end = get_be16(pb);
                    /* Both indices come straight from the file. The other
                     * branches fill at most 256 entries, so refuse anything
                     * beyond index 255 instead of writing past the palette.
                     * An invalid range leaves the palette untouched; the
                     * unread bytes are dealt with by the trailing-data
                     * handling at the end of this entry. */
                    if ((color_start <= 255) && (color_end <= 255)) {
                        for (k = color_start; k <= color_end; k++) {
                            /* each R, G, or B component is 16 bits;
                             * only use the top 8 bits; skip alpha bytes
                             * up front */
                            get_byte(pb);
                            get_byte(pb);
                            r = get_byte(pb);
                            get_byte(pb);
                            g = get_byte(pb);
                            get_byte(pb);
                            b = get_byte(pb);
                            get_byte(pb);
                            c->palette_control.palette[k] =
                                (r << 16) | (g << 8) | (b);
                        }
                    }
                }

                st->codec->palctrl = &c->palette_control;
                st->codec->palctrl->palette_changed = 1;
            } else
                st->codec->palctrl = NULL;
        } else if(st->codec->codec_type==CODEC_TYPE_AUDIO) {
            int bits_per_sample;
            uint16_t version = get_be16(pb);

            st->codec->codec_id = id;
            get_be16(pb); /* revision level */
            get_be32(pb); /* vendor */

            st->codec->channels = get_be16(pb);             /* channel count */
            dprintf("audio channels %d\n", st->codec->channels);
            st->codec->bits_per_sample = get_be16(pb);      /* sample size */
            /* do we need to force to 16 for AMR ? */

            /* handle specific s8 codec */
            get_be16(pb); /* compression id = 0*/
            get_be16(pb); /* packet size = 0 */

            /* 16.16 fixed point, keep the integer part */
            st->codec->sample_rate = ((get_be32(pb) >> 16));

            switch (st->codec->codec_id) {
            case CODEC_ID_PCM_S8:
            case CODEC_ID_PCM_U8:
                if (st->codec->bits_per_sample == 16)
                    st->codec->codec_id = CODEC_ID_PCM_S16BE;
                break;
            case CODEC_ID_PCM_S16LE:
            case CODEC_ID_PCM_S16BE:
                if (st->codec->bits_per_sample == 8)
                    st->codec->codec_id = CODEC_ID_PCM_S8;
                break;
            case CODEC_ID_AMR_WB:
                st->codec->sample_rate = 16000; /* should really we ? */
                st->codec->channels=1; /* really needed */
                break;
            case CODEC_ID_AMR_NB:
                st->codec->sample_rate = 8000; /* should really we ? */
                st->codec->channels=1; /* really needed */
                break;
            default:
                break;
            }

            bits_per_sample = av_get_bits_per_sample(st->codec->codec_id);
            if (bits_per_sample) {
                st->codec->bits_per_sample = bits_per_sample;
                sc->sample_size = (bits_per_sample >> 3) * st->codec->channels;
            }

            //Read QT version 1 fields. In version 0 these don't exist
            dprintf("version =%d mp4=%d\n",version,c->mp4);
            if(version==1) {
                sc->sample_size_v1.den = get_be32(pb); /* samples per packet */
                get_be32(pb); /* bytes per packet */
                sc->sample_size_v1.num = get_be32(pb); /* bytes per frame */
                get_be32(pb); /* bytes per sample */
            } else if(version==2) {
                get_be32(pb); /* sizeof struct only */
                st->codec->sample_rate = av_int2dbl(get_be64(pb)); /* float 64 */
                st->codec->channels = get_be32(pb);
                get_be32(pb); /* always 0x7F000000 */
                get_be32(pb); /* bits per channel if sound is uncompressed */
                get_be32(pb); /* lpcm format specific flag */
                get_be32(pb); /* bytes per audio packet if constant */
                get_be32(pb); /* lpcm frames per audio packet if constant */
            }
        } else {
            /* other codec type, just skip (rtp, mp4s, tmcd ...) */
            url_fskip(pb, size - (url_ftell(pb) - start_pos));
        }
        /* this will read extra atoms at the end (wave, alac, damr, avcC, SMI ...) */
        a.size = size - (url_ftell(pb) - start_pos);
        if (a.size > 8)
            mov_read_default(c, pb, a);
        else if (a.size > 0)
            url_fskip(pb, a.size);
    }

    /* no sample rate in the description: fall back to the media time scale */
    if(st->codec->codec_type==CODEC_TYPE_AUDIO && st->codec->sample_rate==0 && sc->time_scale>1) {
        st->codec->sample_rate= sc->time_scale;
    }

    /* special codec parameters handling */
    switch (st->codec->codec_id) {
#ifdef CONFIG_H261_DECODER
    case CODEC_ID_H261:
#endif
#ifdef CONFIG_H263_DECODER
    case CODEC_ID_H263:
#endif
#ifdef CONFIG_MPEG4_DECODER
    case CODEC_ID_MPEG4:
#endif
        st->codec->width= 0; /* let decoder init width/height */
        st->codec->height= 0;
        break;
#ifdef CONFIG_FAAD
    case CODEC_ID_AAC:
#endif
#ifdef CONFIG_VORBIS_DECODER
    case CODEC_ID_VORBIS:
#endif
    case CODEC_ID_MP3ON4:
        st->codec->sample_rate= 0; /* let decoder init parameters properly */
        break;
#ifdef CONFIG_DV_DEMUXER
    case CODEC_ID_DVAUDIO:
        c->dv_fctx = av_alloc_format_context();
        /* do not hand a NULL context to dv_init_demux() */
        if (!c->dv_fctx) {
            av_log(c->fc, AV_LOG_ERROR, "dv demux context alloc error\n");
            return -1;
        }
        c->dv_demux = dv_init_demux(c->dv_fctx);
        if (!c->dv_demux) {
            av_log(c->fc, AV_LOG_ERROR, "dv demux context init error\n");
            return -1;
        }
        sc->dv_audio_container = 1;
        st->codec->codec_id = CODEC_ID_PCM_S16LE;
        break;
#endif
    default:
        break;
    }

    return 0;
}

1074
/**
 * Parse the 'stsc' (sample to chunk) atom into sc->sample_to_chunk.
 *
 * @return 0 on success, -1 if the entry count is too large or the table
 *         cannot be allocated.
 */
static int mov_read_stsc(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    MOVStreamContext *sc = (MOVStreamContext *)st->priv_data;
    unsigned int n, count;

    /* 1 byte version + 3 bytes flags, both unused */
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);

    count = get_be32(pb);

    /* keep count * sizeof(entry) from overflowing */
    if (count >= UINT_MAX / sizeof(MOV_sample_to_chunk_tbl))
        return -1;

#ifdef DEBUG
    av_log(NULL, AV_LOG_DEBUG, "track[%i].stsc.entries = %i\n", c->fc->nb_streams-1, count);
#endif
    sc->sample_to_chunk_sz = count;
    sc->sample_to_chunk = (MOV_sample_to_chunk_tbl*) av_malloc(count * sizeof(MOV_sample_to_chunk_tbl));
    if (sc->sample_to_chunk == NULL)
        return -1;

    /* each entry is three big-endian 32 bit fields */
    for (n = 0; n < count; n++) {
        MOV_sample_to_chunk_tbl *entry = &sc->sample_to_chunk[n];

        entry->first = get_be32(pb);
        entry->count = get_be32(pb);
        entry->id    = get_be32(pb);
    }
    return 0;
}

1103 1104 1105 1106
/**
 * Parse the 'stss' (sync sample) atom into sc->keyframes.
 *
 * @return 0 on success, -1 if the entry count is too large or the table
 *         cannot be allocated.
 */
static int mov_read_stss(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    MOVStreamContext *sc = (MOVStreamContext *)st->priv_data;
    unsigned int n, count;

    /* 1 byte version + 3 bytes flags, both unused */
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);

    count = get_be32(pb);

    /* keep count * sizeof(long) from overflowing */
    if (count >= UINT_MAX / sizeof(long))
        return -1;

    sc->keyframe_count = count;
#ifdef DEBUG
    av_log(NULL, AV_LOG_DEBUG, "keyframe_count = %ld\n", sc->keyframe_count);
#endif
    sc->keyframes = (long*) av_malloc(count * sizeof(long));
    if (sc->keyframes == NULL)
        return -1;

    for (n = 0; n < count; n++)
        sc->keyframes[n] = get_be32(pb);

    return 0;
}

1133
/**
 * Parse the 'stsz' (sample size) atom.
 *
 * Stores the sample count, and either the constant sample size (unless a
 * size was already set on the stream context) or the per-sample size table.
 *
 * @return 0 on success, -1 if the entry count is too large or the table
 *         cannot be allocated.
 */
static int mov_read_stsz(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    MOVStreamContext *sc = (MOVStreamContext *)st->priv_data;
    unsigned int n, count, constant_size;

    /* 1 byte version + 3 bytes flags, both unused */
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);

    constant_size = get_be32(pb);
    /* do not overwrite value computed in stsd */
    if (sc->sample_size == 0)
        sc->sample_size = constant_size;

    count = get_be32(pb);
    if (count >= UINT_MAX / sizeof(long))
        return -1;
    sc->sample_count = count;

    /* a non-zero constant size means there is no per-sample table */
    if (constant_size != 0)
        return 0;

#ifdef DEBUG
    av_log(NULL, AV_LOG_DEBUG, "sample_size = %ld sample_count = %ld\n", sc->sample_size, sc->sample_count);
#endif
    sc->sample_sizes = (long*) av_malloc(count * sizeof(long));
    if (sc->sample_sizes == NULL)
        return -1;

    for (n = 0; n < count; n++) {
        sc->sample_sizes[n] = get_be32(pb);
#ifdef DEBUG
        av_log(NULL, AV_LOG_DEBUG, "sample_sizes[]=%ld\n", sc->sample_sizes[n]);
#endif
    }
    return 0;
}

1168
/**
 * Parse the 'stts' (time to sample) atom into sc->stts_data.
 *
 * Also accumulates the gcd of all sample durations into sc->time_rate, the
 * total number of samples into st->nb_frames and, when non-zero, the summed
 * duration into st->duration.
 *
 * @return 0 on success, -1 if the entry count is too large or the table
 *         cannot be allocated.
 */
static int mov_read_stts(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    MOVStreamContext *sc = (MOVStreamContext *)st->priv_data;
    unsigned int i, entries;
    int64_t duration=0;
    int64_t total_sample_count=0;

    get_byte(pb); /* version */
    get_byte(pb); get_byte(pb); get_byte(pb); /* flags */
    entries = get_be32(pb);
    /* entries * sizeof(Time2Sample) must not overflow */
    if(entries >= UINT_MAX / sizeof(Time2Sample))
        return -1;

    sc->stts_data = av_malloc(entries * sizeof(Time2Sample));
    if (!sc->stts_data) {
        /* the loop below would write through a NULL table */
        sc->stts_count = 0;
        return -1;
    }
    sc->stts_count = entries;

#ifdef DEBUG
av_log(NULL, AV_LOG_DEBUG, "track[%i].stts.entries = %i\n", c->fc->nb_streams-1, entries);
#endif

    sc->time_rate=0;

    for(i=0; i<entries; i++) {
        int sample_duration;
        int sample_count;

        sample_count=get_be32(pb);
        sample_duration = get_be32(pb);
        sc->stts_data[i].count= sample_count;
        sc->stts_data[i].duration= sample_duration;

        sc->time_rate= ff_gcd(sc->time_rate, sample_duration);

        dprintf("sample_count=%d, sample_duration=%d\n",sample_count,sample_duration);

        /* widen before multiplying so the product is computed in 64 bit */
        duration+=(int64_t)sample_duration*sample_count;
        total_sample_count+=sample_count;
    }

    st->nb_frames= total_sample_count;
    if(duration)
        st->duration= duration;
    return 0;
}

M
Michael Niedermayer 已提交
1214 1215
/**
 * Parse the 'ctts' (composition time to sample) atom into sc->ctts_data and
 * fold every offset into the gcd kept in sc->time_rate.
 *
 * A negative offset makes the whole table be ignored (ctts_count is reset
 * to 0 and the rest of the atom is skipped).
 *
 * @return 0 on success, -1 if the entry count is too large or the table
 *         cannot be allocated.
 */
static int mov_read_ctts(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    MOVStreamContext *sc = (MOVStreamContext *)st->priv_data;
    unsigned int i, entries;

    get_byte(pb); /* version */
    get_byte(pb); get_byte(pb); get_byte(pb); /* flags */
    entries = get_be32(pb);
    /* entries * sizeof(Time2Sample) must not overflow */
    if(entries >= UINT_MAX / sizeof(Time2Sample))
        return -1;

    sc->ctts_data = av_malloc(entries * sizeof(Time2Sample));
    if (!sc->ctts_data) {
        /* the loop below would write through a NULL table */
        sc->ctts_count = 0;
        return -1;
    }
    sc->ctts_count = entries;

    dprintf("track[%i].ctts.entries = %i\n", c->fc->nb_streams-1, entries);

    for(i=0; i<entries; i++) {
        int count    =get_be32(pb);
        int duration =get_be32(pb);

        if (duration < 0) {
            av_log(c->fc, AV_LOG_ERROR, "negative ctts, ignoring\n");
            sc->ctts_count = 0;
            /* skip the remaining 8 byte entries */
            url_fskip(pb, 8 * (entries - i - 1));
            break;
        }
        sc->ctts_data[i].count   = count;
        sc->ctts_data[i].duration= duration;

        sc->time_rate= ff_gcd(sc->time_rate, duration);
    }
    return 0;
}

1249 1250 1251 1252 1253 1254 1255 1256 1257
/**
 * Parse a 'trak' atom: create a new stream with its MOV stream context,
 * then parse the atom's children.
 *
 * @return -2 if the stream cannot be created, -1 if the stream context
 *         cannot be allocated, otherwise the result of mov_read_default().
 */
static int mov_read_trak(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st;
    MOVStreamContext *sc;

    st = av_new_stream(c->fc, c->fc->nb_streams);
    if (!st) return -2;
    sc = (MOVStreamContext*) av_mallocz(sizeof(MOVStreamContext));
    if (!sc) {
        /* st must not be freed here: the stream is addressed through
         * c->fc->streams[] from now on (as the other parsers in this file
         * do), so freeing it would leave a dangling pointer there */
        return -1;
    }

    st->priv_data = sc;
    st->codec->codec_type = CODEC_TYPE_DATA;
    st->start_time = 0; /* XXX: check */
    c->streams[c->fc->nb_streams-1] = sc;

    return mov_read_default(c, pb, atom);
}

/**
 * Parse the 'tkhd' (track header) atom.
 *
 * Only the track id is kept (in st->id) and st->start_time is reset to 0;
 * every other field is read and discarded. Version 1 headers use 64 bit
 * time and duration fields, all other versions 32 bit ones.
 *
 * @return always 0.
 */
static int mov_read_tkhd(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    AVStream *st = c->fc->streams[c->fc->nb_streams-1];
    int version = get_byte(pb);
    int wide_fields = (version == 1);

    /*
     * 24 bit flags, unused:
     * MOV_TRACK_ENABLED    0x0001
     * MOV_TRACK_IN_MOVIE   0x0002
     * MOV_TRACK_IN_PREVIEW 0x0004
     * MOV_TRACK_IN_POSTER  0x0008
     */
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);

    /* creation time, then modification time */
    if (wide_fields) {
        get_be64(pb);
        get_be64(pb);
    } else {
        get_be32(pb);
        get_be32(pb);
    }

    st->id = (int)get_be32(pb); /* track id (NOT 0 !) */
    get_be32(pb);               /* reserved */
    st->start_time = 0;         /* check */

    /* highlevel (considering edits) duration in movie timebase */
    if (wide_fields)
        get_be64(pb);
    else
        get_be32(pb);

    get_be32(pb); /* reserved */
    get_be32(pb); /* reserved */

    get_be16(pb); /* layer */
    get_be16(pb); /* alternate group */
    get_be16(pb); /* volume */
    get_be16(pb); /* reserved */

    url_fskip(pb, 36); /* display matrix */

    /* track width and height, both fixed-point */
    get_be32(pb);
    get_be32(pb);

    return 0;
}

/*
 * Per the specs the 'wide' atom should be empty, but some buggy files
 * (e.g. created with Adobe Premiere 5.0) put another atom inside it.
 * Samples: http://graphics.tudelft.nl/~wouter/publications/soundtests/
 *
 * When the payload starts with a zero 32 bit size followed by an 'mdat'
 * tag, the rest of the atom is parsed as 'mdat'; anything else is skipped.
 */
static int mov_read_wide(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    /* too small to hold a nested atom header: nothing to do, continue */
    if (atom.size < 8)
        return 0;

    /* nested size is not 0: not the 0 sized mdat case, skip the rest */
    if (get_be32(pb) != 0) {
        url_fskip(pb, atom.size - 4);
        return 0;
    }

    /* 0 sized mdat atom... use the 'wide' atom size */
    atom.type = get_le32(pb);
    atom.offset += 8;
    atom.size -= 8;

    if (atom.type == MKTAG('m', 'd', 'a', 't'))
        return mov_read_mdat(c, pb, atom);

    url_fskip(pb, atom.size);
    return 0;
}


1337
#ifdef CONFIG_ZLIB
/* read callback for the in-memory context used by mov_read_cmov(): the
 * whole header is already in the buffer, so any refill request fails */
static int null_read_packet(void *opaque, uint8_t *buf, int buf_size)
{
    return -1;
}

/**
 * Parse a 'cmov' (zlib compressed movie header) atom.
 *
 * Checks the nested 'dcom' / 'zlib' / 'cmvd' tags, inflates the payload
 * into a temporary buffer and parses that buffer as a 'moov' atom through
 * an in-memory ByteIOContext.
 *
 * @return the result of mov_read_default() on the inflated header, or -1 on
 *         unknown tags, invalid sizes, allocation failure or inflate
 *         failure. Both temporary buffers are released on every path.
 */
static int mov_read_cmov(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    ByteIOContext ctx;
    uint8_t *cmov_data = NULL;
    uint8_t *moov_data = NULL; /* uncompressed data */
    long cmov_len, moov_len;
    uLongf inflated_len;
    int ret = -1;

    get_be32(pb); /* dcom atom */
    if (get_le32(pb) != MKTAG( 'd', 'c', 'o', 'm' ))
        return -1;
    if (get_le32(pb) != MKTAG( 'z', 'l', 'i', 'b' )) {
        av_log(NULL, AV_LOG_ERROR, "unknown compression for cmov atom !");
        return -1;
    }
    get_be32(pb); /* cmvd atom */
    if (get_le32(pb) != MKTAG( 'c', 'm', 'v', 'd' ))
        return -1;
    moov_len = get_be32(pb); /* uncompressed size */

    /* the 6 32 bit fields read above are not part of the compressed data;
     * check the range before narrowing the atom size to long */
    if (atom.size <= 6 * 4 || atom.size - 6 * 4 > INT_MAX)
        return -1;
    cmov_len = atom.size - 6 * 4;
    /* moov_len comes from the file; it is later used as an int buffer size */
    if (moov_len <= 0 || moov_len > INT_MAX)
        return -1;

    cmov_data = (uint8_t *) av_malloc(cmov_len);
    if (!cmov_data)
        goto end;
    moov_data = (uint8_t *) av_malloc(moov_len);
    if (!moov_data)
        goto end;

    get_buffer(pb, cmov_data, cmov_len);

    /* uncompress() updates the length through a uLongf, so use a variable
     * of that exact type instead of casting a long pointer */
    inflated_len = moov_len;
    if(uncompress (moov_data, &inflated_len, (const Bytef *)cmov_data, cmov_len) != Z_OK)
        goto end;
    moov_len = inflated_len;

    if(init_put_byte(&ctx, moov_data, moov_len, 0, NULL, null_read_packet, NULL, NULL) != 0)
        goto end;
    /* mark the whole inflated header as already buffered */
    ctx.buf_end = ctx.buffer + moov_len;
    atom.type = MKTAG( 'm', 'o', 'o', 'v' );
    atom.offset = 0;
    atom.size = moov_len;
#ifdef DEBUG
//    { int fd = open("/tmp/uncompheader.mov", O_WRONLY | O_CREAT); write(fd, moov_data, moov_len); close(fd); }
#endif
    ret = mov_read_default(c, &ctx, atom);

end:
    /* av_free(NULL) is already used as a no-op elsewhere in this file */
    av_free(moov_data);
    av_free(cmov_data);

    return ret;
}
#endif

G
Gael Chardon 已提交
1392 1393 1394
/**
 * Parse the 'elst' (edit list) atom: record the number of edits in the
 * current track's stream context and read past the entries themselves.
 *
 * @return always 0.
 */
static int mov_read_elst(MOVContext *c, ByteIOContext *pb, MOV_atom_t atom)
{
    int n, edit_count;

    /* 1 byte version + 3 bytes flags, both unused */
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);
    get_byte(pb);

    /* number of entries */
    c->streams[c->fc->nb_streams-1]->edit_count = get_be32(pb);
    edit_count = c->streams[c->fc->nb_streams-1]->edit_count;

    /* the entries are read and discarded */
    for (n = 0; n < edit_count; n++) {
        get_be32(pb); /* Track duration */
        get_be32(pb); /* Media time */
        get_be32(pb); /* Media rate */
    }

    dprintf("track[%i].edit_count = %i\n", c->fc->nb_streams-1, c->streams[c->fc->nb_streams-1]->edit_count);
    return 0;
}

1410 1411
static const MOVParseTableEntry mov_default_parse_table[] = {
/* mp4 atoms */
1412 1413 1414
{ MKTAG( 'c', 'o', '6', '4' ), mov_read_stco },
{ MKTAG( 'c', 'p', 'r', 't' ), mov_read_default },
{ MKTAG( 'c', 'r', 'h', 'd' ), mov_read_default },
M
Michael Niedermayer 已提交
1415
{ MKTAG( 'c', 't', 't', 's' ), mov_read_ctts }, /* composition time to sample */
1416 1417 1418 1419
{ MKTAG( 'd', 'i', 'n', 'f' ), mov_read_default }, /* data information */
{ MKTAG( 'd', 'p', 'n', 'd' ), mov_read_leaf },
{ MKTAG( 'd', 'r', 'e', 'f' ), mov_read_leaf },
{ MKTAG( 'e', 'd', 't', 's' ), mov_read_default },
1420
{ MKTAG( 'e', 'l', 's', 't' ), mov_read_elst },
1421
{ MKTAG( 'e', 'n', 'd', 'a' ), mov_read_enda },
1422
{ MKTAG( 'f', 'r', 'e', 'e' ), mov_read_leaf },
1423
{ MKTAG( 'f', 't', 'y', 'p' ), mov_read_ftyp },
1424 1425 1426 1427
{ MKTAG( 'h', 'd', 'l', 'r' ), mov_read_hdlr },
{ MKTAG( 'h', 'i', 'n', 't' ), mov_read_leaf },
{ MKTAG( 'h', 'm', 'h', 'd' ), mov_read_leaf },
{ MKTAG( 'i', 'o', 'd', 's' ), mov_read_leaf },
1428
{ MKTAG( 'j', 'p', '2', 'h' ), mov_read_jp2h },
1429 1430 1431 1432 1433 1434 1435 1436 1437 1438 1439 1440 1441
{ MKTAG( 'm', 'd', 'a', 't' ), mov_read_mdat },
{ MKTAG( 'm', 'd', 'h', 'd' ), mov_read_mdhd },
{ MKTAG( 'm', 'd', 'i', 'a' ), mov_read_default },
{ MKTAG( 'm', 'i', 'n', 'f' ), mov_read_default },
{ MKTAG( 'm', 'o', 'o', 'v' ), mov_read_moov },
{ MKTAG( 'm', 'p', '4', 'a' ), mov_read_default },
{ MKTAG( 'm', 'p', '4', 's' ), mov_read_default },
{ MKTAG( 'm', 'p', '4', 'v' ), mov_read_default },
{ MKTAG( 'm', 'p', 'o', 'd' ), mov_read_leaf },
{ MKTAG( 'm', 'v', 'h', 'd' ), mov_read_mvhd },
{ MKTAG( 'n', 'm', 'h', 'd' ), mov_read_leaf },
{ MKTAG( 'o', 'd', 'h', 'd' ), mov_read_default },
{ MKTAG( 's', 'd', 'h', 'd' ), mov_read_default },
1442
{ MKTAG( 's', 'k', 'i', 'p' ), mov_read_leaf },
1443
{ MKTAG( 's', 'm', 'h', 'd' ), mov_read_leaf }, /* sound media info header */
1444
{ MKTAG( 'S', 'M', 'I', ' ' ), mov_read_smi }, /* Sorenson extension ??? */
1445
{ MKTAG( 'a', 'l', 'a', 'c' ), mov_read_alac }, /* alac specific atom */
1446
{ MKTAG( 'a', 'v', 'c', 'C' ), mov_read_avcC },
1447 1448 1449 1450 1451 1452
{ MKTAG( 's', 't', 'b', 'l' ), mov_read_default },
{ MKTAG( 's', 't', 'c', 'o' ), mov_read_stco },
{ MKTAG( 's', 't', 'd', 'p' ), mov_read_default },
{ MKTAG( 's', 't', 's', 'c' ), mov_read_stsc },
{ MKTAG( 's', 't', 's', 'd' ), mov_read_stsd }, /* sample description */
{ MKTAG( 's', 't', 's', 'h' ), mov_read_default },
1453
{ MKTAG( 's', 't', 's', 's' ), mov_read_stss }, /* sync sample */
1454 1455 1456 1457 1458 1459 1460 1461
{ MKTAG( 's', 't', 's', 'z' ), mov_read_stsz }, /* sample size */
{ MKTAG( 's', 't', 't', 's' ), mov_read_stts },
{ MKTAG( 't', 'k', 'h', 'd' ), mov_read_tkhd }, /* track header */
{ MKTAG( 't', 'r', 'a', 'k' ), mov_read_trak },
{ MKTAG( 't', 'r', 'e', 'f' ), mov_read_default }, /* not really */
{ MKTAG( 'u', 'd', 't', 'a' ), mov_read_leaf },
{ MKTAG( 'u', 'r', 'l', ' ' ), mov_read_leaf },
{ MKTAG( 'u', 'r', 'n', ' ' ), mov_read_leaf },
1462
{ MKTAG( 'u', 'u', 'i', 'd' ), mov_read_leaf },
1463
{ MKTAG( 'v', 'm', 'h', 'd' ), mov_read_leaf }, /* video media info header */
R
Roberto Togni 已提交
1464
{ MKTAG( 'w', 'a', 'v', 'e' ), mov_read_wave },
1465
/* extra mp4 */
1466
{ MKTAG( 'M', 'D', 'E', 'S' ), mov_read_leaf },
1467
/* QT atoms */
1468 1469 1470 1471 1472 1473 1474 1475 1476 1477 1478 1479 1480 1481 1482 1483 1484
{ MKTAG( 'c', 'h', 'a', 'p' ), mov_read_leaf },
{ MKTAG( 'c', 'l', 'i', 'p' ), mov_read_default },
{ MKTAG( 'c', 'r', 'g', 'n' ), mov_read_leaf },
{ MKTAG( 'c', 't', 'a', 'b' ), mov_read_ctab },
{ MKTAG( 'e', 's', 'd', 's' ), mov_read_esds },
{ MKTAG( 'k', 'm', 'a', 't' ), mov_read_leaf },
{ MKTAG( 'm', 'a', 't', 't' ), mov_read_default },
{ MKTAG( 'r', 'd', 'r', 'f' ), mov_read_leaf },
{ MKTAG( 'r', 'm', 'd', 'a' ), mov_read_default },
{ MKTAG( 'r', 'm', 'd', 'r' ), mov_read_leaf },
{ MKTAG( 'r', 'm', 'r', 'a' ), mov_read_default },
{ MKTAG( 's', 'c', 'p', 't' ), mov_read_leaf },
{ MKTAG( 's', 's', 'r', 'c' ), mov_read_leaf },
{ MKTAG( 's', 'y', 'n', 'c' ), mov_read_leaf },
{ MKTAG( 't', 'c', 'm', 'd' ), mov_read_leaf },
{ MKTAG( 'w', 'i', 'd', 'e' ), mov_read_wide }, /* place holder */
//{ MKTAG( 'r', 'm', 'q', 'u' ), mov_read_leaf },
1485
#ifdef CONFIG_ZLIB
1486
{ MKTAG( 'c', 'm', 'o', 'v' ), mov_read_cmov },
1487
#else
1488
{ MKTAG( 'c', 'm', 'o', 'v' ), mov_read_leaf },
1489
#endif
1490
{ 0L, mov_read_leaf }
1491 1492 1493 1494 1495
};

/**
 * Release a MOV stream context together with its ctts table.
 * A NULL context is accepted and ignored.
 */
static void mov_free_stream_context(MOVStreamContext *sc)
{
    if (sc == NULL)
        return;

    av_freep(&sc->ctts_data);
    /* only the local copy of the pointer is reset by av_freep() */
    av_freep(&sc);
}

1501
/* XXX: is it sufficient ? */
F
Fabrice Bellard 已提交
1502 1503
static int mov_probe(AVProbeData *p)
{
1504 1505
    unsigned int offset;
    uint32_t tag;
1506
    int score = 0;
1507

F
Fabrice Bellard 已提交
1508 1509 1510
    /* check file header */
    if (p->buf_size <= 12)
        return 0;
1511 1512 1513 1514
    offset = 0;
    for(;;) {
        /* ignore invalid offset */
        if ((offset + 8) > (unsigned int)p->buf_size)
1515
            return score;
1516
        tag = LE_32(p->buf + offset + 4);
1517
        switch(tag) {
1518
        /* check for obvious tags */
1519
        case MKTAG( 'j', 'P', ' ', ' ' ): /* jpeg 2000 signature */
1520
        case MKTAG( 'm', 'o', 'o', 'v' ):
1521 1522
        case MKTAG( 'm', 'd', 'a', 't' ):
        case MKTAG( 'p', 'n', 'o', 't' ): /* detect movs with preview pics like ew.mov and april.mov */
Z
Zdenek Kabelac 已提交
1523
        case MKTAG( 'u', 'd', 't', 'a' ): /* Packet Video PVAuthor adds this and a lot of more junk */
1524
            return AVPROBE_SCORE_MAX;
1525 1526 1527 1528 1529 1530
        /* those are more common words, so rate then a bit less */
        case MKTAG( 'w', 'i', 'd', 'e' ):
        case MKTAG( 'f', 'r', 'e', 'e' ):
        case MKTAG( 'j', 'u', 'n', 'k' ):
        case MKTAG( 'p', 'i', 'c', 't' ):
            return AVPROBE_SCORE_MAX - 5;
1531
        case MKTAG( 'f', 't', 'y', 'p' ):
1532
        case MKTAG( 's', 'k', 'i', 'p' ):
1533
        case MKTAG( 'u', 'u', 'i', 'd' ):
1534
            offset = BE_32(p->buf+offset) + offset;
1535 1536
            /* if we only find those cause probedata is too small at least rate them */
            score = AVPROBE_SCORE_MAX - 50;
1537 1538 1539
            break;
        default:
            /* unrecognized tag */
1540
            return score;
1541
        }
1542
    }
1543
    return score;
F
Fabrice Bellard 已提交
1544 1545
}

1546 1547 1548 1549 1550 1551 1552 1553 1554 1555
/**
 * Fill the index of a stream from its parsed sample tables.
 *
 * One index entry is added per sample when per-sample sizes are available,
 * the stream is video, or it is a DV audio container. Otherwise one entry
 * is added per chunk. On return sc->sample_count is set to the number of
 * index entries of the stream.
 *
 * @param mov demuxer context; its other streams and the mdat list are
 *            consulted when a chunk size has to be guessed
 * @param st  stream to index; st->priv_data must be its MOVStreamContext
 */
static void mov_build_index(MOVContext *mov, AVStream *st)
{
    MOVStreamContext *sc = st->priv_data;
    offset_t current_offset;
    int64_t current_dts = 0;
    int stts_index = 0;
    int stsc_index = 0;
    int stss_index = 0;
    int i, j, k;

    if (sc->sample_sizes || st->codec->codec_type == CODEC_TYPE_VIDEO || sc->dv_audio_container) {
        int keyframe, sample_size;
        int current_sample = 0;
        int stts_sample = 0;
        int distance = 0;

        st->nb_frames = sc->sample_count;
        for (i = 0; i < sc->chunk_count; i++) {
            current_offset = sc->chunk_offsets[i];
            /* sample_to_chunk[].first is compared against the 1-based chunk number */
            if (stsc_index + 1 < sc->sample_to_chunk_sz && i + 1 == sc->sample_to_chunk[stsc_index + 1].first)
                stsc_index++;
            for (j = 0; j < sc->sample_to_chunk[stsc_index].count; j++) {
                /* without a keyframe table every sample is flagged as keyframe */
                keyframe = !sc->keyframe_count || current_sample + 1 == sc->keyframes[stss_index];
                if (keyframe) {
                    distance = 0;
                    if (stss_index + 1 < sc->keyframe_count)
                        stss_index++;
                }
                sample_size = sc->sample_size > 0 ? sc->sample_size : sc->sample_sizes[current_sample];
                dprintf("AVIndex stream %d, sample %d, offset %llx, dts %lld, size %d, distance %d, keyframe %d\n",
                        st->index, current_sample, current_offset, current_dts, sample_size, distance, keyframe);
                av_add_index_entry(st, current_offset, current_dts, sample_size, distance, keyframe ? AVINDEX_KEYFRAME : 0);
                current_offset += sample_size;
                assert(sc->stts_data[stts_index].duration % sc->time_rate == 0);
                current_dts += sc->stts_data[stts_index].duration / sc->time_rate;
                distance++;
                stts_sample++;
                /* never step past the last sample of the tables */
                if (current_sample + 1 < sc->sample_count)
                    current_sample++;
                if (stts_index + 1 < sc->stts_count && stts_sample == sc->stts_data[stts_index].count) {
                    stts_sample = 0;
                    stts_index++;
                }
            }
        }
    } else { /* read whole chunk */
        int chunk_samples, chunk_size, chunk_duration;

        for (i = 0; i < sc->chunk_count; i++) {
            current_offset = sc->chunk_offsets[i];
            if (stsc_index + 1 < sc->sample_to_chunk_sz && i + 1 == sc->sample_to_chunk[stsc_index + 1].first)
                stsc_index++;
            chunk_samples = sc->sample_to_chunk[stsc_index].count;
            /* get chunk size */
            if (sc->sample_size > 1 || st->codec->bits_per_sample == 8)
                chunk_size = chunk_samples * sc->sample_size;
            else if (sc->sample_size_v1.den > 0 && (chunk_samples * sc->sample_size_v1.num % sc->sample_size_v1.den == 0))
                chunk_size = chunk_samples * sc->sample_size_v1.num / sc->sample_size_v1.den;
            else { /* workaround to find nearest next chunk offset */
                chunk_size = INT_MAX;
                for (j = 0; j < mov->total_streams; j++) {
                    MOVStreamContext *msc = mov->streams[j];

                    for (k = msc->next_chunk; k < msc->chunk_count; k++) {
                        if (msc->chunk_offsets[k] > current_offset && msc->chunk_offsets[k] - current_offset < chunk_size) {
                            chunk_size = msc->chunk_offsets[k] - current_offset;
                            msc->next_chunk = k;
                            break;
                        }
                    }
                }
                /* check for last chunk */
                if (chunk_size == INT_MAX)
                    for (j = 0; j < mov->mdat_count; j++) {
                        dprintf("mdat %d, offset %llx, size %lld, current offset %llx\n",
                                j, mov->mdat_list[j].offset, mov->mdat_list[j].size, current_offset);
                        if (mov->mdat_list[j].offset <= current_offset && mov->mdat_list[j].offset + mov->mdat_list[j].size > current_offset)
                            chunk_size = mov->mdat_list[j].offset + mov->mdat_list[j].size - current_offset;
                    }
                assert(chunk_size != INT_MAX);
                /* restart the search position of every stream for the next chunk */
                for (j = 0; j < mov->total_streams; j++) {
                    mov->streams[j]->next_chunk = 0;
                }
            }
            av_add_index_entry(st, current_offset, current_dts, chunk_size, 0, AVINDEX_KEYFRAME);
            /* get chunk duration */
            chunk_duration = 0;
            while (chunk_samples > 0) {
                if (chunk_samples < sc->stts_data[stts_index].count) {
                    /* the chunk ends inside this stts run: take what is
                     * needed and leave the rest for the next chunk */
                    chunk_duration += sc->stts_data[stts_index].duration * chunk_samples;
                    sc->stts_data[stts_index].count -= chunk_samples;
                    break;
                } else {
                    /* the run is used up: it contributes its own sample
                     * count, not every sample still missing in the chunk */
                    chunk_duration += sc->stts_data[stts_index].duration * sc->stts_data[stts_index].count;
                    chunk_samples -= sc->stts_data[stts_index].count;
                    if (stts_index + 1 < sc->stts_count) {
                        stts_index++;
                    } else if (sc->stts_data[stts_index].count <= 0) {
                        /* last run is empty, chunk_samples can no longer
                         * shrink: stop instead of looping forever */
                        break;
                    }
                }
            }
            dprintf("AVIndex stream %d, chunk %d, offset %llx, dts %lld, size %d, duration %d\n",
                    st->index, i, current_offset, current_dts, chunk_size, chunk_duration);
            assert(chunk_duration % sc->time_rate == 0);
            current_dts += chunk_duration / sc->time_rate;
        }
    }
    /* adjust sample count to avindex entries */
    sc->sample_count = st->nb_index_entries;
}

Z
Zdenek Kabelac 已提交
1656
/**
 * Parse the atoms of the input, set up the timing of every stream and
 * build the stream indexes.
 *
 * @param s  format context; s->priv_data is the MOVContext
 * @param ap unused here
 * @return 0 on success, -1 if parsing failed or neither a moov nor an
 *         mdat atom was found
 */
static int mov_read_header(AVFormatContext *s, AVFormatParameters *ap)
{
    MOVContext *ctx = s->priv_data;
    ByteIOContext *io = &s->pb;
    MOV_atom_t root = { 0, 0, 0 };
    int n, ret;

    ctx->fc = s;
    ctx->parse_table = mov_default_parse_table;

    /* .mov and .mp4 aren't streamable anyway (only progressive download if
     * moov is before mdat), so a streamed input gets an open-ended size */
    if (url_is_streamed(io))
        root.size = 0x7FFFFFFFFFFFFFFFLL;
    else
        root.size = url_fsize(io);

    /* check MOV header */
    ret = mov_read_default(ctx, io, root);
    if (ret < 0 || !(ctx->found_moov || ctx->found_mdat)) {
        av_log(s, AV_LOG_ERROR, "mov: header not found !!! (err:%d, moov:%d, mdat:%d) pos:%"PRId64"\n",
                ret, ctx->found_moov, ctx->found_mdat, url_ftell(io));
        return -1;
    }
    dprintf("on_parse_exit_offset=%d\n", (int) url_ftell(io));

    /* some cleanup : make sure we are on the mdat atom */
    if (!url_is_streamed(io) && url_ftell(io) != ctx->mdat_offset)
        url_fseek(io, ctx->mdat_offset, SEEK_SET);

    ctx->total_streams = s->nb_streams;

    for (n = 0; n < ctx->total_streams; n++) {
        AVStream *st = s->streams[n];
        MOVStreamContext *sc = ctx->streams[n];

        /* fall back to neutral / global values for missing timing info */
        if (!sc->time_rate)
            sc->time_rate = 1;
        if (!sc->time_scale)
            sc->time_scale = ctx->time_scale;
        av_set_pts_info(st, 64, sc->time_rate, sc->time_scale);

        if (st->duration != AV_NOPTS_VALUE) {
            assert(st->duration % sc->time_rate == 0);
            st->duration /= sc->time_rate;
        }
        sc->ffindex = n;
        mov_build_index(ctx, st);
    }

    /* The sample tables are released only after every index has been
     * built, because mov_build_index() reads the tables of other streams. */
    for (n = 0; n < ctx->total_streams; n++) {
        MOVStreamContext *sc = ctx->streams[n];

        av_freep(&sc->chunk_offsets);
        av_freep(&sc->sample_to_chunk);
        av_freep(&sc->sample_sizes);
        av_freep(&sc->keyframes);
        av_freep(&sc->stts_data);
    }
    av_freep(&ctx->mdat_list);
    return 0;
}

Z
Zdenek Kabelac 已提交
1715
/**
 * Read the next packet, taking it from the stream whose pending sample
 * has the smallest dts once rescaled to AV_TIME_BASE units.
 *
 * Streams marked AVDISCARD_ALL and streams that have no sample left are
 * not considered.
 *
 * @param s   format context; s->priv_data is the MOVContext
 * @param pkt packet to fill
 * @return 0 on success, -1 if no sample is left, the sample lies at or
 *         beyond the end of the file, or reading the payload failed
 */
static int mov_read_packet(AVFormatContext *s, AVPacket *pkt)
{
    MOVContext *mov = s->priv_data;
    MOVStreamContext *sc = NULL;
    AVIndexEntry *sample = NULL;
    int64_t best_dts = INT64_MAX;
    int i;

    for (i = 0; i < mov->total_streams; i++) {
        MOVStreamContext *msc = mov->streams[i];

        if (s->streams[i]->discard != AVDISCARD_ALL && msc->current_sample < msc->sample_count) {
            AVIndexEntry *current_sample = &s->streams[i]->index_entries[msc->current_sample];
            int64_t dts = av_rescale(current_sample->timestamp * (int64_t)msc->time_rate, AV_TIME_BASE, msc->time_scale);

            dprintf("stream %d, sample %ld, dts %lld\n", i, msc->current_sample, dts);
            if (dts < best_dts) {
                sample = current_sample;
                best_dts = dts;
                sc = msc;
            }
        }
    }
    if (!sample)
        return -1;
    /* must be done just before reading, to avoid infinite loop on sample */
    sc->current_sample++;
    if (sample->pos >= url_fsize(&s->pb)) {
        av_log(mov->fc, AV_LOG_ERROR, "stream %d, offset 0x%"PRIx64": partial file\n", sc->ffindex, sample->pos);
        return -1;
    }
#ifdef CONFIG_DV_DEMUXER
    if (sc->dv_audio_container) {
        dv_get_packet(mov->dv_demux, pkt);
        dprintf("dv audio pkt size %d\n", pkt->size);
    } else {
#endif
        url_fseek(&s->pb, sample->pos, SEEK_SET);
        /* do not touch pkt any further if it could not be read */
        if (av_get_packet(&s->pb, pkt, sample->size) < 0)
            return -1;
#ifdef CONFIG_DV_DEMUXER
        if (mov->dv_demux) {
            /* keep the destructor of the packet that owns the buffer */
            void *pkt_destruct_func = pkt->destruct;
            dv_produce_packet(mov->dv_demux, pkt, pkt->data, pkt->size);
            pkt->destruct = pkt_destruct_func;
        }
    }
#endif
    pkt->stream_index = sc->ffindex;
    pkt->dts = sample->timestamp;
    /* the index reaches ctts_count once the last run has been consumed;
     * from then on there is no composition offset left to read */
    if (sc->ctts_data && sc->sample_to_ctime_index < sc->ctts_count) {
        assert(sc->ctts_data[sc->sample_to_ctime_index].duration % sc->time_rate == 0);
        pkt->pts = pkt->dts + sc->ctts_data[sc->sample_to_ctime_index].duration / sc->time_rate;
        /* update ctts context */
        sc->sample_to_ctime_sample++;
        if (sc->ctts_data[sc->sample_to_ctime_index].count == sc->sample_to_ctime_sample) {
            sc->sample_to_ctime_index++;
            sc->sample_to_ctime_sample = 0;
        }
    } else {
        pkt->pts = pkt->dts;
    }
    pkt->flags |= sample->flags & AVINDEX_KEYFRAME ? PKT_FLAG_KEY : 0;
    pkt->pos = sample->pos;
    dprintf("stream %d, pts %lld, dts %lld, pos 0x%llx, duration %d\n", pkt->stream_index, pkt->pts, pkt->dts, pkt->pos, pkt->duration);
    return 0;
}
1781

1782 1783 1784 1785 1786
/**
 * Position one stream on the index entry found for a timestamp.
 *
 * Updates sc->current_sample and, when the stream has a ctts table, the
 * ctts run index and the number of samples already consumed in that run.
 *
 * @param st        stream to reposition; st->priv_data is its MOVStreamContext
 * @param timestamp target, passed unchanged to av_index_search_timestamp()
 * @param flags     seek flags, passed unchanged to av_index_search_timestamp()
 * @return index of the selected sample, or -1 if the search found none
 */
static int mov_seek_stream(AVStream *st, int64_t timestamp, int flags)
{
    MOVStreamContext *sc = st->priv_data;
    int sample, time_sample;
    int i;

    sample = av_index_search_timestamp(st, timestamp, flags);
    dprintf("stream %d, timestamp %lld, sample %d\n", st->index, timestamp, sample);
    if (sample < 0) /* not sure what to do */
        return -1;
    sc->current_sample = sample;
    dprintf("stream %d, found sample %ld\n", st->index, sc->current_sample);
    /* adjust ctts index */
    if (sc->ctts_data) {
        /* time_sample is the 0-based number of the first sample of run i */
        time_sample = 0;
        for (i = 0; i < sc->ctts_count; i++) {
            int next = time_sample + sc->ctts_data[i].count;

            /* run i covers samples [time_sample, next) */
            if (next > sample) {
                sc->sample_to_ctime_index = i;
                /* mov_read_packet() counts this field up to the run's
                 * count, so store the samples consumed, not those left */
                sc->sample_to_ctime_sample = sample - time_sample;
                break;
            }
            time_sample = next;
        }
    }
    return sample;
}

1809
/**
 * Seek all streams to a timestamp given in the time base of one stream.
 *
 * The reference stream is positioned first. The timestamp of the sample
 * it lands on is then rescaled to every other non-discarded stream, and
 * each of those is positioned on its own. A failed search on one of the
 * other streams is ignored.
 *
 * @param s            format context
 * @param stream_index index of the reference stream in s->streams
 * @param sample_time  target timestamp for the reference stream
 * @param flags        seek flags, passed on to mov_seek_stream()
 * @return 0 on success, -1 if stream_index is out of range or no sample
 *         was found in the reference stream
 */
static int mov_read_seek(AVFormatContext *s, int stream_index, int64_t sample_time, int flags)
{
    AVStream *st;
    int64_t seek_timestamp, timestamp;
    int sample;
    int i;

    /* a negative index must not be used to address s->streams[] either */
    if (stream_index < 0 || stream_index >= s->nb_streams)
        return -1;

    st = s->streams[stream_index];
    sample = mov_seek_stream(st, sample_time, flags);
    if (sample < 0)
        return -1;

    /* adjust seek timestamp to found sample timestamp */
    seek_timestamp = st->index_entries[sample].timestamp;

    for (i = 0; i < s->nb_streams; i++) {
        st = s->streams[i];
        if (stream_index == i || st->discard == AVDISCARD_ALL)
            continue;

        timestamp = av_rescale_q(seek_timestamp, s->streams[stream_index]->time_base, st->time_base);
        mov_seek_stream(st, timestamp, flags);
    }
    return 0;
}

Z
Zdenek Kabelac 已提交
1838
/**
 * Release what the demuxer context owns: the per-stream contexts, the
 * color tables and, if one was set up, the embedded DV demuxer together
 * with the streams of its format context.
 *
 * @param s format context; s->priv_data is the MOVContext
 * @return always 0
 */
static int mov_read_close(AVFormatContext *s)
{
    MOVContext *ctx = s->priv_data;
    int n;

    for (n = 0; n < ctx->total_streams; n++)
        mov_free_stream_context(ctx->streams[n]);

    /* color tables: every entry first, then the array holding them */
    for (n = 0; n < ctx->ctab_size; n++)
        av_freep(&ctx->ctab[n]);
    av_freep(&ctx->ctab);

    if (ctx->dv_demux) {
        AVFormatContext *dv = ctx->dv_fctx;

        for (n = 0; n < dv->nb_streams; n++) {
            av_freep(&dv->streams[n]->codec);
            av_freep(&dv->streams[n]);
        }
        av_freep(&ctx->dv_fctx);
        av_freep(&ctx->dv_demux);
    }
    return 0;
}

1859
AVInputFormat mov_demuxer = {
1860 1861
    "mov,mp4,m4a,3gp,3g2,mj2",
    "QuickTime/MPEG4/Motion JPEG 2000 format",
F
Fabrice Bellard 已提交
1862 1863
    sizeof(MOVContext),
    mov_probe,
1864 1865 1866
    mov_read_header,
    mov_read_packet,
    mov_read_close,
G
Gael Chardon 已提交
1867
    mov_read_seek,
1868
};