/*
 * H.26L/H.264/AVC/JVT/14496-10/... parameter set decoding
 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * H.264 / AVC / MPEG-4 part10 parameter set decoding.
 * @author Michael Niedermayer <michaelni@gmx.at>
 */

28 29
#include <inttypes.h>

30
#include "libavutil/imgutils.h"
31
#include "internal.h"
32
#include "mathops.h"
33
#include "avcodec.h"
34
#include "h264data.h"
35
#include "h264_ps.h"
36 37
#include "golomb.h"

38 39 40
#define MAX_LOG2_MAX_FRAME_NUM    (12 + 4)
#define MIN_LOG2_MAX_FRAME_NUM    4

41 42
#define EXTENDED_SAR       255

43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60
/* Sample aspect ratios indexed by aspect_ratio_idc; decode_vui_parameters()
 * copies entry [aspect_ratio_idc] into sps->sar for every idc below the
 * table size. Entry 0 has a zero numerator. */
static const AVRational pixel_aspect[17] = {
    {   0,  1 },
    {   1,  1 },
    {  12, 11 },
    {  10, 11 },
    {  16, 11 },
    {  40, 33 },
    {  24, 11 },
    {  20, 11 },
    {  32, 11 },
    {  80, 33 },
    {  18, 11 },
    {  15, 11 },
    {  64, 33 },
    { 160, 99 },
    {   4,  3 },
    {   3,  2 },
    {   2,  1 },
};

63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88
/* Default 4x4 scaling lists. decode_scaling_matrices() uses row 0 for the
 * intra lists and row 1 for the inter lists. */
static const uint8_t default_scaling4[2][16] = {
    [0] = {
         6, 13, 20, 28,
        13, 20, 28, 32,
        20, 28, 32, 37,
        28, 32, 37, 42,
    },
    [1] = {
        10, 14, 20, 24,
        14, 20, 24, 27,
        20, 24, 27, 30,
        24, 27, 30, 34,
    },
};

/* Default 8x8 scaling lists. decode_scaling_matrices() uses row 0 for the
 * intra lists and row 1 for the inter lists. */
static const uint8_t default_scaling8[2][64] = {
    [0] = {
         6, 10, 13, 16, 18, 23, 25, 27,
        10, 11, 16, 18, 23, 25, 27, 29,
        13, 16, 18, 23, 25, 27, 29, 31,
        16, 18, 23, 25, 27, 29, 31, 33,
        18, 23, 25, 27, 29, 31, 33, 36,
        23, 25, 27, 29, 31, 33, 36, 38,
        25, 27, 29, 31, 33, 36, 38, 40,
        27, 29, 31, 33, 36, 38, 40, 42,
    },
    [1] = {
         9, 13, 15, 17, 19, 21, 22, 24,
        13, 13, 17, 19, 21, 22, 24, 25,
        15, 17, 19, 21, 22, 24, 25, 27,
        17, 19, 21, 22, 24, 25, 27, 28,
        19, 21, 22, 24, 25, 27, 28, 30,
        21, 22, 24, 25, 27, 28, 30, 32,
        22, 24, 25, 27, 28, 30, 32, 33,
        24, 25, 27, 28, 30, 32, 33, 35,
    },
};

89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108
/* Per-level DPB capacity: each row is { level_idc, maximum number of
 * macroblocks in the DPB }. */
static const int level_max_dpb_mbs[][2] = {
    { 10,    396 }, { 11,    900 }, { 12,   2376 }, { 13,   2376 },
    { 20,   2376 }, { 21,   4752 }, { 22,   8100 },
    { 30,   8100 }, { 31,  18000 }, { 32,  20480 },
    { 40,  32768 }, { 41,  32768 }, { 42,  34816 },
    { 50, 110400 }, { 51, 184320 }, { 52, 184320 },
};

109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132
/**
 * Release the PPS stored in slot @p id of the parameter set context.
 *
 * If s->pps currently points at that entry's data it is reset to NULL before
 * the buffer reference is dropped. An empty slot is handled as well; only
 * the unref call is made in that case.
 */
static void remove_pps(H264ParamSets *s, int id)
{
    AVBufferRef **slot = &s->pps_list[id];

    if (*slot) {
        const PPS *stored = (const PPS*)(*slot)->data;

        if (s->pps == stored)
            s->pps = NULL;
    }

    av_buffer_unref(slot);
}

/**
 * Release the SPS stored in slot @p id of the parameter set context.
 *
 * When the slot is occupied, s->sps is cleared if it points at that entry's
 * data, and every stored PPS whose sps_id equals @p id is removed through
 * remove_pps(). The slot's buffer reference is dropped in all cases.
 */
static void remove_sps(H264ParamSets *s, int id)
{
    AVBufferRef **slot = &s->sps_list[id];

    if (*slot) {
        int pps_idx;

        if (s->sps == (SPS*)(*slot)->data)
            s->sps = NULL;

        /* a PPS is useless without the SPS it refers to */
        for (pps_idx = 0; pps_idx < FF_ARRAY_ELEMS(s->pps_list); pps_idx++) {
            AVBufferRef *pps_ref = s->pps_list[pps_idx];

            if (!pps_ref)
                continue;
            if (((PPS*)pps_ref->data)->sps_id == id)
                remove_pps(s, pps_idx);
        }
    }

    av_buffer_unref(slot);
}

/**
 * Parse one hrd_parameters() structure from the VUI.
 *
 * The per-CPB bit rate / size values and the two scale fields are read and
 * discarded; only the delay/offset field lengths and the CPB count are
 * stored in @p sps.
 *
 * @param gb    bit reader positioned at the start of hrd_parameters()
 * @param avctx context used for logging
 * @param sps   SPS receiving the parsed lengths and cpb_cnt
 * @return 0 on success, AVERROR_INVALIDDATA if the CPB count exceeds 32
 */
static inline int decode_hrd_parameters(GetBitContext *gb, AVCodecContext *avctx,
                                        SPS *sps)
{
    int cpb_count, i;

    cpb_count = get_ue_golomb_31(gb) + 1; /* cpb_cnt_minus1 + 1 */

    if (cpb_count > 32U) {
        av_log(avctx, AV_LOG_ERROR, "cpb_count %d invalid\n", cpb_count);
        return AVERROR_INVALIDDATA;
    }

    get_bits(gb, 4); /* bit_rate_scale */
    get_bits(gb, 4); /* cpb_size_scale */
    for (i = 0; i < cpb_count; i++) {
        get_ue_golomb_long(gb); /* bit_rate_value_minus1 */
        get_ue_golomb_long(gb); /* cpb_size_value_minus1 */
        get_bits1(gb);          /* cbr_flag */
    }
    sps->initial_cpb_removal_delay_length = get_bits(gb, 5) + 1;
    sps->cpb_removal_delay_length         = get_bits(gb, 5) + 1;
    sps->dpb_output_delay_length          = get_bits(gb, 5) + 1;
    sps->time_offset_length               = get_bits(gb, 5);
    sps->cpb_cnt                          = cpb_count;

    return 0;
}

157 158
/**
 * Parse the VUI (video usability information) part of an SPS.
 *
 * Fills the aspect ratio, colour description, timing, HRD and bitstream
 * restriction fields of @p sps, and writes the chroma sample location to
 * @p avctx.
 *
 * @param gb    bit reader positioned at the start of vui_parameters()
 * @param avctx context used for logging; chroma_sample_location is updated
 * @param sps   SPS being filled in
 * @return 0 on success, AVERROR_INVALIDDATA on an illegal aspect ratio,
 *         zero timing values, a failed HRD parse, an out-of-range
 *         num_reorder_frames or when more bits were read than available
 */
static inline int decode_vui_parameters(GetBitContext *gb, AVCodecContext *avctx,
                                        SPS *sps)
{
    int aspect_ratio_info_present_flag;
    unsigned int aspect_ratio_idc;

    aspect_ratio_info_present_flag = get_bits1(gb);

    if (aspect_ratio_info_present_flag) {
        aspect_ratio_idc = get_bits(gb, 8);
        if (aspect_ratio_idc == EXTENDED_SAR) {
            sps->sar.num = get_bits(gb, 16);
            sps->sar.den = get_bits(gb, 16);
        } else if (aspect_ratio_idc < FF_ARRAY_ELEMS(pixel_aspect)) {
            sps->sar = pixel_aspect[aspect_ratio_idc];
        } else {
            av_log(avctx, AV_LOG_ERROR, "illegal aspect ratio\n");
            return AVERROR_INVALIDDATA;
        }
    } else {
        sps->sar.num =
        sps->sar.den = 0;
    }

    if (get_bits1(gb))      /* overscan_info_present_flag */
        get_bits1(gb);      /* overscan_appropriate_flag */

    sps->video_signal_type_present_flag = get_bits1(gb);
    if (sps->video_signal_type_present_flag) {
        get_bits(gb, 3);                 /* video_format */
        sps->full_range = get_bits1(gb); /* video_full_range_flag */

        sps->colour_description_present_flag = get_bits1(gb);
        if (sps->colour_description_present_flag) {
            sps->color_primaries = get_bits(gb, 8); /* colour_primaries */
            sps->color_trc       = get_bits(gb, 8); /* transfer_characteristics */
            sps->colorspace      = get_bits(gb, 8); /* matrix_coefficients */
            /* values beyond the known enumerators are mapped to "unspecified" */
            if (sps->color_primaries >= AVCOL_PRI_NB)
                sps->color_primaries = AVCOL_PRI_UNSPECIFIED;
            if (sps->color_trc >= AVCOL_TRC_NB)
                sps->color_trc = AVCOL_TRC_UNSPECIFIED;
            if (sps->colorspace >= AVCOL_SPC_NB)
                sps->colorspace = AVCOL_SPC_UNSPECIFIED;
        }
    }

    /* chroma_location_info_present_flag */
    if (get_bits1(gb)) {
        /* chroma_sample_location_type_top_field; H.264 allows 0..5, which is
         * stored as value + 1. Anything else is treated as unspecified
         * instead of being written to the context unchecked. */
        unsigned int chroma_loc_type = get_ue_golomb(gb);

        if (chroma_loc_type <= 5)
            avctx->chroma_sample_location = chroma_loc_type + 1;
        else
            avctx->chroma_sample_location = AVCHROMA_LOC_UNSPECIFIED;
        get_ue_golomb(gb);  /* chroma_sample_location_type_bottom_field */
    }

    sps->timing_info_present_flag = get_bits1(gb);
    if (sps->timing_info_present_flag) {
        sps->num_units_in_tick = get_bits_long(gb, 32);
        sps->time_scale        = get_bits_long(gb, 32);
        if (!sps->num_units_in_tick || !sps->time_scale) {
            av_log(avctx, AV_LOG_ERROR,
                   "time_scale/num_units_in_tick invalid or unsupported (%"PRIu32"/%"PRIu32")\n",
                   sps->time_scale, sps->num_units_in_tick);
            return AVERROR_INVALIDDATA;
        }
        sps->fixed_frame_rate_flag = get_bits1(gb);
    }

    sps->nal_hrd_parameters_present_flag = get_bits1(gb);
    if (sps->nal_hrd_parameters_present_flag)
        if (decode_hrd_parameters(gb, avctx, sps) < 0)
            return AVERROR_INVALIDDATA;
    sps->vcl_hrd_parameters_present_flag = get_bits1(gb);
    if (sps->vcl_hrd_parameters_present_flag)
        if (decode_hrd_parameters(gb, avctx, sps) < 0)
            return AVERROR_INVALIDDATA;
    if (sps->nal_hrd_parameters_present_flag ||
        sps->vcl_hrd_parameters_present_flag)
        get_bits1(gb);     /* low_delay_hrd_flag */
    sps->pic_struct_present_flag = get_bits1(gb);

    sps->bitstream_restriction_flag = get_bits1(gb);
    if (sps->bitstream_restriction_flag) {
        get_bits1(gb);     /* motion_vectors_over_pic_boundaries_flag */
        get_ue_golomb(gb); /* max_bytes_per_pic_denom */
        get_ue_golomb(gb); /* max_bits_per_mb_denom */
        get_ue_golomb(gb); /* log2_max_mv_length_horizontal */
        get_ue_golomb(gb); /* log2_max_mv_length_vertical */
        sps->num_reorder_frames = get_ue_golomb(gb);
        get_ue_golomb(gb); /*max_dec_frame_buffering*/

        /* the restriction fields ran past the end of the data: ignore them */
        if (get_bits_left(gb) < 0) {
            sps->num_reorder_frames         = 0;
            sps->bitstream_restriction_flag = 0;
        }

        if (sps->num_reorder_frames > 16U
            /* max_dec_frame_buffering || max_dec_frame_buffering > 16 */) {
            av_log(avctx, AV_LOG_ERROR,
                   "Clipping illegal num_reorder_frames %d\n",
                   sps->num_reorder_frames);
            /* the clipped value stays in the SPS even though an error is
             * returned */
            sps->num_reorder_frames = 16;
            return AVERROR_INVALIDDATA;
        }
    }
    if (get_bits_left(gb) < 0) {
        av_log(avctx, AV_LOG_ERROR,
               "Overread VUI by %d bits\n", -get_bits_left(gb));
        return AVERROR_INVALIDDATA;
    }

    return 0;
}

269
/**
 * Parse one scaling list.
 *
 * @param gb            bit reader
 * @param factors       destination list of @p size entries
 * @param size          number of entries; 16 selects ff_zigzag_scan, any
 *                      other value selects ff_zigzag_direct
 * @param jvt_list      list copied when the first decoded value is 0
 * @param fallback_list list copied when the "list present" bit is 0
 */
static void decode_scaling_list(GetBitContext *gb, uint8_t *factors, int size,
                                const uint8_t *jvt_list,
                                const uint8_t *fallback_list)
{
    int i, last = 8, next = 8;
    const uint8_t *scan = size == 16 ? ff_zigzag_scan : ff_zigzag_direct;

    if (!get_bits1(gb)) { /* matrix not written, we use the predicted one */
        memcpy(factors, fallback_list, size * sizeof(uint8_t));
    } else {
        for (i = 0; i < size; i++) {
            /* once next hits 0 no further deltas are read and the last
             * value is repeated for the remaining entries */
            if (next)
                next = (last + get_se_golomb(gb)) & 0xff;
            if (!i && !next) { /* matrix not written, we use the preset one */
                memcpy(factors, jvt_list, size * sizeof(uint8_t));
                break;
            }
            last = factors[scan[i]] = next ? next : last;
        }
    }
}

289
static void decode_scaling_matrices(GetBitContext *gb, SPS *sps,
290 291 292 293
                                    PPS *pps, int is_sps,
                                    uint8_t(*scaling_matrix4)[16],
                                    uint8_t(*scaling_matrix8)[64])
{
294 295 296 297 298
    int fallback_sps = !is_sps && sps->scaling_matrix_present;
    const uint8_t *fallback[4] = {
        fallback_sps ? sps->scaling_matrix4[0] : default_scaling4[0],
        fallback_sps ? sps->scaling_matrix4[3] : default_scaling4[1],
        fallback_sps ? sps->scaling_matrix8[0] : default_scaling8[0],
299
        fallback_sps ? sps->scaling_matrix8[3] : default_scaling8[1]
300
    };
301
    if (get_bits1(gb)) {
302
        sps->scaling_matrix_present |= is_sps;
303 304 305 306 307 308
        decode_scaling_list(gb, scaling_matrix4[0], 16, default_scaling4[0], fallback[0]);        // Intra, Y
        decode_scaling_list(gb, scaling_matrix4[1], 16, default_scaling4[0], scaling_matrix4[0]); // Intra, Cr
        decode_scaling_list(gb, scaling_matrix4[2], 16, default_scaling4[0], scaling_matrix4[1]); // Intra, Cb
        decode_scaling_list(gb, scaling_matrix4[3], 16, default_scaling4[1], fallback[1]);        // Inter, Y
        decode_scaling_list(gb, scaling_matrix4[4], 16, default_scaling4[1], scaling_matrix4[3]); // Inter, Cr
        decode_scaling_list(gb, scaling_matrix4[5], 16, default_scaling4[1], scaling_matrix4[4]); // Inter, Cb
309
        if (is_sps || pps->transform_8x8_mode) {
310
            decode_scaling_list(gb, scaling_matrix8[0], 64, default_scaling8[0], fallback[2]); // Intra, Y
311
            if (sps->chroma_format_idc == 3) {
312 313
                decode_scaling_list(gb, scaling_matrix8[1], 64, default_scaling8[0], scaling_matrix8[0]); // Intra, Cr
                decode_scaling_list(gb, scaling_matrix8[2], 64, default_scaling8[0], scaling_matrix8[1]); // Intra, Cb
314
            }
315
            decode_scaling_list(gb, scaling_matrix8[3], 64, default_scaling8[1], fallback[3]); // Inter, Y
316
            if (sps->chroma_format_idc == 3) {
317 318
                decode_scaling_list(gb, scaling_matrix8[4], 64, default_scaling8[1], scaling_matrix8[3]); // Inter, Cr
                decode_scaling_list(gb, scaling_matrix8[5], 64, default_scaling8[1], scaling_matrix8[4]); // Inter, Cb
319
            }
320 321 322 323
        }
    }
}

324 325
/**
 * Decode a sequence parameter set and store it in @p ps.
 *
 * A new SPS is parsed into a freshly allocated buffer. If the slot for its
 * id already holds a byte-identical SPS the new buffer is discarded;
 * otherwise the old SPS (and every PPS referring to it) is removed and the
 * new buffer takes its place.
 *
 * @param gb    bit reader positioned at profile_idc
 * @param avctx context used for logging and option flags
 * @param ps    parameter set storage to update
 * @return 0 on success, AVERROR(ENOMEM) if the buffer cannot be allocated,
 *         AVERROR_INVALIDDATA for every other failure
 */
int ff_h264_decode_seq_parameter_set(GetBitContext *gb, AVCodecContext *avctx,
                                     H264ParamSets *ps)
{
    AVBufferRef *sps_buf;
    int profile_idc, level_idc, constraint_set_flags = 0;
    unsigned int sps_id;
    int i, log2_max_frame_num_minus4;
    SPS *sps;

    profile_idc           = get_bits(gb, 8);
    constraint_set_flags |= get_bits1(gb) << 0;   // constraint_set0_flag
    constraint_set_flags |= get_bits1(gb) << 1;   // constraint_set1_flag
    constraint_set_flags |= get_bits1(gb) << 2;   // constraint_set2_flag
    constraint_set_flags |= get_bits1(gb) << 3;   // constraint_set3_flag
    constraint_set_flags |= get_bits1(gb) << 4;   // constraint_set4_flag
    constraint_set_flags |= get_bits1(gb) << 5;   // constraint_set5_flag
    skip_bits(gb, 2);                             // reserved_zero_2bits
    level_idc = get_bits(gb, 8);
    sps_id    = get_ue_golomb_31(gb);

    if (sps_id >= MAX_SPS_COUNT) {
        av_log(avctx, AV_LOG_ERROR, "sps_id %u out of range\n", sps_id);
        return AVERROR_INVALIDDATA;
    }

    sps_buf = av_buffer_allocz(sizeof(*sps));
    if (!sps_buf)
        return AVERROR(ENOMEM);
    sps = (SPS*)sps_buf->data;

    sps->sps_id               = sps_id;
    sps->time_offset_length   = 24;
    sps->profile_idc          = profile_idc;
    sps->constraint_set_flags = constraint_set_flags;
    sps->level_idc            = level_idc;

    /* flat matrices (every entry 16) unless the stream provides its own */
    memset(sps->scaling_matrix4, 16, sizeof(sps->scaling_matrix4));
    memset(sps->scaling_matrix8, 16, sizeof(sps->scaling_matrix8));
    sps->scaling_matrix_present = 0;

    if (sps->profile_idc == 100 ||  // High profile
        sps->profile_idc == 110 ||  // High10 profile
        sps->profile_idc == 122 ||  // High422 profile
        sps->profile_idc == 244 ||  // High444 Predictive profile
        sps->profile_idc ==  44 ||  // Cavlc444 profile
        sps->profile_idc ==  83 ||  // Scalable Constrained High profile (SVC)
        sps->profile_idc ==  86 ||  // Scalable High Intra profile (SVC)
        sps->profile_idc == 118 ||  // Stereo High profile (MVC)
        sps->profile_idc == 128 ||  // Multiview High profile (MVC)
        sps->profile_idc == 138 ||  // Multiview Depth High profile (MVCD)
        sps->profile_idc == 144) {  // old High444 profile
        sps->chroma_format_idc = get_ue_golomb_31(gb);
        if (sps->chroma_format_idc > 3) {
            avpriv_request_sample(avctx, "chroma_format_idc %u",
                                  sps->chroma_format_idc);
            goto fail;
        } else if (sps->chroma_format_idc == 3) {
            sps->residual_color_transform_flag = get_bits1(gb);
        }
        sps->bit_depth_luma   = get_ue_golomb(gb) + 8;
        sps->bit_depth_chroma = get_ue_golomb(gb) + 8;
        if (sps->bit_depth_chroma != sps->bit_depth_luma) {
            avpriv_request_sample(avctx,
                                  "Different chroma and luma bit depth");
            goto fail;
        }
        /* H.264 limits bit_depth_*_minus8 to 0..6. Luma and chroma are equal
         * here, so one range test covers both. The depth later feeds table
         * sizes and indices (see max_qp in the dequant/qp table builders). */
        if (sps->bit_depth_luma < 8 || sps->bit_depth_luma > 14) {
            av_log(avctx, AV_LOG_ERROR, "illegal bit depth value (%d, %d)\n",
                   sps->bit_depth_luma, sps->bit_depth_chroma);
            goto fail;
        }
        sps->transform_bypass = get_bits1(gb);
        decode_scaling_matrices(gb, sps, NULL, 1,
                                sps->scaling_matrix4, sps->scaling_matrix8);
    } else {
        sps->chroma_format_idc = 1;
        sps->bit_depth_luma    = 8;
        sps->bit_depth_chroma  = 8;
    }

    log2_max_frame_num_minus4 = get_ue_golomb(gb);
    if (log2_max_frame_num_minus4 < MIN_LOG2_MAX_FRAME_NUM - 4 ||
        log2_max_frame_num_minus4 > MAX_LOG2_MAX_FRAME_NUM - 4) {
        av_log(avctx, AV_LOG_ERROR,
               "log2_max_frame_num_minus4 out of range (0-12): %d\n",
               log2_max_frame_num_minus4);
        goto fail;
    }
    sps->log2_max_frame_num = log2_max_frame_num_minus4 + 4;

    sps->poc_type = get_ue_golomb_31(gb);

    if (sps->poc_type == 0) { // FIXME #define
        /* H.264 limits log2_max_pic_order_cnt_lsb_minus4 to 0..12, the same
         * range as log2_max_frame_num_minus4 above */
        int log2_max_poc_lsb_minus4 = get_ue_golomb(gb);

        if (log2_max_poc_lsb_minus4 < 0 || log2_max_poc_lsb_minus4 > 12) {
            av_log(avctx, AV_LOG_ERROR,
                   "log2_max_poc_lsb_minus4 out of range (0-12): %d\n",
                   log2_max_poc_lsb_minus4);
            goto fail;
        }
        sps->log2_max_poc_lsb = log2_max_poc_lsb_minus4 + 4;
    } else if (sps->poc_type == 1) { // FIXME #define
        sps->delta_pic_order_always_zero_flag = get_bits1(gb);
        sps->offset_for_non_ref_pic           = get_se_golomb(gb);
        sps->offset_for_top_to_bottom_field   = get_se_golomb(gb);
        sps->poc_cycle_length                 = get_ue_golomb(gb);

        if ((unsigned)sps->poc_cycle_length >=
            FF_ARRAY_ELEMS(sps->offset_for_ref_frame)) {
            av_log(avctx, AV_LOG_ERROR,
                   "poc_cycle_length overflow %d\n", sps->poc_cycle_length);
            goto fail;
        }

        for (i = 0; i < sps->poc_cycle_length; i++)
            sps->offset_for_ref_frame[i] = get_se_golomb(gb);
    } else if (sps->poc_type != 2) {
        av_log(avctx, AV_LOG_ERROR, "illegal POC type %d\n", sps->poc_type);
        goto fail;
    }

    sps->ref_frame_count = get_ue_golomb_31(gb);
    if (sps->ref_frame_count > MAX_DELAYED_PIC_COUNT) {
        av_log(avctx, AV_LOG_ERROR,
               "too many reference frames %d\n", sps->ref_frame_count);
        goto fail;
    }
    sps->gaps_in_frame_num_allowed_flag = get_bits1(gb);
    sps->mb_width                       = get_ue_golomb(gb) + 1;
    sps->mb_height                      = get_ue_golomb(gb) + 1;
    /* the first two tests keep 16 * mb_width/height from overflowing */
    if ((unsigned)sps->mb_width  >= INT_MAX / 16 ||
        (unsigned)sps->mb_height >= INT_MAX / 16 ||
        av_image_check_size(16 * sps->mb_width,
                            16 * sps->mb_height, 0, avctx)) {
        av_log(avctx, AV_LOG_ERROR, "mb_width/height overflow\n");
        goto fail;
    }

    sps->frame_mbs_only_flag = get_bits1(gb);
    if (!sps->frame_mbs_only_flag)
        sps->mb_aff = get_bits1(gb);
    else
        sps->mb_aff = 0;

    sps->direct_8x8_inference_flag = get_bits1(gb);
    if (!sps->frame_mbs_only_flag && !sps->direct_8x8_inference_flag) {
        av_log(avctx, AV_LOG_ERROR,
               "This stream was generated by a broken encoder, invalid 8x8 inference\n");
        goto fail;
    }

#ifndef ALLOW_INTERLACE
    if (sps->mb_aff)
        av_log(avctx, AV_LOG_ERROR,
               "MBAFF support not included; enable it at compile-time.\n");
#endif
    sps->crop = get_bits1(gb);
    if (sps->crop) {
        unsigned int crop_left   = get_ue_golomb(gb);
        unsigned int crop_right  = get_ue_golomb(gb);
        unsigned int crop_top    = get_ue_golomb(gb);
        unsigned int crop_bottom = get_ue_golomb(gb);

        if (avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) {
            av_log(avctx, AV_LOG_DEBUG, "discarding sps cropping, original "
                                           "values are l:%u r:%u t:%u b:%u\n",
                   crop_left, crop_right, crop_top, crop_bottom);

            sps->crop_left   =
            sps->crop_right  =
            sps->crop_top    =
            sps->crop_bottom = 0;
        } else {
            /* crop values are coded in units of step_x/step_y luma samples */
            int vsub   = (sps->chroma_format_idc == 1) ? 1 : 0;
            int hsub   = (sps->chroma_format_idc == 1 ||
                          sps->chroma_format_idc == 2) ? 1 : 0;
            int step_x = 1 << hsub;
            int step_y = (2 - sps->frame_mbs_only_flag) << vsub;

            if (crop_left & (0x1F >> (sps->bit_depth_luma > 8)) &&
                !(avctx->flags & AV_CODEC_FLAG_UNALIGNED)) {
                crop_left &= ~(0x1F >> (sps->bit_depth_luma > 8));
                av_log(avctx, AV_LOG_WARNING,
                       "Reducing left cropping to %u "
                       "chroma samples to preserve alignment.\n",
                       crop_left);
            }

            /* reject crops that would overflow or consume the whole frame */
            if (INT_MAX / step_x             <= crop_left               ||
                INT_MAX / step_x - crop_left <= crop_right              ||
                16 * sps->mb_width <= step_x * (crop_left + crop_right) ||
                INT_MAX / step_y             <= crop_top                ||
                INT_MAX / step_y - crop_top  <= crop_bottom             ||
                16 * sps->mb_height <= step_y * (crop_top + crop_bottom)) {
                av_log(avctx, AV_LOG_WARNING, "Invalid crop parameters\n");
                if (avctx->err_recognition & AV_EF_EXPLODE)
                    goto fail;
                crop_left = crop_right = crop_top = crop_bottom = 0;
            }

            sps->crop_left   = crop_left   * step_x;
            sps->crop_right  = crop_right  * step_x;
            sps->crop_top    = crop_top    * step_y;
            sps->crop_bottom = crop_bottom * step_y;
        }
    } else {
        sps->crop_left   =
        sps->crop_right  =
        sps->crop_top    =
        sps->crop_bottom =
        sps->crop        = 0;
    }

    sps->vui_parameters_present_flag = get_bits1(gb);
    if (sps->vui_parameters_present_flag) {
        /* a broken VUI only rejects the SPS when AV_EF_EXPLODE is set */
        int ret = decode_vui_parameters(gb, avctx, sps);
        if (ret < 0 && avctx->err_recognition & AV_EF_EXPLODE)
            goto fail;
    }

    /* if the maximum delay is not stored in the SPS, derive it based on the
     * level */
    if (!sps->bitstream_restriction_flag &&
        (sps->ref_frame_count || avctx->strict_std_compliance >= FF_COMPLIANCE_STRICT)) {
        sps->num_reorder_frames = MAX_DELAYED_PIC_COUNT - 1;
        for (i = 0; i < FF_ARRAY_ELEMS(level_max_dpb_mbs); i++) {
            if (level_max_dpb_mbs[i][0] == sps->level_idc) {
                sps->num_reorder_frames = FFMIN(level_max_dpb_mbs[i][1] / (sps->mb_width * sps->mb_height),
                                                sps->num_reorder_frames);
                break;
            }
        }
    }

    if (!sps->sar.den)
        sps->sar.den = 1;

    if (avctx->debug & FF_DEBUG_PICT_INFO) {
        static const char csp[4][5] = { "Gray", "420", "422", "444" };
        av_log(avctx, AV_LOG_DEBUG,
               "sps:%u profile:%d/%d poc:%d ref:%d %dx%d %s %s crop:%u/%u/%u/%u %s %s %"PRIu32"/%"PRIu32"\n",
               sps_id, sps->profile_idc, sps->level_idc,
               sps->poc_type,
               sps->ref_frame_count,
               sps->mb_width, sps->mb_height,
               sps->frame_mbs_only_flag ? "FRM" : (sps->mb_aff ? "MB-AFF" : "PIC-AFF"),
               sps->direct_8x8_inference_flag ? "8B8" : "",
               sps->crop_left, sps->crop_right,
               sps->crop_top, sps->crop_bottom,
               sps->vui_parameters_present_flag ? "VUI" : "",
               csp[sps->chroma_format_idc],
               sps->timing_info_present_flag ? sps->num_units_in_tick : 0,
               sps->timing_info_present_flag ? sps->time_scale : 0);
    }

    /* check if this is a repeat of an already parsed SPS, then keep the
     * original one.
     * otherwise drop all PPSes that depend on it */
    if (ps->sps_list[sps_id] &&
        !memcmp(ps->sps_list[sps_id]->data, sps_buf->data, sps_buf->size)) {
        av_buffer_unref(&sps_buf);
    } else {
        remove_sps(ps, sps_id);
        ps->sps_list[sps_id] = sps_buf;
    }

    return 0;

fail:
    av_buffer_unref(&sps_buf);
    return AVERROR_INVALIDDATA;
}

585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654
/**
 * Fill the 8x8 dequantisation tables of @p pps.
 *
 * Each of the six lists gets its own buffer unless an earlier list has an
 * identical scaling matrix, in which case that earlier buffer is shared and
 * nothing is recomputed. Tables cover qp 0 .. 51 + 6 * (bit_depth_luma - 8).
 */
static void init_dequant8_coeff_table(PPS *pps, const SPS *sps)
{
    const int max_qp = 51 + 6 * (sps->bit_depth_luma - 8);
    int list;

    for (list = 0; list < 6; list++) {
        int prev, qp;

        /* look for an earlier list with the same matrix */
        for (prev = 0; prev < list; prev++)
            if (!memcmp(pps->scaling_matrix8[prev], pps->scaling_matrix8[list],
                        64 * sizeof(uint8_t)))
                break;

        if (prev < list) {
            pps->dequant8_coeff[list] = pps->dequant8_buffer[prev];
            continue;
        }
        pps->dequant8_coeff[list] = pps->dequant8_buffer[list];

        for (qp = 0; qp <= max_qp; qp++) {
            const int shift = ff_h264_quant_div6[qp];
            const int rem   = ff_h264_quant_rem6[qp];
            int pos;

            for (pos = 0; pos < 64; pos++) {
                /* destination index swaps the row and column of pos */
                const int dst   = (pos >> 3) | ((pos & 7) << 3);
                const int coeff = ff_h264_dequant8_coeff_init_scan[((pos >> 1) & 12) | (pos & 3)];

                pps->dequant8_coeff[list][qp][dst] =
                    ((uint32_t)ff_h264_dequant8_coeff_init[rem][coeff] *
                     pps->scaling_matrix8[list][pos]) << shift;
            }
        }
    }
}

/**
 * Fill the 4x4 dequantisation tables of @p pps.
 *
 * Each of the six lists gets its own buffer unless an earlier list has an
 * identical scaling matrix, in which case that earlier buffer is shared and
 * nothing is recomputed. Tables cover qp 0 .. 51 + 6 * (bit_depth_luma - 8).
 */
static void init_dequant4_coeff_table(PPS *pps, const SPS *sps)
{
    const int max_qp = 51 + 6 * (sps->bit_depth_luma - 8);
    int list;

    for (list = 0; list < 6; list++) {
        int prev, qp;

        /* look for an earlier list with the same matrix */
        for (prev = 0; prev < list; prev++)
            if (!memcmp(pps->scaling_matrix4[prev], pps->scaling_matrix4[list],
                        16 * sizeof(uint8_t)))
                break;

        if (prev < list) {
            pps->dequant4_coeff[list] = pps->dequant4_buffer[prev];
            continue;
        }
        pps->dequant4_coeff[list] = pps->dequant4_buffer[list];

        for (qp = 0; qp <= max_qp; qp++) {
            const int shift = ff_h264_quant_div6[qp] + 2;
            const int rem   = ff_h264_quant_rem6[qp];
            int pos;

            for (pos = 0; pos < 16; pos++) {
                /* destination index swaps the row and column of pos */
                const int dst   = (pos >> 2) | ((pos << 2) & 0xF);
                const int coeff = (pos & 1) + ((pos >> 2) & 1);

                pps->dequant4_coeff[list][qp][dst] =
                    ((uint32_t)ff_h264_dequant4_coeff_init[rem][coeff] *
                     pps->scaling_matrix4[list][pos]) << shift;
            }
        }
    }
}

/**
 * Build all dequantisation tables of @p pps.
 *
 * The 4x4 tables are always built; the 8x8 tables only when the PPS enables
 * the 8x8 transform. When the SPS sets transform_bypass, the qp 0 entries of
 * every built table are overwritten with 1 << 6.
 */
static void init_dequant_tables(PPS *pps, const SPS *sps)
{
    int list, pos;

    init_dequant4_coeff_table(pps, sps);
    if (pps->transform_8x8_mode)
        init_dequant8_coeff_table(pps, sps);

    if (!sps->transform_bypass)
        return;

    for (list = 0; list < 6; list++)
        for (pos = 0; pos < 16; pos++)
            pps->dequant4_coeff[list][0][pos] = 1 << 6;

    if (!pps->transform_8x8_mode)
        return;

    for (list = 0; list < 6; list++)
        for (pos = 0; pos < 64; pos++)
            pps->dequant8_coeff[list][0][pos] = 1 << 6;
}

655
/**
 * Fill one chroma qp lookup table of @p pps.
 *
 * For every qp i in 0 .. 51 + 6 * (depth - 8) the entry is taken from
 * ff_h264_chroma_qp[depth - 8] at i + index, clipped to the same qp range.
 *
 * @param pps   PPS whose chroma_qp_table[t] is written
 * @param t     which of the tables to fill
 * @param index chroma qp index offset added to each qp before the lookup
 * @param depth bit depth; selects the ff_h264_chroma_qp row and the qp range
 */
static void build_qp_table(PPS *pps, int t, int index, const int depth)
{
    int i;
    const int max_qp = 51 + 6 * (depth - 8);

    for (i = 0; i < max_qp + 1; i++)
        pps->chroma_qp_table[t][i] =
            ff_h264_chroma_qp[depth - 8][av_clip(i + index, 0, max_qp)];
}

664 665
/**
 * Decode a picture parameter set and store it in @p ps.
 *
 * The PPS is parsed into a freshly allocated buffer; on success any PPS
 * previously stored under the same id is removed and replaced.
 *
 * @param gb         bit reader positioned at pic_parameter_set_id
 * @param avctx      context used for logging
 * @param ps         parameter set storage; must already hold the SPS the
 *                   PPS refers to
 * @param bit_length number of bits in the PPS payload, used to detect the
 *                   optional trailing fields
 * @return 0 on success, AVERROR(ENOMEM) if the buffer cannot be allocated,
 *         AVERROR_PATCHWELCOME for luma bit depths above 10,
 *         AVERROR_INVALIDDATA for out-of-range ids or reference counts
 */
int ff_h264_decode_picture_parameter_set(GetBitContext *gb, AVCodecContext *avctx,
                                         H264ParamSets *ps, int bit_length)
{
    AVBufferRef *pps_buf;
    SPS *sps;
    unsigned int pps_id = get_ue_golomb(gb);
    PPS *pps;
    int qp_bd_offset;
    int bits_left;
    int ret;

    if (pps_id >= MAX_PPS_COUNT) {
        av_log(avctx, AV_LOG_ERROR, "pps_id %u out of range\n", pps_id);
        return AVERROR_INVALIDDATA;
    }

    pps_buf = av_buffer_allocz(sizeof(*pps));
    if (!pps_buf)
        return AVERROR(ENOMEM);
    pps = (PPS*)pps_buf->data;

    pps->sps_id = get_ue_golomb_31(gb);
    if ((unsigned)pps->sps_id >= MAX_SPS_COUNT ||
        !ps->sps_list[pps->sps_id]) {
        av_log(avctx, AV_LOG_ERROR, "sps_id %u out of range\n", pps->sps_id);
        ret = AVERROR_INVALIDDATA;
        goto fail;
    }
    sps = (SPS*)ps->sps_list[pps->sps_id]->data;

    if (sps->bit_depth_luma > 10) {
        av_log(avctx, AV_LOG_ERROR,
               "Unimplemented luma bit depth=%d (max=10)\n",
               sps->bit_depth_luma);
        ret = AVERROR_PATCHWELCOME;
        goto fail;
    }

    pps->cabac             = get_bits1(gb);
    pps->pic_order_present = get_bits1(gb);
    pps->slice_group_count = get_ue_golomb(gb) + 1;
    if (pps->slice_group_count > 1) {
        pps->mb_slice_group_map_type = get_ue_golomb(gb);
        av_log(avctx, AV_LOG_ERROR, "FMO not supported\n");
        /* NOTE(review): none of the slice group syntax below is parsed or
         * skipped, so the fields read after this point are misaligned for
         * FMO streams. Parsing still continues, as before.
         *
         * Unparsed syntax per mb_slice_group_map_type:
         *   0:       for (i = 0; i <= num_slice_groups_minus1; i++)
         *                run_length[i]                        ue(v)
         *   2:       for (i = 0; i < num_slice_groups_minus1; i++) {
         *                top_left_mb[i]                       ue(v)
         *                bottom_right_mb[i]                   ue(v)
         *            }
         *   3, 4, 5: slice_group_change_direction_flag        u(1)
         *            slice_group_change_rate_minus1           ue(v)
         *   6:       slice_group_id_cnt_minus1                ue(v)
         *            for (i = 0; i <= slice_group_id_cnt_minus1; i++)
         *                slice_group_id[i]                    u(v)
         */
    }
    pps->ref_count[0] = get_ue_golomb(gb) + 1;
    pps->ref_count[1] = get_ue_golomb(gb) + 1;
    if (pps->ref_count[0] - 1 > 32 - 1 || pps->ref_count[1] - 1 > 32 - 1) {
        av_log(avctx, AV_LOG_ERROR, "reference overflow (pps)\n");
        ret = AVERROR_INVALIDDATA;
        goto fail;
    }

    qp_bd_offset = 6 * (sps->bit_depth_luma - 8);

    pps->weighted_pred                        = get_bits1(gb);
    pps->weighted_bipred_idc                  = get_bits(gb, 2);
    pps->init_qp                              = get_se_golomb(gb) + 26 + qp_bd_offset;
    pps->init_qs                              = get_se_golomb(gb) + 26 + qp_bd_offset;
    pps->chroma_qp_index_offset[0]            = get_se_golomb(gb);
    pps->deblocking_filter_parameters_present = get_bits1(gb);
    pps->constrained_intra_pred               = get_bits1(gb);
    pps->redundant_pic_cnt_present            = get_bits1(gb);

    /* start from the SPS matrices; the PPS may override them below */
    pps->transform_8x8_mode = 0;
    memcpy(pps->scaling_matrix4, sps->scaling_matrix4,
           sizeof(pps->scaling_matrix4));
    memcpy(pps->scaling_matrix8, sps->scaling_matrix8,
           sizeof(pps->scaling_matrix8));

    /* The optional trailing fields are present when more than the trailing
     * bits pattern (a single 1 followed by zeros, at most 8 bits) remains.
     * bits_left is negative after an overread; show_bits() and the shift
     * must not see that, so such a PPS is treated as having no extension. */
    bits_left = bit_length - get_bits_count(gb);
    if (bits_left > 0 && (bits_left > 8 ||
                          show_bits(gb, bits_left) != 1 << (bits_left - 1))) {
        pps->transform_8x8_mode = get_bits1(gb);
        decode_scaling_matrices(gb, sps, pps, 0,
                                pps->scaling_matrix4, pps->scaling_matrix8);
        // second_chroma_qp_index_offset
        pps->chroma_qp_index_offset[1] = get_se_golomb(gb);
    } else {
        pps->chroma_qp_index_offset[1] = pps->chroma_qp_index_offset[0];
    }

    build_qp_table(pps, 0, pps->chroma_qp_index_offset[0],
                   sps->bit_depth_luma);
    build_qp_table(pps, 1, pps->chroma_qp_index_offset[1],
                   sps->bit_depth_luma);

    init_dequant_tables(pps, sps);

    if (pps->chroma_qp_index_offset[0] != pps->chroma_qp_index_offset[1])
        pps->chroma_qp_diff = 1;

    if (avctx->debug & FF_DEBUG_PICT_INFO) {
        av_log(avctx, AV_LOG_DEBUG,
               "pps:%u sps:%u %s slice_groups:%d ref:%u/%u %s qp:%d/%d/%d/%d %s %s %s %s\n",
               pps_id, pps->sps_id,
               pps->cabac ? "CABAC" : "CAVLC",
               pps->slice_group_count,
               pps->ref_count[0], pps->ref_count[1],
               pps->weighted_pred ? "weighted" : "",
               pps->init_qp, pps->init_qs, pps->chroma_qp_index_offset[0], pps->chroma_qp_index_offset[1],
               pps->deblocking_filter_parameters_present ? "LPAR" : "",
               pps->constrained_intra_pred ? "CONSTR" : "",
               pps->redundant_pic_cnt_present ? "REDU" : "",
               pps->transform_8x8_mode ? "8x8DCT" : "");
    }

    remove_pps(ps, pps_id);
    ps->pps_list[pps_id] = pps_buf;

    return 0;

fail:
    av_buffer_unref(&pps_buf);
    return ret;
}