/*
 * H.26L/H.264/AVC/JVT/14496-10/... parameter set decoding
 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * H.264 / AVC / MPEG-4 part10 parameter set decoding.
 * @author Michael Niedermayer <michaelni@gmx.at>
 */

#include <inttypes.h>
#include <limits.h>
#include <string.h>

#include "libavutil/imgutils.h"
#include "internal.h"
#include "mathops.h"
#include "avcodec.h"
#include "h264data.h"
#include "h264_ps.h"
#include "golomb.h"

/* Inclusive bounds on log2_max_frame_num; the SPS parser compares
 * log2_max_frame_num_minus4 against these values minus 4 (i.e. 0..12). */
#define MAX_LOG2_MAX_FRAME_NUM    (12 + 4)
#define MIN_LOG2_MAX_FRAME_NUM    4

/* aspect_ratio_idc value for which the VUI parser reads an explicit 16-bit
 * numerator and denominator instead of using a predefined ratio. */
#define EXTENDED_SAR       255

43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60
static const AVRational pixel_aspect[17] = {
    {   0,  1 },
    {   1,  1 },
    {  12, 11 },
    {  10, 11 },
    {  16, 11 },
    {  40, 33 },
    {  24, 11 },
    {  20, 11 },
    {  32, 11 },
    {  80, 33 },
    {  18, 11 },
    {  15, 11 },
    {  64, 33 },
    { 160, 99 },
    {   4,  3 },
    {   3,  2 },
    {   2,  1 },
61 62
};

/* Preset 4x4 scaling lists, used when the bitstream signals that a list is
 * "not written, use the preset one" and as the fallback for the first list of
 * each group when no SPS matrix is available.
 * Row 0 is passed for the intra lists, row 1 for the inter lists. */
static const uint8_t default_scaling4[2][16] = {
    {  6, 13, 20, 28, 13, 20, 28, 32,
      20, 28, 32, 37, 28, 32, 37, 42 },
    { 10, 14, 20, 24, 14, 20, 24, 27,
      20, 24, 27, 30, 24, 27, 30, 34 }
};

/* Preset 8x8 scaling lists: row 0 is handed to the scaling-list parser for
 * the intra lists, row 1 for the inter lists. */
static const uint8_t default_scaling8[2][64] = {
    [0] = {
         6, 10, 13, 16, 18, 23, 25, 27,
        10, 11, 16, 18, 23, 25, 27, 29,
        13, 16, 18, 23, 25, 27, 29, 31,
        16, 18, 23, 25, 27, 29, 31, 33,
        18, 23, 25, 27, 29, 31, 33, 36,
        23, 25, 27, 29, 31, 33, 36, 38,
        25, 27, 29, 31, 33, 36, 38, 40,
        27, 29, 31, 33, 36, 38, 40, 42,
    },
    [1] = {
         9, 13, 15, 17, 19, 21, 22, 24,
        13, 13, 17, 19, 21, 22, 24, 25,
        15, 17, 19, 21, 22, 24, 25, 27,
        17, 19, 21, 22, 24, 25, 27, 28,
        19, 21, 22, 24, 25, 27, 28, 30,
        21, 22, 24, 25, 27, 28, 30, 32,
        22, 24, 25, 27, 28, 30, 32, 33,
        24, 25, 27, 28, 30, 32, 33, 35,
    },
};

/* Maximum number of MBs in the DPB for a given level.
 * Each row is { level_idc, max DPB macroblocks }; the SPS parser looks up the
 * row whose first element equals sps->level_idc. */
static const int level_max_dpb_mbs[][2] = {
    { 10, 396       },
    { 11, 900       },
    { 12, 2376      },
    { 13, 2376      },
    { 20, 2376      },
    { 21, 4752      },
    { 22, 8100      },
    { 30, 8100      },
    { 31, 18000     },
    { 32, 20480     },
    { 40, 32768     },
    { 41, 32768     },
    { 42, 34816     },
    { 50, 110400    },
    { 51, 184320    },
    { 52, 184320    },
};

109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132
static void remove_pps(H264ParamSets *s, int id)
{
    if (s->pps_list[id] && s->pps == (const PPS*)s->pps_list[id]->data)
        s->pps = NULL;
    av_buffer_unref(&s->pps_list[id]);
}

/**
 * Release the SPS stored in slot @p id together with every PPS that names it.
 *
 * When the slot is occupied, the active SPS pointer is cleared if it refers
 * to this slot's data, and each stored PPS whose sps_id equals @p id is
 * removed. The slot's buffer reference is dropped in all cases.
 *
 * @param s  parameter set storage
 * @param id index into s->sps_list; not range-checked here
 */
static void remove_sps(H264ParamSets *s, int id)
{
    if (s->sps_list[id]) {
        int pps_idx = 0;

        if ((SPS*)s->sps_list[id]->data == s->sps)
            s->sps = NULL;

        /* drop all PPS that depend on this SPS */
        while (pps_idx < FF_ARRAY_ELEMS(s->pps_list)) {
            if (s->pps_list[pps_idx] &&
                ((PPS*)s->pps_list[pps_idx]->data)->sps_id == id)
                remove_pps(s, pps_idx);
            pps_idx++;
        }
    }

    av_buffer_unref(&s->sps_list[id]);
}

/**
 * Parse one set of HRD parameters from the bitstream.
 *
 * The scale fields and the per-CPB bit rate / CPB size / CBR values are read
 * and discarded; only the delay and time-offset field lengths and the CPB
 * count are stored in @p sps.
 *
 * @param gb    bit reader positioned at the HRD parameters
 * @param avctx codec context, used for logging
 * @param sps   SPS that receives the parsed lengths and cpb_cnt
 * @return 0 on success, AVERROR_INVALIDDATA if cpb_count exceeds 32
 */
static inline int decode_hrd_parameters(GetBitContext *gb, AVCodecContext *avctx,
                                        SPS *sps)
{
    int cpb_count, i;
    cpb_count = get_ue_golomb_31(gb) + 1;

    /* unsigned compare: a negative count is rejected as well */
    if (cpb_count > 32U) {
        av_log(avctx, AV_LOG_ERROR, "cpb_count %d invalid\n", cpb_count);
        return AVERROR_INVALIDDATA;
    }

    get_bits(gb, 4); /* bit_rate_scale */
    get_bits(gb, 4); /* cpb_size_scale */
    for (i = 0; i < cpb_count; i++) {
        get_ue_golomb_long(gb); /* bit_rate_value_minus1 */
        get_ue_golomb_long(gb); /* cpb_size_value_minus1 */
        get_bits1(gb);          /* cbr_flag */
    }
    sps->initial_cpb_removal_delay_length = get_bits(gb, 5) + 1;
    sps->cpb_removal_delay_length         = get_bits(gb, 5) + 1;
    sps->dpb_output_delay_length          = get_bits(gb, 5) + 1;
    sps->time_offset_length               = get_bits(gb, 5);
    sps->cpb_cnt                          = cpb_count;
    return 0;
}

157 158
static inline int decode_vui_parameters(GetBitContext *gb, AVCodecContext *avctx,
                                        SPS *sps)
159
{
160 161 162
    int aspect_ratio_info_present_flag;
    unsigned int aspect_ratio_idc;

163
    aspect_ratio_info_present_flag = get_bits1(gb);
164

165
    if (aspect_ratio_info_present_flag) {
166
        aspect_ratio_idc = get_bits(gb, 8);
167
        if (aspect_ratio_idc == EXTENDED_SAR) {
168 169
            sps->sar.num = get_bits(gb, 16);
            sps->sar.den = get_bits(gb, 16);
170 171 172
        } else if (aspect_ratio_idc < FF_ARRAY_ELEMS(pixel_aspect)) {
            sps->sar = pixel_aspect[aspect_ratio_idc];
        } else {
173
            av_log(avctx, AV_LOG_ERROR, "illegal aspect ratio\n");
174
            return AVERROR_INVALIDDATA;
175
        }
176 177 178
    } else {
        sps->sar.num =
        sps->sar.den = 0;
179 180
    }

181 182
    if (get_bits1(gb))      /* overscan_info_present_flag */
        get_bits1(gb);      /* overscan_appropriate_flag */
183

184
    sps->video_signal_type_present_flag = get_bits1(gb);
185
    if (sps->video_signal_type_present_flag) {
186 187
        get_bits(gb, 3);                 /* video_format */
        sps->full_range = get_bits1(gb); /* video_full_range_flag */
188

189
        sps->colour_description_present_flag = get_bits1(gb);
190
        if (sps->colour_description_present_flag) {
191 192 193
            sps->color_primaries = get_bits(gb, 8); /* colour_primaries */
            sps->color_trc       = get_bits(gb, 8); /* transfer_characteristics */
            sps->colorspace      = get_bits(gb, 8); /* matrix_coefficients */
194 195 196

            // Set invalid values to "unspecified"
            if (!av_color_primaries_name(sps->color_primaries))
197
                sps->color_primaries = AVCOL_PRI_UNSPECIFIED;
198
            if (!av_color_transfer_name(sps->color_trc))
199
                sps->color_trc = AVCOL_TRC_UNSPECIFIED;
200
            if (!av_color_space_name(sps->colorspace))
201
                sps->colorspace = AVCOL_SPC_UNSPECIFIED;
202 203 204
        }
    }

205
    /* chroma_location_info_present_flag */
206
    if (get_bits1(gb)) {
207
        /* chroma_sample_location_type_top_field */
208 209
        avctx->chroma_sample_location = get_ue_golomb(gb) + 1;
        get_ue_golomb(gb);  /* chroma_sample_location_type_bottom_field */
210 211
    }

212
    sps->timing_info_present_flag = get_bits1(gb);
213
    if (sps->timing_info_present_flag) {
214 215
        sps->num_units_in_tick = get_bits_long(gb, 32);
        sps->time_scale        = get_bits_long(gb, 32);
216
        if (!sps->num_units_in_tick || !sps->time_scale) {
217
            av_log(avctx, AV_LOG_ERROR,
218
                   "time_scale/num_units_in_tick invalid or unsupported (%"PRIu32"/%"PRIu32")\n",
219
                   sps->time_scale, sps->num_units_in_tick);
220
            return AVERROR_INVALIDDATA;
221
        }
222
        sps->fixed_frame_rate_flag = get_bits1(gb);
223 224
    }

225
    sps->nal_hrd_parameters_present_flag = get_bits1(gb);
226
    if (sps->nal_hrd_parameters_present_flag)
227
        if (decode_hrd_parameters(gb, avctx, sps) < 0)
228
            return AVERROR_INVALIDDATA;
229
    sps->vcl_hrd_parameters_present_flag = get_bits1(gb);
230
    if (sps->vcl_hrd_parameters_present_flag)
231
        if (decode_hrd_parameters(gb, avctx, sps) < 0)
232
            return AVERROR_INVALIDDATA;
233 234
    if (sps->nal_hrd_parameters_present_flag ||
        sps->vcl_hrd_parameters_present_flag)
235 236
        get_bits1(gb);     /* low_delay_hrd_flag */
    sps->pic_struct_present_flag = get_bits1(gb);
237

238
    sps->bitstream_restriction_flag = get_bits1(gb);
239
    if (sps->bitstream_restriction_flag) {
240 241 242 243 244 245 246 247 248
        get_bits1(gb);     /* motion_vectors_over_pic_boundaries_flag */
        get_ue_golomb(gb); /* max_bytes_per_pic_denom */
        get_ue_golomb(gb); /* max_bits_per_mb_denom */
        get_ue_golomb(gb); /* log2_max_mv_length_horizontal */
        get_ue_golomb(gb); /* log2_max_mv_length_vertical */
        sps->num_reorder_frames = get_ue_golomb(gb);
        get_ue_golomb(gb); /*max_dec_frame_buffering*/

        if (get_bits_left(gb) < 0) {
249 250
            sps->num_reorder_frames         = 0;
            sps->bitstream_restriction_flag = 0;
251 252
        }

253 254
        if (sps->num_reorder_frames > 16U
            /* max_dec_frame_buffering || max_dec_frame_buffering > 16 */) {
255
            av_log(avctx, AV_LOG_ERROR,
256 257 258
                   "Clipping illegal num_reorder_frames %d\n",
                   sps->num_reorder_frames);
            sps->num_reorder_frames = 16;
259
            return AVERROR_INVALIDDATA;
260 261
        }
    }
262 263 264
    if (get_bits_left(gb) < 0) {
        av_log(avctx, AV_LOG_ERROR,
               "Overread VUI by %d bits\n", -get_bits_left(gb));
265 266
        return AVERROR_INVALIDDATA;
    }
267 268 269 270

    return 0;
}

271
static void decode_scaling_list(GetBitContext *gb, uint8_t *factors, int size,
272 273 274
                                const uint8_t *jvt_list,
                                const uint8_t *fallback_list)
{
275
    int i, last = 8, next = 8;
276
    const uint8_t *scan = size == 16 ? ff_zigzag_scan : ff_zigzag_direct;
277
    if (!get_bits1(gb)) /* matrix not written, we use the predicted one */
278
        memcpy(factors, fallback_list, size * sizeof(uint8_t));
279
    else
280 281
        for (i = 0; i < size; i++) {
            if (next)
282
                next = (last + get_se_golomb(gb)) & 0xff;
283 284 285 286 287
            if (!i && !next) { /* matrix not written, we use the preset one */
                memcpy(factors, jvt_list, size * sizeof(uint8_t));
                break;
            }
            last = factors[scan[i]] = next ? next : last;
288 289 290
        }
}

291
static void decode_scaling_matrices(GetBitContext *gb, SPS *sps,
292 293 294 295
                                    PPS *pps, int is_sps,
                                    uint8_t(*scaling_matrix4)[16],
                                    uint8_t(*scaling_matrix8)[64])
{
296 297 298 299 300
    int fallback_sps = !is_sps && sps->scaling_matrix_present;
    const uint8_t *fallback[4] = {
        fallback_sps ? sps->scaling_matrix4[0] : default_scaling4[0],
        fallback_sps ? sps->scaling_matrix4[3] : default_scaling4[1],
        fallback_sps ? sps->scaling_matrix8[0] : default_scaling8[0],
301
        fallback_sps ? sps->scaling_matrix8[3] : default_scaling8[1]
302
    };
303
    if (get_bits1(gb)) {
304
        sps->scaling_matrix_present |= is_sps;
305 306 307 308 309 310
        decode_scaling_list(gb, scaling_matrix4[0], 16, default_scaling4[0], fallback[0]);        // Intra, Y
        decode_scaling_list(gb, scaling_matrix4[1], 16, default_scaling4[0], scaling_matrix4[0]); // Intra, Cr
        decode_scaling_list(gb, scaling_matrix4[2], 16, default_scaling4[0], scaling_matrix4[1]); // Intra, Cb
        decode_scaling_list(gb, scaling_matrix4[3], 16, default_scaling4[1], fallback[1]);        // Inter, Y
        decode_scaling_list(gb, scaling_matrix4[4], 16, default_scaling4[1], scaling_matrix4[3]); // Inter, Cr
        decode_scaling_list(gb, scaling_matrix4[5], 16, default_scaling4[1], scaling_matrix4[4]); // Inter, Cb
311
        if (is_sps || pps->transform_8x8_mode) {
312
            decode_scaling_list(gb, scaling_matrix8[0], 64, default_scaling8[0], fallback[2]); // Intra, Y
313
            if (sps->chroma_format_idc == 3) {
314 315
                decode_scaling_list(gb, scaling_matrix8[1], 64, default_scaling8[0], scaling_matrix8[0]); // Intra, Cr
                decode_scaling_list(gb, scaling_matrix8[2], 64, default_scaling8[0], scaling_matrix8[1]); // Intra, Cb
316
            }
317
            decode_scaling_list(gb, scaling_matrix8[3], 64, default_scaling8[1], fallback[3]); // Inter, Y
318
            if (sps->chroma_format_idc == 3) {
319 320
                decode_scaling_list(gb, scaling_matrix8[4], 64, default_scaling8[1], scaling_matrix8[3]); // Inter, Cr
                decode_scaling_list(gb, scaling_matrix8[5], 64, default_scaling8[1], scaling_matrix8[4]); // Inter, Cb
321
            }
322 323 324 325
        }
    }
}

326 327
int ff_h264_decode_seq_parameter_set(GetBitContext *gb, AVCodecContext *avctx,
                                     H264ParamSets *ps)
328
{
329
    AVBufferRef *sps_buf;
330
    int profile_idc, level_idc, constraint_set_flags = 0;
331
    unsigned int sps_id;
332
    int i, log2_max_frame_num_minus4;
333 334
    SPS *sps;

335 336 337 338 339 340 341 342 343 344
    profile_idc           = get_bits(gb, 8);
    constraint_set_flags |= get_bits1(gb) << 0;   // constraint_set0_flag
    constraint_set_flags |= get_bits1(gb) << 1;   // constraint_set1_flag
    constraint_set_flags |= get_bits1(gb) << 2;   // constraint_set2_flag
    constraint_set_flags |= get_bits1(gb) << 3;   // constraint_set3_flag
    constraint_set_flags |= get_bits1(gb) << 4;   // constraint_set4_flag
    constraint_set_flags |= get_bits1(gb) << 5;   // constraint_set5_flag
    skip_bits(gb, 2);                             // reserved_zero_2bits
    level_idc = get_bits(gb, 8);
    sps_id    = get_ue_golomb_31(gb);
345

346
    if (sps_id >= MAX_SPS_COUNT) {
347
        av_log(avctx, AV_LOG_ERROR, "sps_id %u out of range\n", sps_id);
348
        return AVERROR_INVALIDDATA;
349
    }
350 351 352

    sps_buf = av_buffer_allocz(sizeof(*sps));
    if (!sps_buf)
353
        return AVERROR(ENOMEM);
354
    sps = (SPS*)sps_buf->data;
355

356
    sps->sps_id               = sps_id;
357 358
    sps->time_offset_length   = 24;
    sps->profile_idc          = profile_idc;
359
    sps->constraint_set_flags = constraint_set_flags;
360
    sps->level_idc            = level_idc;
361 362 363 364 365

    memset(sps->scaling_matrix4, 16, sizeof(sps->scaling_matrix4));
    memset(sps->scaling_matrix8, 16, sizeof(sps->scaling_matrix8));
    sps->scaling_matrix_present = 0;

366 367 368 369 370 371 372 373 374 375 376
    if (sps->profile_idc == 100 ||  // High profile
        sps->profile_idc == 110 ||  // High10 profile
        sps->profile_idc == 122 ||  // High422 profile
        sps->profile_idc == 244 ||  // High444 Predictive profile
        sps->profile_idc ==  44 ||  // Cavlc444 profile
        sps->profile_idc ==  83 ||  // Scalable Constrained High profile (SVC)
        sps->profile_idc ==  86 ||  // Scalable High Intra profile (SVC)
        sps->profile_idc == 118 ||  // Stereo High profile (MVC)
        sps->profile_idc == 128 ||  // Multiview High profile (MVC)
        sps->profile_idc == 138 ||  // Multiview Depth High profile (MVCD)
        sps->profile_idc == 144) {  // old High444 profile
377
        sps->chroma_format_idc = get_ue_golomb_31(gb);
378
        if (sps->chroma_format_idc > 3) {
379
            avpriv_request_sample(avctx, "chroma_format_idc %u",
380
                                  sps->chroma_format_idc);
381
            goto fail;
382
        } else if (sps->chroma_format_idc == 3) {
383
            sps->residual_color_transform_flag = get_bits1(gb);
384
        }
385 386
        sps->bit_depth_luma   = get_ue_golomb(gb) + 8;
        sps->bit_depth_chroma = get_ue_golomb(gb) + 8;
387
        if (sps->bit_depth_chroma != sps->bit_depth_luma) {
388
            avpriv_request_sample(avctx,
389 390 391
                                  "Different chroma and luma bit depth");
            goto fail;
        }
392 393
        sps->transform_bypass = get_bits1(gb);
        decode_scaling_matrices(gb, sps, NULL, 1,
394 395 396 397 398
                                sps->scaling_matrix4, sps->scaling_matrix8);
    } else {
        sps->chroma_format_idc = 1;
        sps->bit_depth_luma    = 8;
        sps->bit_depth_chroma  = 8;
399 400
    }

401
    log2_max_frame_num_minus4 = get_ue_golomb(gb);
402 403
    if (log2_max_frame_num_minus4 < MIN_LOG2_MAX_FRAME_NUM - 4 ||
        log2_max_frame_num_minus4 > MAX_LOG2_MAX_FRAME_NUM - 4) {
404
        av_log(avctx, AV_LOG_ERROR,
405 406
               "log2_max_frame_num_minus4 out of range (0-12): %d\n",
               log2_max_frame_num_minus4);
407
        goto fail;
408 409 410
    }
    sps->log2_max_frame_num = log2_max_frame_num_minus4 + 4;

411
    sps->poc_type = get_ue_golomb_31(gb);
412

413
    if (sps->poc_type == 0) { // FIXME #define
414
        sps->log2_max_poc_lsb = get_ue_golomb(gb) + 4;
415
    } else if (sps->poc_type == 1) { // FIXME #define
416 417 418 419
        sps->delta_pic_order_always_zero_flag = get_bits1(gb);
        sps->offset_for_non_ref_pic           = get_se_golomb(gb);
        sps->offset_for_top_to_bottom_field   = get_se_golomb(gb);
        sps->poc_cycle_length                 = get_ue_golomb(gb);
420

421 422
        if ((unsigned)sps->poc_cycle_length >=
            FF_ARRAY_ELEMS(sps->offset_for_ref_frame)) {
423
            av_log(avctx, AV_LOG_ERROR,
424
                   "poc_cycle_length overflow %d\n", sps->poc_cycle_length);
425 426 427
            goto fail;
        }

428
        for (i = 0; i < sps->poc_cycle_length; i++)
429
            sps->offset_for_ref_frame[i] = get_se_golomb(gb);
430
    } else if (sps->poc_type != 2) {
431
        av_log(avctx, AV_LOG_ERROR, "illegal POC type %d\n", sps->poc_type);
432 433 434
        goto fail;
    }

435
    sps->ref_frame_count = get_ue_golomb_31(gb);
436
    if (sps->ref_frame_count > MAX_DELAYED_PIC_COUNT) {
437
        av_log(avctx, AV_LOG_ERROR,
438
               "too many reference frames %d\n", sps->ref_frame_count);
439 440
        goto fail;
    }
441 442 443
    sps->gaps_in_frame_num_allowed_flag = get_bits1(gb);
    sps->mb_width                       = get_ue_golomb(gb) + 1;
    sps->mb_height                      = get_ue_golomb(gb) + 1;
444 445 446 447 448 449 450 451 452

    sps->frame_mbs_only_flag = get_bits1(gb);

    if (sps->mb_height >= INT_MAX / 2) {
        av_log(avctx, AV_LOG_ERROR, "height overflow\n");
        goto fail;
    }
    sps->mb_height *= 2 - sps->frame_mbs_only_flag;

453 454 455
    if ((unsigned)sps->mb_width  >= INT_MAX / 16 ||
        (unsigned)sps->mb_height >= INT_MAX / 16 ||
        av_image_check_size(16 * sps->mb_width,
456 457
                            16 * sps->mb_height, 0, avctx)) {
        av_log(avctx, AV_LOG_ERROR, "mb_width/height overflow\n");
458 459 460
        goto fail;
    }

461
    if (!sps->frame_mbs_only_flag)
462
        sps->mb_aff = get_bits1(gb);
463
    else
464
        sps->mb_aff = 0;
465

466
    sps->direct_8x8_inference_flag = get_bits1(gb);
467
    if (!sps->frame_mbs_only_flag && !sps->direct_8x8_inference_flag) {
468
        av_log(avctx, AV_LOG_ERROR,
469
               "This stream was generated by a broken encoder, invalid 8x8 inference\n");
470 471
        goto fail;
    }
472 473

#ifndef ALLOW_INTERLACE
474
    if (sps->mb_aff)
475
        av_log(avctx, AV_LOG_ERROR,
476
               "MBAFF support not included; enable it at compile-time.\n");
477
#endif
478
    sps->crop = get_bits1(gb);
479
    if (sps->crop) {
480 481 482 483
        unsigned int crop_left   = get_ue_golomb(gb);
        unsigned int crop_right  = get_ue_golomb(gb);
        unsigned int crop_top    = get_ue_golomb(gb);
        unsigned int crop_bottom = get_ue_golomb(gb);
A
Anton Khirnov 已提交
484

485 486
        if (avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) {
            av_log(avctx, AV_LOG_DEBUG, "discarding sps cropping, original "
487
                                           "values are l:%d r:%d t:%d b:%d\n",
488
                   crop_left, crop_right, crop_top, crop_bottom);
489 490 491 492 493

            sps->crop_left   =
            sps->crop_right  =
            sps->crop_top    =
            sps->crop_bottom = 0;
A
Anton Khirnov 已提交
494
        } else {
495 496 497
            int vsub   = (sps->chroma_format_idc == 1) ? 1 : 0;
            int hsub   = (sps->chroma_format_idc == 1 ||
                          sps->chroma_format_idc == 2) ? 1 : 0;
A
Anton Khirnov 已提交
498 499 500 501
            int step_x = 1 << hsub;
            int step_y = (2 - sps->frame_mbs_only_flag) << vsub;

            if (crop_left & (0x1F >> (sps->bit_depth_luma > 8)) &&
502
                !(avctx->flags & AV_CODEC_FLAG_UNALIGNED)) {
A
Anton Khirnov 已提交
503
                crop_left &= ~(0x1F >> (sps->bit_depth_luma > 8));
504
                av_log(avctx, AV_LOG_WARNING,
505
                       "Reducing left cropping to %d "
A
Anton Khirnov 已提交
506 507 508 509
                       "chroma samples to preserve alignment.\n",
                       crop_left);
            }

510 511 512 513 514 515
            if (INT_MAX / step_x             <= crop_left               ||
                INT_MAX / step_x - crop_left <= crop_right              ||
                16 * sps->mb_width <= step_x * (crop_left + crop_right) ||
                INT_MAX / step_y             <= crop_top                ||
                INT_MAX / step_y - crop_top  <= crop_bottom             ||
                16 * sps->mb_height <= step_y * (crop_top + crop_bottom)) {
516 517
                av_log(avctx, AV_LOG_WARNING, "Invalid crop parameters\n");
                if (avctx->err_recognition & AV_EF_EXPLODE)
518 519 520 521
                    goto fail;
                crop_left = crop_right = crop_top = crop_bottom = 0;
            }

A
Anton Khirnov 已提交
522 523 524 525
            sps->crop_left   = crop_left   * step_x;
            sps->crop_right  = crop_right  * step_x;
            sps->crop_top    = crop_top    * step_y;
            sps->crop_bottom = crop_bottom * step_y;
526
        }
527 528 529 530 531 532
    } else {
        sps->crop_left   =
        sps->crop_right  =
        sps->crop_top    =
        sps->crop_bottom =
        sps->crop        = 0;
533 534
    }

535
    sps->vui_parameters_present_flag = get_bits1(gb);
536
    if (sps->vui_parameters_present_flag) {
537 538
        int ret = decode_vui_parameters(gb, avctx, sps);
        if (ret < 0 && avctx->err_recognition & AV_EF_EXPLODE)
539
            goto fail;
540
    }
541

542 543
    /* if the maximum delay is not stored in the SPS, derive it based on the
     * level */
544 545
    if (!sps->bitstream_restriction_flag &&
        (sps->ref_frame_count || avctx->strict_std_compliance >= FF_COMPLIANCE_STRICT)) {
546 547 548 549 550 551 552 553 554 555
        sps->num_reorder_frames = MAX_DELAYED_PIC_COUNT - 1;
        for (i = 0; i < FF_ARRAY_ELEMS(level_max_dpb_mbs); i++) {
            if (level_max_dpb_mbs[i][0] == sps->level_idc) {
                sps->num_reorder_frames = FFMIN(level_max_dpb_mbs[i][1] / (sps->mb_width * sps->mb_height),
                                                sps->num_reorder_frames);
                break;
            }
        }
    }

556 557
    if (!sps->sar.den)
        sps->sar.den = 1;
558

559
    if (avctx->debug & FF_DEBUG_PICT_INFO) {
560
        static const char csp[4][5] = { "Gray", "420", "422", "444" };
561
        av_log(avctx, AV_LOG_DEBUG,
562
               "sps:%u profile:%d/%d poc:%d ref:%d %dx%d %s %s crop:%u/%u/%u/%u %s %s %"PRId32"/%"PRId32"\n",
563 564 565 566 567 568 569 570 571
               sps_id, sps->profile_idc, sps->level_idc,
               sps->poc_type,
               sps->ref_frame_count,
               sps->mb_width, sps->mb_height,
               sps->frame_mbs_only_flag ? "FRM" : (sps->mb_aff ? "MB-AFF" : "PIC-AFF"),
               sps->direct_8x8_inference_flag ? "8B8" : "",
               sps->crop_left, sps->crop_right,
               sps->crop_top, sps->crop_bottom,
               sps->vui_parameters_present_flag ? "VUI" : "",
572
               csp[sps->chroma_format_idc],
573
               sps->timing_info_present_flag ? sps->num_units_in_tick : 0,
574
               sps->timing_info_present_flag ? sps->time_scale : 0);
575 576
    }

577 578 579 580 581 582 583 584 585 586
    /* check if this is a repeat of an already parsed SPS, then keep the
     * original one.
     * otherwise drop all PPSes that depend on it */
    if (ps->sps_list[sps_id] &&
        !memcmp(ps->sps_list[sps_id]->data, sps_buf->data, sps_buf->size)) {
        av_buffer_unref(&sps_buf);
    } else {
        remove_sps(ps, sps_id);
        ps->sps_list[sps_id] = sps_buf;
    }
587

588
    return 0;
589

590
fail:
591
    av_buffer_unref(&sps_buf);
592
    return AVERROR_INVALIDDATA;
593 594
}

595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632 633 634 635 636 637 638 639 640 641 642 643 644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664
static void init_dequant8_coeff_table(PPS *pps, const SPS *sps)
{
    int i, j, q, x;
    const int max_qp = 51 + 6 * (sps->bit_depth_luma - 8);

    for (i = 0; i < 6; i++) {
        pps->dequant8_coeff[i] = pps->dequant8_buffer[i];
        for (j = 0; j < i; j++)
            if (!memcmp(pps->scaling_matrix8[j], pps->scaling_matrix8[i],
                        64 * sizeof(uint8_t))) {
                pps->dequant8_coeff[i] = pps->dequant8_buffer[j];
                break;
            }
        if (j < i)
            continue;

        for (q = 0; q < max_qp + 1; q++) {
            int shift = ff_h264_quant_div6[q];
            int idx   = ff_h264_quant_rem6[q];
            for (x = 0; x < 64; x++)
                pps->dequant8_coeff[i][q][(x >> 3) | ((x & 7) << 3)] =
                    ((uint32_t)ff_h264_dequant8_coeff_init[idx][ff_h264_dequant8_coeff_init_scan[((x >> 1) & 12) | (x & 3)]] *
                     pps->scaling_matrix8[i][x]) << shift;
        }
    }
}

/**
 * Build the 4x4 dequantisation tables for the six scaling lists of a PPS.
 *
 * Lists with a scaling matrix identical to an earlier list point at that
 * earlier list's buffer. The remaining lists get one table per QP in
 * 0..max_qp, with each entry written to the transposed position.
 *
 * @param pps PPS whose dequant4_coeff / dequant4_buffer are filled
 * @param sps SPS supplying bit_depth_luma, which sets the highest QP
 */
static void init_dequant4_coeff_table(PPS *pps, const SPS *sps)
{
    const int max_qp = 51 + 6 * (sps->bit_depth_luma - 8);
    int list;

    for (list = 0; list < 6; list++) {
        int earlier, qp;

        pps->dequant4_coeff[list] = pps->dequant4_buffer[list];

        /* look for an earlier list with the same scaling matrix */
        for (earlier = 0; earlier < list; earlier++) {
            if (memcmp(pps->scaling_matrix4[earlier],
                       pps->scaling_matrix4[list],
                       16 * sizeof(uint8_t)) == 0) {
                pps->dequant4_coeff[list] = pps->dequant4_buffer[earlier];
                break;
            }
        }
        if (earlier != list)
            continue;

        for (qp = 0; qp <= max_qp; qp++) {
            const int shift = ff_h264_quant_div6[qp] + 2;
            const int idx   = ff_h264_quant_rem6[qp];
            int pos;

            for (pos = 0; pos < 16; pos++) {
                const int dst = (pos >> 2) | ((pos << 2) & 0xF);
                const int sel = (pos & 1) + ((pos >> 2) & 1);

                pps->dequant4_coeff[list][qp][dst] =
                    ((uint32_t)ff_h264_dequant4_coeff_init[idx][sel] *
                     pps->scaling_matrix4[list][pos]) << shift;
            }
        }
    }
}

/**
 * Fill all dequantisation tables of a PPS.
 *
 * The 4x4 tables are always built; the 8x8 tables only when the PPS enables
 * the 8x8 transform. When the SPS enables transform bypass, the QP 0 row of
 * every built table is overwritten with the constant 1 << 6.
 *
 * @param pps PPS to fill
 * @param sps SPS the PPS refers to
 */
static void init_dequant_tables(PPS *pps, const SPS *sps)
{
    int list, pos;

    init_dequant4_coeff_table(pps, sps);
    if (pps->transform_8x8_mode)
        init_dequant8_coeff_table(pps, sps);

    if (!sps->transform_bypass)
        return;

    for (list = 0; list < 6; list++) {
        for (pos = 0; pos < 16; pos++)
            pps->dequant4_coeff[list][0][pos] = 1 << 6;
    }

    if (!pps->transform_8x8_mode)
        return;

    for (list = 0; list < 6; list++) {
        for (pos = 0; pos < 64; pos++)
            pps->dequant8_coeff[list][0][pos] = 1 << 6;
    }
}

665
static void build_qp_table(PPS *pps, int t, int index, const int depth)
666 667
{
    int i;
668 669 670 671
    const int max_qp = 51 + 6 * (depth - 8);
    for (i = 0; i < max_qp + 1; i++)
        pps->chroma_qp_table[t][i] =
            ff_h264_chroma_qp[depth - 8][av_clip(i + index, 0, max_qp)];
672 673
}

674 675
int ff_h264_decode_picture_parameter_set(GetBitContext *gb, AVCodecContext *avctx,
                                         H264ParamSets *ps, int bit_length)
676
{
677 678 679
    AVBufferRef *pps_buf;
    SPS *sps;
    unsigned int pps_id = get_ue_golomb(gb);
680
    PPS *pps;
681
    int qp_bd_offset;
682
    int bits_left;
683
    int ret;
684

685
    if (pps_id >= MAX_PPS_COUNT) {
686
        av_log(avctx, AV_LOG_ERROR, "pps_id %u out of range\n", pps_id);
687
        return AVERROR_INVALIDDATA;
688 689
    }

690 691
    pps_buf = av_buffer_allocz(sizeof(*pps));
    if (!pps_buf)
692
        return AVERROR(ENOMEM);
693 694 695
    pps = (PPS*)pps_buf->data;

    pps->sps_id = get_ue_golomb_31(gb);
696
    if ((unsigned)pps->sps_id >= MAX_SPS_COUNT ||
697 698
        !ps->sps_list[pps->sps_id]) {
        av_log(avctx, AV_LOG_ERROR, "sps_id %u out of range\n", pps->sps_id);
699
        ret = AVERROR_INVALIDDATA;
700 701
        goto fail;
    }
702
    sps = (SPS*)ps->sps_list[pps->sps_id]->data;
703 704

    if (sps->bit_depth_luma > 10) {
705 706
        avpriv_report_missing_feature(avctx, "Luma bit depth=%d (max=10)",
                                      sps->bit_depth_luma);
707 708
        ret = AVERROR_PATCHWELCOME;
        goto fail;
709
    }
710

711 712 713
    pps->cabac             = get_bits1(gb);
    pps->pic_order_present = get_bits1(gb);
    pps->slice_group_count = get_ue_golomb(gb) + 1;
714
    if (pps->slice_group_count > 1) {
715 716
        pps->mb_slice_group_map_type = get_ue_golomb(gb);
        av_log(avctx, AV_LOG_ERROR, "FMO not supported\n");
717
    }
718 719
    pps->ref_count[0] = get_ue_golomb(gb) + 1;
    pps->ref_count[1] = get_ue_golomb(gb) + 1;
720
    if (pps->ref_count[0] - 1 > 32 - 1 || pps->ref_count[1] - 1 > 32 - 1) {
721
        av_log(avctx, AV_LOG_ERROR, "reference overflow (pps)\n");
722
        ret = AVERROR_INVALIDDATA;
723 724 725
        goto fail;
    }

726 727
    qp_bd_offset = 6 * (sps->bit_depth_luma - 8);

728 729 730 731 732 733 734 735
    pps->weighted_pred                        = get_bits1(gb);
    pps->weighted_bipred_idc                  = get_bits(gb, 2);
    pps->init_qp                              = get_se_golomb(gb) + 26 + qp_bd_offset;
    pps->init_qs                              = get_se_golomb(gb) + 26 + qp_bd_offset;
    pps->chroma_qp_index_offset[0]            = get_se_golomb(gb);
    pps->deblocking_filter_parameters_present = get_bits1(gb);
    pps->constrained_intra_pred               = get_bits1(gb);
    pps->redundant_pic_cnt_present            = get_bits1(gb);
736 737

    pps->transform_8x8_mode = 0;
738
    memcpy(pps->scaling_matrix4, sps->scaling_matrix4,
739
           sizeof(pps->scaling_matrix4));
740
    memcpy(pps->scaling_matrix8, sps->scaling_matrix8,
741
           sizeof(pps->scaling_matrix8));
742

743
    bits_left = bit_length - get_bits_count(gb);
744
    if (bits_left && (bits_left > 8 ||
745 746 747
                      show_bits(gb, bits_left) != 1 << (bits_left - 1))) {
        pps->transform_8x8_mode = get_bits1(gb);
        decode_scaling_matrices(gb, sps, pps, 0,
748 749
                                pps->scaling_matrix4, pps->scaling_matrix8);
        // second_chroma_qp_index_offset
750
        pps->chroma_qp_index_offset[1] = get_se_golomb(gb);
751
    } else {
752
        pps->chroma_qp_index_offset[1] = pps->chroma_qp_index_offset[0];
753 754
    }

755
    build_qp_table(pps, 0, pps->chroma_qp_index_offset[0],
756
                   sps->bit_depth_luma);
757
    build_qp_table(pps, 1, pps->chroma_qp_index_offset[1],
758
                   sps->bit_depth_luma);
759 760 761

    init_dequant_tables(pps, sps);

762 763
    if (pps->chroma_qp_index_offset[0] != pps->chroma_qp_index_offset[1])
        pps->chroma_qp_diff = 1;
764

765 766
    if (avctx->debug & FF_DEBUG_PICT_INFO) {
        av_log(avctx, AV_LOG_DEBUG,
767
               "pps:%u sps:%u %s slice_groups:%d ref:%u/%u %s qp:%d/%d/%d/%d %s %s %s %s\n",
768 769 770 771 772 773 774 775 776
               pps_id, pps->sps_id,
               pps->cabac ? "CABAC" : "CAVLC",
               pps->slice_group_count,
               pps->ref_count[0], pps->ref_count[1],
               pps->weighted_pred ? "weighted" : "",
               pps->init_qp, pps->init_qs, pps->chroma_qp_index_offset[0], pps->chroma_qp_index_offset[1],
               pps->deblocking_filter_parameters_present ? "LPAR" : "",
               pps->constrained_intra_pred ? "CONSTR" : "",
               pps->redundant_pic_cnt_present ? "REDU" : "",
777
               pps->transform_8x8_mode ? "8x8DCT" : "");
778 779
    }

780 781 782
    remove_pps(ps, pps_id);
    ps->pps_list[pps_id] = pps_buf;

783
    return 0;
784

785
fail:
786
    av_buffer_unref(&pps_buf);
787
    return ret;
788
}