/*
 * DXVA2 H.264 HW acceleration.
 *
 * copyright (c) 2009 Laurent Aimar
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "libavutil/avassert.h"

#include "dxva2_internal.h"
#include "h264dec.h"
#include "h264data.h"
#include "h264_ps.h"
#include "mpegutils.h"

/*
 * Per-picture hardware acceleration state, stored in
 * H264Picture.hwaccel_picture_private. It is reset in
 * dxva2_h264_start_frame(), extended by every dxva2_h264_decode_slice()
 * call and consumed in dxva2_h264_end_frame().
 */
struct dxva2_picture_context {
    /* Picture parameters, filled by fill_picture_parameters() */
    DXVA_PicParams_H264   pp;
    /* Quantization matrices, filled by fill_scaling_lists() */
    DXVA_Qmatrix_H264     qm;
    /* Number of slices recorded so far (never exceeds MAX_SLICES) */
    unsigned              slice_count;
    /* Slice control entries; only one of the two arrays is used,
     * depending on is_slice_short() */
    DXVA_Slice_H264_Short slice_short[MAX_SLICES];
    DXVA_Slice_H264_Long  slice_long[MAX_SLICES];
    /* Buffer of the first slice seen for this picture; the slice positions
     * recorded in the slice control entries are relative to it */
    const uint8_t         *bitstream;
    /* Sum of the sizes of all slices submitted for this picture */
    unsigned              bitstream_size;
};

/**
 * Pack an index and a one-bit flag into a DXVA picture entry.
 *
 * The index occupies bits 0-6 of bPicEntry and the flag bit 7.
 *
 * @param pic   entry to write
 * @param index value for the low 7 bits; must fit in 7 bits
 * @param flag  value for bit 7; must be 0 or 1
 */
static void fill_picture_entry(DXVA_PicEntry_H264 *pic,
                               unsigned index, unsigned flag)
{
    /* Neither argument may carry bits outside its field. */
    assert(!(index & ~0x7fu) && !(flag & ~0x01u));
    pic->bPicEntry = (flag << 7) | index;
}

static void fill_picture_parameters(const AVCodecContext *avctx, AVDXVAContext *ctx, const H264Context *h,
L
Laurent Aimar 已提交
49 50
                                    DXVA_PicParams_H264 *pp)
{
51
    const H264Picture *current_picture = h->cur_pic_ptr;
52 53
    const SPS *sps = h->ps.sps;
    const PPS *pps = h->ps.pps;
54
    int i, j;
L
Laurent Aimar 已提交
55 56 57 58

    memset(pp, 0, sizeof(*pp));
    /* Configure current picture */
    fill_picture_entry(&pp->CurrPic,
59
                       ff_dxva2_get_surface_index(avctx, ctx, current_picture->f),
A
Anton Khirnov 已提交
60
                       h->picture_structure == PICT_BOTTOM_FIELD);
L
Laurent Aimar 已提交
61 62 63
    /* Configure the set of references */
    pp->UsedForReferenceFlags  = 0;
    pp->NonExistingFrameFlags  = 0;
64
    for (i = 0, j = 0; i < FF_ARRAY_ELEMS(pp->RefFrameList); i++) {
65
        const H264Picture *r;
66 67 68 69 70 71 72
        if (j < h->short_ref_count) {
            r = h->short_ref[j++];
        } else {
            r = NULL;
            while (!r && j < h->short_ref_count + 16)
                r = h->long_ref[j++ - h->short_ref_count];
        }
73
        if (r) {
L
Laurent Aimar 已提交
74
            fill_picture_entry(&pp->RefFrameList[i],
75
                               ff_dxva2_get_surface_index(avctx, ctx, r->f),
L
Laurent Aimar 已提交
76 77
                               r->long_ref != 0);

78
            if ((r->reference & PICT_TOP_FIELD) && r->field_poc[0] != INT_MAX)
L
Laurent Aimar 已提交
79
                pp->FieldOrderCntList[i][0] = r->field_poc[0];
80
            if ((r->reference & PICT_BOTTOM_FIELD) && r->field_poc[1] != INT_MAX)
L
Laurent Aimar 已提交
81 82 83
                pp->FieldOrderCntList[i][1] = r->field_poc[1];

            pp->FrameNumList[i] = r->long_ref ? r->pic_id : r->frame_num;
84
            if (r->reference & PICT_TOP_FIELD)
L
Laurent Aimar 已提交
85
                pp->UsedForReferenceFlags |= 1 << (2*i + 0);
86
            if (r->reference & PICT_BOTTOM_FIELD)
L
Laurent Aimar 已提交
87 88 89 90 91 92 93 94 95
                pp->UsedForReferenceFlags |= 1 << (2*i + 1);
        } else {
            pp->RefFrameList[i].bPicEntry = 0xff;
            pp->FieldOrderCntList[i][0]   = 0;
            pp->FieldOrderCntList[i][1]   = 0;
            pp->FrameNumList[i]           = 0;
        }
    }

A
Anton Khirnov 已提交
96 97
    pp->wFrameWidthInMbsMinus1        = h->mb_width  - 1;
    pp->wFrameHeightInMbsMinus1       = h->mb_height - 1;
98
    pp->num_ref_frames                = sps->ref_frame_count;
L
Laurent Aimar 已提交
99

A
Anton Khirnov 已提交
100
    pp->wBitFields                    = ((h->picture_structure != PICT_FRAME) <<  0) |
101
                                        ((sps->mb_aff &&
A
Anton Khirnov 已提交
102
                                        (h->picture_structure == PICT_FRAME)) <<  1) |
103
                                        (sps->residual_color_transform_flag   <<  2) |
104
                                        /* sp_for_switch_flag (not implemented by FFmpeg) */
L
Laurent Aimar 已提交
105
                                        (0                                    <<  3) |
106
                                        (sps->chroma_format_idc               <<  4) |
L
Laurent Aimar 已提交
107
                                        ((h->nal_ref_idc != 0)                <<  6) |
108 109 110
                                        (pps->constrained_intra_pred          <<  7) |
                                        (pps->weighted_pred                   <<  8) |
                                        (pps->weighted_bipred_idc             <<  9) |
L
Laurent Aimar 已提交
111 112
                                        /* MbsConsecutiveFlag */
                                        (1                                    << 11) |
113 114 115
                                        (sps->frame_mbs_only_flag             << 12) |
                                        (pps->transform_8x8_mode              << 13) |
                                        ((sps->level_idc >= 31)               << 14) |
L
Laurent Aimar 已提交
116
                                        /* IntraPicFlag (Modified if we detect a non
117
                                         * intra slice in dxva2_h264_decode_slice) */
L
Laurent Aimar 已提交
118 119
                                        (1                                    << 15);

120 121
    pp->bit_depth_luma_minus8         = sps->bit_depth_luma - 8;
    pp->bit_depth_chroma_minus8       = sps->bit_depth_chroma - 8;
122
    if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_SCALING_LIST_ZIGZAG)
123
        pp->Reserved16Bits            = 0;
124
    else if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO)
125
        pp->Reserved16Bits            = 0x34c;
126
    else
127
        pp->Reserved16Bits            = 3; /* FIXME is there a way to detect the right mode ? */
128
    pp->StatusReportFeedbackNumber    = 1 + DXVA_CONTEXT_REPORT_ID(avctx, ctx)++;
L
Laurent Aimar 已提交
129
    pp->CurrFieldOrderCnt[0] = 0;
A
Anton Khirnov 已提交
130
    if ((h->picture_structure & PICT_TOP_FIELD) &&
L
Laurent Aimar 已提交
131 132 133
        current_picture->field_poc[0] != INT_MAX)
        pp->CurrFieldOrderCnt[0] = current_picture->field_poc[0];
    pp->CurrFieldOrderCnt[1] = 0;
A
Anton Khirnov 已提交
134
    if ((h->picture_structure & PICT_BOTTOM_FIELD) &&
L
Laurent Aimar 已提交
135 136
        current_picture->field_poc[1] != INT_MAX)
        pp->CurrFieldOrderCnt[1] = current_picture->field_poc[1];
137 138 139
    pp->pic_init_qs_minus26           = pps->init_qs - 26;
    pp->chroma_qp_index_offset        = pps->chroma_qp_index_offset[0];
    pp->second_chroma_qp_index_offset = pps->chroma_qp_index_offset[1];
L
Laurent Aimar 已提交
140
    pp->ContinuationFlag              = 1;
141 142 143
    pp->pic_init_qp_minus26           = pps->init_qp - 26;
    pp->num_ref_idx_l0_active_minus1  = pps->ref_count[0] - 1;
    pp->num_ref_idx_l1_active_minus1  = pps->ref_count[1] - 1;
L
Laurent Aimar 已提交
144
    pp->Reserved8BitsA                = 0;
145
    pp->frame_num                     = h->poc.frame_num;
146 147 148 149 150 151 152 153 154 155 156 157 158
    pp->log2_max_frame_num_minus4     = sps->log2_max_frame_num - 4;
    pp->pic_order_cnt_type            = sps->poc_type;
    if (sps->poc_type == 0)
        pp->log2_max_pic_order_cnt_lsb_minus4 = sps->log2_max_poc_lsb - 4;
    else if (sps->poc_type == 1)
        pp->delta_pic_order_always_zero_flag = sps->delta_pic_order_always_zero_flag;
    pp->direct_8x8_inference_flag     = sps->direct_8x8_inference_flag;
    pp->entropy_coding_mode_flag      = pps->cabac;
    pp->pic_order_present_flag        = pps->pic_order_present;
    pp->num_slice_groups_minus1       = pps->slice_group_count - 1;
    pp->slice_group_map_type          = pps->mb_slice_group_map_type;
    pp->deblocking_filter_control_present_flag = pps->deblocking_filter_parameters_present;
    pp->redundant_pic_cnt_present_flag= pps->redundant_pic_cnt_present;
L
Laurent Aimar 已提交
159
    pp->Reserved8BitsB                = 0;
160 161
    pp->slice_group_change_rate_minus1= 0;  /* XXX not implemented by FFmpeg */
    //pp->SliceGroupMap[810];               /* XXX not implemented by FFmpeg */
L
Laurent Aimar 已提交
162 163
}

164
/**
 * Fill a DXVA_Qmatrix_H264 structure from the active PPS.
 *
 * All six 4x4 lists are copied; the two 8x8 lists are taken from
 * scaling_matrix8[0] and scaling_matrix8[3]. When the
 * FF_DXVA2_WORKAROUND_SCALING_LIST_ZIGZAG workaround is set the
 * coefficients are copied in stored order, otherwise they are read
 * through ff_zigzag_scan (4x4) and ff_zigzag_direct (8x8).
 *
 * @param avctx codec context
 * @param ctx   DXVA context holding the workaround flags
 * @param h     H.264 decoder context to read the PPS from
 * @param qm    quantization matrices to fill
 */
static void fill_scaling_lists(const AVCodecContext *avctx, AVDXVAContext *ctx, const H264Context *h, DXVA_Qmatrix_H264 *qm)
{
    const PPS *pps = h->ps.pps;
    unsigned list, pos;
    int stored_order;

    memset(qm, 0, sizeof(*qm));

    stored_order = !!(DXVA_CONTEXT_WORKAROUND(avctx, ctx) &
                      FF_DXVA2_WORKAROUND_SCALING_LIST_ZIGZAG);

    for (list = 0; list < 6; list++) {
        for (pos = 0; pos < 16; pos++) {
            const unsigned src = stored_order ? pos : ff_zigzag_scan[pos];

            qm->bScalingLists4x4[list][pos] = pps->scaling_matrix4[list][src];
        }
    }

    for (pos = 0; pos < 64; pos++) {
        const unsigned src = stored_order ? pos : ff_zigzag_direct[pos];

        qm->bScalingLists8x8[0][pos] = pps->scaling_matrix8[0][src];
        qm->bScalingLists8x8[1][pos] = pps->scaling_matrix8[3][src];
    }
}

/**
 * Tell which slice control structure the decoder configuration selects.
 *
 * The configured bitstream mode is expected to be 1 or 2.
 *
 * @return 1 when the mode is 2 (short slice control structures),
 *         0 otherwise (long slice control structures)
 */
static int is_slice_short(const AVCodecContext *avctx, AVDXVAContext *ctx)
{
    assert(DXVA_CONTEXT_CFG_BITSTREAM(avctx, ctx) == 1 ||
           DXVA_CONTEXT_CFG_BITSTREAM(avctx, ctx) == 2);

    if (DXVA_CONTEXT_CFG_BITSTREAM(avctx, ctx) == 2)
        return 1;
    return 0;
}

/**
 * Initialize a short slice control entry.
 *
 * @param slice    entry to fill; it is zeroed first
 * @param position offset of the slice data, stored in BSNALunitDataLocation
 * @param size     size of the slice data in bytes, stored in SliceBytesInBuffer
 */
static void fill_slice_short(DXVA_Slice_H264_Short *slice,
                             unsigned position, unsigned size)
{
    memset(slice, 0, sizeof *slice);

    slice->wBadSliceChopping     = 0;
    slice->SliceBytesInBuffer    = size;
    slice->BSNALunitDataLocation = position;
}

/**
 * Look up a surface index in the reference frame list of the picture
 * parameters.
 *
 * Only the low 7 bits of each entry are compared.
 *
 * @param pp            picture parameters holding RefFrameList
 * @param surface_index surface index to search for
 * @return position of the first matching entry, or 0x7f when none matches
 */
static int get_refpic_index(const DXVA_PicParams_H264 *pp, int surface_index)
{
    int pos = 0;

    while (pos < FF_ARRAY_ELEMS(pp->RefFrameList)) {
        if ((pp->RefFrameList[pos].bPicEntry & 0x7f) == surface_index)
            return pos;
        pos++;
    }
    return 0x7f;
}

static void fill_slice_long(AVCodecContext *avctx, DXVA_Slice_H264_Long *slice,
217
                            const DXVA_PicParams_H264 *pp, unsigned position, unsigned size)
L
Laurent Aimar 已提交
218
{
219
    const H264Context *h = avctx->priv_data;
220
    H264SliceContext *sl = &h->slice_ctx[0];
W
wm4 已提交
221
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
L
Laurent Aimar 已提交
222 223 224 225 226 227 228
    unsigned list;

    memset(slice, 0, sizeof(*slice));
    slice->BSNALunitDataLocation = position;
    slice->SliceBytesInBuffer    = size;
    slice->wBadSliceChopping     = 0;

229
    slice->first_mb_in_slice     = (sl->mb_y >> FIELD_OR_MBAFF_PICTURE(h)) * h->mb_width + sl->mb_x;
L
Laurent Aimar 已提交
230
    slice->NumMbsForSlice        = 0; /* XXX it is set once we have all slices */
231
    slice->BitOffsetToSliceData  = get_bits_count(&sl->gb) - 8;
232 233
    slice->slice_type            = ff_h264_get_slice_type(sl);
    if (sl->slice_type_fixed)
L
Laurent Aimar 已提交
234
        slice->slice_type += 5;
235 236
    slice->luma_log2_weight_denom       = sl->pwt.luma_log2_weight_denom;
    slice->chroma_log2_weight_denom     = sl->pwt.chroma_log2_weight_denom;
237 238 239 240
    if (sl->list_count > 0)
        slice->num_ref_idx_l0_active_minus1 = sl->ref_count[0] - 1;
    if (sl->list_count > 1)
        slice->num_ref_idx_l1_active_minus1 = sl->ref_count[1] - 1;
241 242
    slice->slice_alpha_c0_offset_div2   = sl->slice_alpha_c0_offset / 2;
    slice->slice_beta_offset_div2       = sl->slice_beta_offset     / 2;
L
Laurent Aimar 已提交
243 244 245 246 247
    slice->Reserved8Bits                = 0;

    for (list = 0; list < 2; list++) {
        unsigned i;
        for (i = 0; i < FF_ARRAY_ELEMS(slice->RefPicList[list]); i++) {
248
            if (list < sl->list_count && i < sl->ref_count[list]) {
249
                const H264Picture *r = sl->ref_list[list][i].parent;
L
Laurent Aimar 已提交
250
                unsigned plane;
251
                unsigned index;
252 253
                if (DXVA_CONTEXT_WORKAROUND(avctx, ctx) & FF_DXVA2_WORKAROUND_INTEL_CLEARVIDEO)
                    index = ff_dxva2_get_surface_index(avctx, ctx, r->f);
254
                else
255
                    index = get_refpic_index(pp, ff_dxva2_get_surface_index(avctx, ctx, r->f));
256
                fill_picture_entry(&slice->RefPicList[list][i], index,
257
                                   sl->ref_list[list][i].reference == PICT_BOTTOM_FIELD);
L
Laurent Aimar 已提交
258 259
                for (plane = 0; plane < 3; plane++) {
                    int w, o;
260 261 262 263 264 265
                    if (plane == 0 && sl->pwt.luma_weight_flag[list]) {
                        w = sl->pwt.luma_weight[i][list][0];
                        o = sl->pwt.luma_weight[i][list][1];
                    } else if (plane >= 1 && sl->pwt.chroma_weight_flag[list]) {
                        w = sl->pwt.chroma_weight[i][list][plane-1][0];
                        o = sl->pwt.chroma_weight[i][list][plane-1][1];
L
Laurent Aimar 已提交
266
                    } else {
267 268
                        w = 1 << (plane == 0 ? sl->pwt.luma_log2_weight_denom :
                                               sl->pwt.chroma_log2_weight_denom);
L
Laurent Aimar 已提交
269 270 271 272 273 274 275 276 277 278 279 280 281 282 283
                        o = 0;
                    }
                    slice->Weights[list][i][plane][0] = w;
                    slice->Weights[list][i][plane][1] = o;
                }
            } else {
                unsigned plane;
                slice->RefPicList[list][i].bPicEntry = 0xff;
                for (plane = 0; plane < 3; plane++) {
                    slice->Weights[list][i][plane][0] = 0;
                    slice->Weights[list][i][plane][1] = 0;
                }
            }
        }
    }
284
    slice->slice_qs_delta    = 0; /* XXX not implemented by FFmpeg */
285
    slice->slice_qp_delta    = sl->qscale - h->ps.pps->init_qp;
286
    slice->redundant_pic_cnt = sl->redundant_pic_count;
287
    if (sl->slice_type == AV_PICTURE_TYPE_B)
288
        slice->direct_spatial_mv_pred_flag = sl->direct_spatial_mv_pred;
289
    slice->cabac_init_idc = h->ps.pps->cabac ? sl->cabac_init_idc : 0;
290 291
    if (sl->deblocking_filter < 2)
        slice->disable_deblocking_filter_idc = 1 - sl->deblocking_filter;
L
Laurent Aimar 已提交
292
    else
293
        slice->disable_deblocking_filter_idc = sl->deblocking_filter;
L
Laurent Aimar 已提交
294 295 296 297
    slice->slice_id = h->current_slice - 1;
}

/**
 * Build the bitstream buffer of the current picture and commit it together
 * with the slice control buffer.
 *
 * Each recorded slice is copied into the decoder bitstream buffer behind a
 * 3 byte start code, and its slice control entry is updated to the new
 * location and size. For long slice control entries NumMbsForSlice is
 * computed as well. The data is then zero padded towards a multiple of
 * 128 bytes; the padding is accounted to the last slice.
 *
 * @param avctx codec context
 * @param bs    buffer descriptor filled for the bitstream buffer
 * @param sc    buffer descriptor passed to ff_dxva2_commit_buffer() for the
 *              slice control buffer
 * @return -1 if a decoder buffer cannot be obtained or released, or if the
 *         slices do not fit in it; otherwise the return value of
 *         ff_dxva2_commit_buffer()
 */
static int commit_bitstream_and_slice_buffer(AVCodecContext *avctx,
                                             DECODER_BUFFER_DESC *bs,
                                             DECODER_BUFFER_DESC *sc)
{
    const H264Context *h = avctx->priv_data;
    const unsigned mb_count = h->mb_width * h->mb_height;
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    const H264Picture *current_picture = h->cur_pic_ptr;
    struct dxva2_picture_context *ctx_pic = current_picture->hwaccel_picture_private;
    DXVA_Slice_H264_Short *slice = NULL;
    void     *dxva_data_ptr = NULL;
    uint8_t  *dxva_data, *current, *end;
    unsigned dxva_size = 0;
    void     *slice_data;
    unsigned slice_size;
    unsigned padding;
    unsigned i;
    /* Only assigned inside the backend branches below; initialized so that
     * it never holds an indeterminate value when none of them is taken */
    unsigned type = 0;

    /* Create an annex B bitstream buffer with only slice NAL and finalize slice */
#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx)) {
        type = D3D11_VIDEO_DECODER_BUFFER_BITSTREAM;
        if (FAILED(ID3D11VideoContext_GetDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context,
                                                       D3D11VA_CONTEXT(ctx)->decoder,
                                                       type,
                                                       &dxva_size, &dxva_data_ptr)))
            return -1;
    }
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
        type = DXVA2_BitStreamDateBufferType;
        if (FAILED(IDirectXVideoDecoder_GetBuffer(DXVA2_CONTEXT(ctx)->decoder,
                                                  type,
                                                  &dxva_data_ptr, &dxva_size)))
            return -1;
    }
#endif

    dxva_data = dxva_data_ptr;
    current = dxva_data;
    end = dxva_data + dxva_size;

    for (i = 0; i < ctx_pic->slice_count; i++) {
        static const uint8_t start_code[] = { 0, 0, 1 };
        static const unsigned start_code_size = sizeof(start_code);
        unsigned position, size;

        /* The location and size fields are accessed through the short
         * structure for both slice formats, so the offsets must agree */
        assert(offsetof(DXVA_Slice_H264_Short, BSNALunitDataLocation) ==
               offsetof(DXVA_Slice_H264_Long,  BSNALunitDataLocation));
        assert(offsetof(DXVA_Slice_H264_Short, SliceBytesInBuffer) ==
               offsetof(DXVA_Slice_H264_Long,  SliceBytesInBuffer));

        if (is_slice_short(avctx, ctx))
            slice = &ctx_pic->slice_short[i];
        else
            slice = (DXVA_Slice_H264_Short*)&ctx_pic->slice_long[i];

        position = slice->BSNALunitDataLocation;
        size     = slice->SliceBytesInBuffer;
        if (start_code_size + size > end - current) {
            /* Leaving the loop early keeps i < slice_count, which is
             * reported as an error once the buffer has been released */
            av_log(avctx, AV_LOG_ERROR, "Failed to build bitstream\n");
            break;
        }

        slice->BSNALunitDataLocation = current - dxva_data;
        slice->SliceBytesInBuffer    = start_code_size + size;

        if (!is_slice_short(avctx, ctx)) {
            DXVA_Slice_H264_Long *slice_long = (DXVA_Slice_H264_Long*)slice;
            /* A slice extends to the first macroblock of the next slice,
             * the last one to the end of the picture */
            if (i < ctx_pic->slice_count - 1)
                slice_long->NumMbsForSlice =
                    slice_long[1].first_mb_in_slice - slice_long[0].first_mb_in_slice;
            else
                slice_long->NumMbsForSlice = mb_count - slice_long->first_mb_in_slice;
        }

        memcpy(current, start_code, start_code_size);
        current += start_code_size;

        memcpy(current, &ctx_pic->bitstream[position], size);
        current += size;
    }
    /* Zero padding up to the next multiple of 128 bytes, limited by the
     * space left in the buffer */
    padding = FFMIN(128 - ((current - dxva_data) & 127), end - current);
    if (slice && padding > 0) {
        memset(current, 0, padding);
        current += padding;

        slice->SliceBytesInBuffer += padding;
    }
#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx))
        if (FAILED(ID3D11VideoContext_ReleaseDecoderBuffer(D3D11VA_CONTEXT(ctx)->video_context, D3D11VA_CONTEXT(ctx)->decoder, type)))
            return -1;
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD)
        if (FAILED(IDirectXVideoDecoder_ReleaseBuffer(DXVA2_CONTEXT(ctx)->decoder, type)))
            return -1;
#endif
    if (i < ctx_pic->slice_count)
        return -1;

    /* Describe the bitstream buffer, then switch type to the slice control
     * buffer type for the commit below */
#if CONFIG_D3D11VA
    if (ff_dxva2_is_d3d11(avctx)) {
        D3D11_VIDEO_DECODER_BUFFER_DESC *dsc11 = bs;
        memset(dsc11, 0, sizeof(*dsc11));
        dsc11->BufferType           = type;
        dsc11->DataSize             = current - dxva_data;
        dsc11->NumMBsInBuffer       = mb_count;

        type = D3D11_VIDEO_DECODER_BUFFER_SLICE_CONTROL;

        av_assert0((dsc11->DataSize & 127) == 0);
    }
#endif
#if CONFIG_DXVA2
    if (avctx->pix_fmt == AV_PIX_FMT_DXVA2_VLD) {
        DXVA2_DecodeBufferDesc *dsc2 = bs;
        memset(dsc2, 0, sizeof(*dsc2));
        dsc2->CompressedBufferType = type;
        dsc2->DataSize             = current - dxva_data;
        dsc2->NumMBsInBuffer       = mb_count;

        type = DXVA2_SliceControlBufferType;

        av_assert0((dsc2->DataSize & 127) == 0);
    }
#endif

    if (is_slice_short(avctx, ctx)) {
        slice_data = ctx_pic->slice_short;
        slice_size = ctx_pic->slice_count * sizeof(*ctx_pic->slice_short);
    } else {
        slice_data = ctx_pic->slice_long;
        slice_size = ctx_pic->slice_count * sizeof(*ctx_pic->slice_long);
    }
    return ff_dxva2_commit_buffer(avctx, ctx, sc,
                                  type,
                                  slice_data, slice_size, mb_count);
}


/**
 * start_frame callback: prepare the per-picture state for a new picture.
 *
 * Fills the picture parameters and the quantization matrices, then resets
 * the slice and bitstream bookkeeping. The buffer and size arguments are
 * not used.
 *
 * @return 0 on success, -1 when the DXVA context is not valid
 */
static int dxva2_h264_start_frame(AVCodecContext *avctx,
                                  av_unused const uint8_t *buffer,
                                  av_unused uint32_t size)
{
    const H264Context *h = avctx->priv_data;
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    struct dxva2_picture_context *ctx_pic =
        h->cur_pic_ptr->hwaccel_picture_private;

    if (!DXVA_CONTEXT_VALID(avctx, ctx))
        return -1;
    assert(ctx_pic);

    /* DXVA_PicParams_H264, then DXVA_Qmatrix_H264 */
    fill_picture_parameters(avctx, ctx, h, &ctx_pic->pp);
    fill_scaling_lists(avctx, ctx, h, &ctx_pic->qm);

    /* No slice has been recorded for this picture yet */
    ctx_pic->bitstream      = NULL;
    ctx_pic->bitstream_size = 0;
    ctx_pic->slice_count    = 0;

    return 0;
}

/**
 * decode_slice callback: record one slice of the current picture.
 *
 * The first slice buffer becomes the bitstream base; the position of every
 * slice is stored relative to it. A short or long slice control entry is
 * filled depending on is_slice_short(). IntraPicFlag is cleared in the
 * picture parameters as soon as a slice that is neither I nor SI is seen.
 *
 * @param avctx  codec context
 * @param buffer slice data
 * @param size   size of the slice data in bytes
 * @return 0 on success, -1 when MAX_SLICES slices are already recorded
 */
static int dxva2_h264_decode_slice(AVCodecContext *avctx,
                                   const uint8_t *buffer,
                                   uint32_t size)
{
    const H264Context *h = avctx->priv_data;
    const H264SliceContext *sl = &h->slice_ctx[0];
    AVDXVAContext *ctx = DXVA_CONTEXT(avctx);
    const H264Picture *current_picture = h->cur_pic_ptr;
    struct dxva2_picture_context *ctx_pic = current_picture->hwaccel_picture_private;
    unsigned offset;

    if (ctx_pic->slice_count >= MAX_SLICES)
        return -1;

    if (!ctx_pic->bitstream)
        ctx_pic->bitstream = buffer;
    ctx_pic->bitstream_size += size;

    offset = buffer - ctx_pic->bitstream;

    if (is_slice_short(avctx, ctx)) {
        fill_slice_short(&ctx_pic->slice_short[ctx_pic->slice_count],
                         offset, size);
    } else {
        fill_slice_long(avctx, &ctx_pic->slice_long[ctx_pic->slice_count],
                        &ctx_pic->pp, offset, size);
    }
    ctx_pic->slice_count++;

    if (!(sl->slice_type == AV_PICTURE_TYPE_I ||
          sl->slice_type == AV_PICTURE_TYPE_SI))
        ctx_pic->pp.wBitFields &= ~(1 << 15); /* Set IntraPicFlag to 0 */

    return 0;
}

/**
 * end_frame callback: submit the recorded picture to the decoder.
 *
 * @return -1 when no slice or no bitstream data was recorded, otherwise the
 *         return value of ff_dxva2_common_end_frame(); when that is 0 the
 *         whole picture height is passed to ff_h264_draw_horiz_band()
 */
static int dxva2_h264_end_frame(AVCodecContext *avctx)
{
    H264Context *h = avctx->priv_data;
    H264SliceContext *sl = &h->slice_ctx[0];
    struct dxva2_picture_context *ctx_pic =
        h->cur_pic_ptr->hwaccel_picture_private;
    int err;

    /* Both counters are unsigned, so "nothing recorded" means zero */
    if (ctx_pic->slice_count == 0 || ctx_pic->bitstream_size == 0)
        return -1;

    err = ff_dxva2_common_end_frame(avctx, h->cur_pic_ptr->f,
                                    &ctx_pic->pp, sizeof(ctx_pic->pp),
                                    &ctx_pic->qm, sizeof(ctx_pic->qm),
                                    commit_bitstream_and_slice_buffer);
    if (err)
        return err;

    ff_h264_draw_horiz_band(h, sl, 0, h->avctx->height);
    return 0;
}

#if CONFIG_H264_DXVA2_HWACCEL
/* H.264 hardware acceleration producing AV_PIX_FMT_DXVA2_VLD frames */
const AVHWAccel ff_h264_dxva2_hwaccel = {
    /* Identification */
    .name                 = "h264_dxva2",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_H264,
    .pix_fmt              = AV_PIX_FMT_DXVA2_VLD,
    /* Private storage */
    .priv_data_size       = sizeof(FFDXVASharedContext),
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    /* Setup and teardown */
    .init                 = ff_dxva2_decode_init,
    .uninit               = ff_dxva2_decode_uninit,
    .frame_params         = ff_dxva2_common_frame_params,
    /* Per-picture callbacks */
    .start_frame          = dxva2_h264_start_frame,
    .decode_slice         = dxva2_h264_decode_slice,
    .end_frame            = dxva2_h264_end_frame,
};
#endif

#if CONFIG_H264_D3D11VA_HWACCEL
/* H.264 hardware acceleration producing AV_PIX_FMT_D3D11VA_VLD frames */
const AVHWAccel ff_h264_d3d11va_hwaccel = {
    /* Identification */
    .name                 = "h264_d3d11va",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_H264,
    .pix_fmt              = AV_PIX_FMT_D3D11VA_VLD,
    /* Private storage */
    .priv_data_size       = sizeof(FFDXVASharedContext),
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    /* Setup and teardown */
    .init                 = ff_dxva2_decode_init,
    .uninit               = ff_dxva2_decode_uninit,
    .frame_params         = ff_dxva2_common_frame_params,
    /* Per-picture callbacks */
    .start_frame          = dxva2_h264_start_frame,
    .decode_slice         = dxva2_h264_decode_slice,
    .end_frame            = dxva2_h264_end_frame,
};
#endif

#if CONFIG_H264_D3D11VA2_HWACCEL
/* H.264 hardware acceleration producing AV_PIX_FMT_D3D11 frames */
const AVHWAccel ff_h264_d3d11va2_hwaccel = {
    /* Identification */
    .name                 = "h264_d3d11va2",
    .type                 = AVMEDIA_TYPE_VIDEO,
    .id                   = AV_CODEC_ID_H264,
    .pix_fmt              = AV_PIX_FMT_D3D11,
    /* Private storage */
    .priv_data_size       = sizeof(FFDXVASharedContext),
    .frame_priv_data_size = sizeof(struct dxva2_picture_context),
    /* Setup and teardown */
    .init                 = ff_dxva2_decode_init,
    .uninit               = ff_dxva2_decode_uninit,
    .frame_params         = ff_dxva2_common_frame_params,
    /* Per-picture callbacks */
    .start_frame          = dxva2_h264_start_frame,
    .decode_slice         = dxva2_h264_decode_slice,
    .end_frame            = dxva2_h264_end_frame,
};
#endif