/*
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#ifndef AVCODEC_VAAPI_ENCODE_H
#define AVCODEC_VAAPI_ENCODE_H

#include <stdint.h>

#include <va/va.h>

// va_str.h is only included when VA_CHECK_VERSION(1, 0, 0) holds.
#if VA_CHECK_VERSION(1, 0, 0)
#include <va/va_str.h>
#endif

// Hardware context declarations from libavutil.
#include "libavutil/hwcontext.h"
#include "libavutil/hwcontext_vaapi.h"

#include "avcodec.h"

// Forward declarations of structures that are defined later in this header.
struct VAAPIEncodePicture;
struct VAAPIEncodeType;

// Fixed limits used to size the arrays in the structures below.
enum {
    // Capacity of VAAPIEncodeContext.config_attributes[].
    MAX_CONFIG_ATTRIBUTES  = 4,
    // Capacity of VAAPIEncodeContext.global_params[] and
    // VAAPIEncodeContext.global_params_size[].
    MAX_GLOBAL_PARAMS      = 4,
    // Capacity of VAAPIEncodePicture.dpb[].
    MAX_DPB_SIZE           = 16,
    // Capacity of VAAPIEncodePicture.refs[].
    MAX_PICTURE_REFERENCES = 2,
    // VAAPIEncodeContext.ts_ring[] holds three times this many entries.
    MAX_REORDER_DELAY      = 16,
    // NOTE(review): not referenced in this header; presumably bounds the
    // size of parameter buffers built by the implementation - confirm.
    MAX_PARAM_BUFFER_SIZE  = 1024,
};

// Picture type identifiers (IDR, I, P and B), numbered consecutively
// from 0 to 3.
// NOTE(review): presumably the values held in VAAPIEncodePicture.type -
// confirm against the implementation.
enum {
    PICTURE_TYPE_IDR = 0,
    PICTURE_TYPE_I,
    PICTURE_TYPE_P,
    PICTURE_TYPE_B,
};

// Description of a single slice of a picture.
typedef struct VAAPIEncodeSlice {
    // Index of this slice.
    // NOTE(review): presumably its position in VAAPIEncodePicture.slices[] -
    // confirm.
    int             index;
    // First row and number of rows covered by this slice.
    // NOTE(review): units are presumably slice blocks (see
    // VAAPIEncodeContext.slice_block_width/height) - confirm.
    int             row_start;
    int             row_size;
    // First block and number of blocks covered by this slice.
    int             block_start;
    int             block_size;
    // Codec-private data associated with this slice.
    void           *priv_data;
    // Codec-specific slice parameter structure.
    // NOTE(review): presumably VAAPIEncodeType.slice_params_size bytes -
    // confirm.
    void           *codec_slice_params;
} VAAPIEncodeSlice;

typedef struct VAAPIEncodePicture {
    struct VAAPIEncodePicture *next;

    int64_t         display_order;
    int64_t         encode_order;
    int64_t         pts;
70
    int             force_idr;
71 72

    int             type;
73
    int             b_depth;
74 75 76 77 78 79 80 81 82 83
    int             encode_issued;
    int             encode_complete;

    AVFrame        *input_image;
    VASurfaceID     input_surface;

    AVFrame        *recon_image;
    VASurfaceID     recon_surface;

    int          nb_param_buffers;
84
    VABufferID     *param_buffers;
85

86
    AVBufferRef    *output_buffer_ref;
87 88 89 90 91
    VABufferID      output_buffer;

    void           *priv_data;
    void           *codec_picture_params;

92 93 94 95 96 97 98 99 100 101 102
    // Whether this picture is a reference picture.
    int             is_reference;

    // The contents of the DPB after this picture has been decoded.
    // This will contain the picture itself if it is a reference picture,
    // but not if it isn't.
    int                     nb_dpb_pics;
    struct VAAPIEncodePicture *dpb[MAX_DPB_SIZE];
    // The reference pictures used in decoding this picture.  If they are
    // used by later pictures they will also appear in the DPB.
    int                     nb_refs;
103
    struct VAAPIEncodePicture *refs[MAX_PICTURE_REFERENCES];
104 105 106 107 108 109 110 111
    // The previous reference picture in encode order.  Must be in at least
    // one of the reference list and DPB list.
    struct VAAPIEncodePicture *prev;
    // Reference count for other pictures referring to this one through
    // the above pointers, directly from incomplete pictures and indirectly
    // through completed pictures.
    int             ref_count[2];
    int             ref_removed[2];
112 113

    int          nb_slices;
114
    VAAPIEncodeSlice *slices;
115 116
} VAAPIEncodePicture;

117 118 119 120 121 122 123 124 125 126 127 128 129 130 131
typedef struct VAAPIEncodeProfile {
    // lavc profile value (FF_PROFILE_*).
    int       av_profile;
    // Supported bit depth.
    int       depth;
    // Number of components.
    int       nb_components;
    // Chroma subsampling in width dimension.
    int       log2_chroma_w;
    // Chroma subsampling in height dimension.
    int       log2_chroma_h;
    // VAAPI profile value.
    VAProfile va_profile;
} VAAPIEncodeProfile;

132 133 134 135 136 137
typedef struct VAAPIEncodeContext {
    const AVClass *class;

    // Codec-specific hooks.
    const struct VAAPIEncodeType *codec;

138 139 140 141 142
    // Global options.

    // Use low power encoding mode.
    int             low_power;

143 144 145 146 147 148
    // Number of I frames between IDR frames.
    int             idr_interval;

    // Desired B frame reference depth.
    int             desired_b_depth;

149 150
    // Desired packed headers.
    unsigned int    desired_packed_headers;
151 152 153 154 155 156 157

    // The required size of surfaces.  This is probably the input
    // size (AVCodecContext.width|height) aligned up to whatever
    // block size is required by the codec.
    int             surface_width;
    int             surface_height;

158 159 160 161
    // The block size for slice calculations.
    int             slice_block_width;
    int             slice_block_height;

162 163 164
    // Everything above this point must be set before calling
    // ff_vaapi_encode_init().

165 166 167 168 169 170 171
    // Chosen encoding profile details.
    const VAAPIEncodeProfile *profile;

    // Encoding profile (VAProfile*).
    VAProfile       va_profile;
    // Encoding entrypoint (VAEntryoint*).
    VAEntrypoint    va_entrypoint;
172 173 174 175
    // Rate control mode.
    unsigned int    va_rc_mode;
    // Bitrate for codec-specific encoder parameters.
    unsigned int    va_bit_rate;
176 177
    // Packed headers which will actually be sent.
    unsigned int    va_packed_headers;
178

179 180 181 182
    // Configuration attributes to use when creating va_config.
    VAConfigAttrib  config_attributes[MAX_CONFIG_ATTRIBUTES];
    int          nb_config_attributes;

183 184 185 186 187 188 189
    VAConfigID      va_config;
    VAContextID     va_context;

    AVBufferRef    *device_ref;
    AVHWDeviceContext *device;
    AVVAAPIDeviceContext *hwctx;

190
    // The hardware frame context containing the input frames.
191 192 193
    AVBufferRef    *input_frames_ref;
    AVHWFramesContext *input_frames;

194
    // The hardware frame context containing the reconstructed frames.
195 196 197
    AVBufferRef    *recon_frames_ref;
    AVHWFramesContext *recon_frames;

198
    // Pool of (reusable) bitstream output buffers.
199 200
    AVBufferPool   *output_buffer_pool;

201 202
    // Global parameters which will be applied at the start of the
    // sequence (includes rate control parameters below).
203 204 205 206
    VAEncMiscParameterBuffer *global_params[MAX_GLOBAL_PARAMS];
    size_t          global_params_size[MAX_GLOBAL_PARAMS];
    int          nb_global_params;

207 208 209 210 211 212 213 214 215
    // Rate control parameters.
    struct {
        VAEncMiscParameterBuffer misc;
        VAEncMiscParameterRateControl rc;
    } rc_params;
    struct {
        VAEncMiscParameterBuffer misc;
        VAEncMiscParameterHRD hrd;
    } hrd_params;
216 217 218 219
    struct {
        VAEncMiscParameterBuffer misc;
        VAEncMiscParameterFrameRate fr;
    } fr_params;
220 221 222 223 224 225
#if VA_CHECK_VERSION(0, 36, 0)
    struct {
        VAEncMiscParameterBuffer misc;
        VAEncMiscParameterBufferQualityLevel quality;
    } quality_params;
#endif
226

227 228 229 230 231
    // Per-sequence parameter structure (VAEncSequenceParameterBuffer*).
    void           *codec_sequence_params;

    // Per-sequence parameters found in the per-picture parameter
    // structure (VAEncPictureParameterBuffer*).
232
    void           *codec_picture_params;
233 234 235

    // Current encoding window, in display (input) order.
    VAAPIEncodePicture *pic_start, *pic_end;
236 237 238
    // The next picture to use as the previous reference picture in
    // encoding order.
    VAAPIEncodePicture *next_prev;
239 240 241 242 243

    // Next input order index (display order).
    int64_t         input_order;
    // Number of frames that output is behind input.
    int64_t         output_delay;
244 245
    // Next encode order index.
    int64_t         encode_order;
246 247
    // Number of frames decode output will need to be delayed.
    int64_t         decode_delay;
248
    // Next output order index (in encode order).
249 250 251 252 253 254 255
    int64_t         output_order;

    // Timestamp handling.
    int64_t         first_pts;
    int64_t         dts_pts_diff;
    int64_t         ts_ring[MAX_REORDER_DELAY * 3];

256 257 258 259 260 261
    // Slice structure.
    int slice_block_rows;
    int slice_block_cols;
    int nb_slices;
    int slice_size;

262
    // Frame type decision.
263
    int gop_size;
264 265
    int closed_gop;
    int gop_per_idr;
266
    int p_per_i;
267
    int max_b_depth;
268
    int b_per_p;
269
    int force_idr;
270
    int idr_counter;
M
Mark Thompson 已提交
271
    int gop_counter;
272 273 274
    int end_of_stream;
} VAAPIEncodeContext;

// Codec feature flags.  Each flag is a distinct bit, so they can be
// combined in VAAPIEncodeType.flags.
enum {
    // Codec supports controlling the subdivision of pictures into slices.
    FLAG_SLICE_CONTROL         = 1 << 0,
    // Codec only supports constant quality (no rate control).
    FLAG_CONSTANT_QUALITY_ONLY = 1 << 1,
    // Codec is intra-only.
    FLAG_INTRA_ONLY            = 1 << 2,
    // Codec supports B-pictures.
    FLAG_B_PICTURES            = 1 << 3,
    // Codec supports referencing B-pictures.
    FLAG_B_PICTURE_REFERENCES  = 1 << 4,
    // Codec supports non-IDR key pictures (that is, key pictures do
    // not necessarily empty the DPB).
    FLAG_NON_IDR_KEY_PICTURES  = 1 << 5,
};

291
typedef struct VAAPIEncodeType {
292 293 294 295
    // List of supported profiles and corresponding VAAPI profiles.
    // (Must end with FF_PROFILE_UNKNOWN.)
    const VAAPIEncodeProfile *profiles;

296 297 298
    // Codec feature flags.
    int flags;

299 300 301 302
    // Perform any extra codec-specific configuration after the
    // codec context is initialised (set up the private data and
    // add any necessary global parameters).
    int (*configure)(AVCodecContext *avctx);
303

304 305 306 307
    // The size of any private data structure associated with each
    // picture (can be zero if not required).
    size_t picture_priv_data_size;

308 309
    // The size of the parameter structures:
    // sizeof(VAEnc{type}ParameterBuffer{codec}).
310 311 312 313
    size_t sequence_params_size;
    size_t picture_params_size;
    size_t slice_params_size;

314
    // Fill the parameter structures.
315 316 317 318 319 320 321
    int  (*init_sequence_params)(AVCodecContext *avctx);
    int   (*init_picture_params)(AVCodecContext *avctx,
                                 VAAPIEncodePicture *pic);
    int     (*init_slice_params)(AVCodecContext *avctx,
                                 VAAPIEncodePicture *pic,
                                 VAAPIEncodeSlice *slice);

322 323
    // The type used by the packed header: this should look like
    // VAEncPackedHeader{something}.
324 325 326 327
    int sequence_header_type;
    int picture_header_type;
    int slice_header_type;

328
    // Write the packed header data to the provided buffer.
329 330
    // The sequence header is also used to fill the codec extradata
    // when the encoder is starting.
331 332 333 334 335 336 337 338 339 340
    int (*write_sequence_header)(AVCodecContext *avctx,
                                 char *data, size_t *data_len);
    int  (*write_picture_header)(AVCodecContext *avctx,
                                 VAAPIEncodePicture *pic,
                                 char *data, size_t *data_len);
    int    (*write_slice_header)(AVCodecContext *avctx,
                                 VAAPIEncodePicture *pic,
                                 VAAPIEncodeSlice *slice,
                                 char *data, size_t *data_len);

341 342 343 344
    // Fill an extra parameter structure, which will then be
    // passed to vaRenderPicture().  Will be called repeatedly
    // with increasing index argument until AVERROR_EOF is
    // returned.
345 346 347 348
    int    (*write_extra_buffer)(AVCodecContext *avctx,
                                 VAAPIEncodePicture *pic,
                                 int index, int *type,
                                 char *data, size_t *data_len);
349 350 351 352

    // Write an extra packed header.  Will be called repeatedly
    // with increasing index argument until AVERROR_EOF is
    // returned.
353 354 355 356
    int    (*write_extra_header)(AVCodecContext *avctx,
                                 VAAPIEncodePicture *pic,
                                 int index, int *type,
                                 char *data, size_t *data_len);
357 358 359 360 361 362
} VAAPIEncodeType;


// Common encoder entry points, implemented outside this header.
// NOTE(review): return values are presumably 0 on success and a negative
// AVERROR code on failure - confirm against the implementation.

// Single-call encode entry point taking an input frame and an output packet.
// NOTE(review): *got_packet is presumably set nonzero when pkt was filled -
// confirm.
int ff_vaapi_encode2(AVCodecContext *avctx, AVPacket *pkt,
                     const AVFrame *input_image, int *got_packet);

// Split entry points: submit an input frame / fetch an output packet.
int ff_vaapi_encode_send_frame(AVCodecContext *avctx, const AVFrame *frame);
int ff_vaapi_encode_receive_packet(AVCodecContext *avctx, AVPacket *pkt);

// Initialise the common encoder state.  The input fields of
// VAAPIEncodeContext must have been set before this is called.
int ff_vaapi_encode_init(AVCodecContext *avctx);
// Counterpart to ff_vaapi_encode_init().
int ff_vaapi_encode_close(AVCodecContext *avctx);


// Option table entries for the common encoder options low_power,
// idr_interval and b_depth.  The including file must provide OFFSET() and
// FLAGS, have INT_MAX and the AV_OPT_TYPE_* constants in scope, and OFFSET()
// must accept a path through a member named "common" that contains the
// low_power, idr_interval and desired_b_depth fields.
// The expansion does not end with a comma.
#define VAAPI_ENCODE_COMMON_OPTIONS \
    { "low_power", \
      "Use low-power encoding mode (only available on some platforms; " \
      "may not support all encoding features)", \
      OFFSET(common.low_power), AV_OPT_TYPE_BOOL, \
      { .i64 = 0 }, 0, 1, FLAGS }, \
    { "idr_interval", \
      "Distance (in I-frames) between IDR frames", \
      OFFSET(common.idr_interval), AV_OPT_TYPE_INT, \
      { .i64 = 0 }, 0, INT_MAX, FLAGS }, \
    { "b_depth", \
      "Maximum B-frame reference depth", \
      OFFSET(common.desired_b_depth), AV_OPT_TYPE_INT, \
      { .i64 = 1 }, 1, INT_MAX, FLAGS }

#endif /* AVCODEC_VAAPI_ENCODE_H */