FFmpeg  4.0
qsvenc_h264.c
Go to the documentation of this file.
1 /*
2  * Intel MediaSDK QSV based H.264 encoder
3  *
4  * copyright (c) 2013 Yukinori Yamazoe
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 
24 #include <stdint.h>
25 #include <sys/types.h>
26 
27 #include <mfx/mfxvideo.h>
28 
29 #include "libavutil/common.h"
30 #include "libavutil/opt.h"
31 
32 #include "avcodec.h"
33 #include "internal.h"
34 #include "qsv.h"
35 #include "qsv_internal.h"
36 #include "qsvenc.h"
37 
38 typedef struct QSVH264EncContext { /* private context of the h264_qsv encoder; its size is passed as .priv_data_size and it is reached through avctx->priv_data */
39  AVClass *class; /* NOTE(review): lines 40-41 are absent from this listing; the index places the member `QSVEncContext qsv` at line 40 */
42 
44  const AVFrame *frame, mfxEncodeCtrl* enc_ctrl)
45 {
46  QSVH264EncContext *qh264 = avctx->priv_data;
47  QSVEncContext *q = &qh264->qsv;
48  /* Body of qsv_h264_set_encode_ctrl() (the line opening its signature, 43, is absent from this listing). When the a53_cc setting is non-zero and a frame is given, an A53 SEI message is requested from ff_alloc_a53_sei() and attached to enc_ctrl as its only payload. Returns the ff_alloc_a53_sei() result if that call fails or yields no payload, otherwise 0. */
49  if (q->a53_cc && frame) {
50  mfxPayload* payload;
51  mfxU8* sei_data;
52  size_t sei_size;
53  int res;
54  /* The prefix length reserves room for the mfxPayload structure plus the two header bytes written below. */
55  res = ff_alloc_a53_sei(frame, sizeof(mfxPayload) + 2, (void**)&payload, &sei_size);
56  if (res < 0 || !payload)
57  return res;
58  /* The SEI bytes start directly behind the mfxPayload structure in the same allocation. */
59  sei_data = (mfxU8*)(payload + 1);
60  // SEI header
61  sei_data[0] = 4;
62  sei_data[1] = (mfxU8)sei_size; // size of SEI data
63  // SEI data filled in by ff_alloc_a53_sei
64  /* NOTE(review): the (mfxU8) cast keeps only the low 8 bits of sei_size -- confirm sei_size can never exceed 255. */
65  payload->BufSize = sei_size + 2;
66  payload->NumBit = payload->BufSize * 8;
67  payload->Type = 4;
68  payload->Data = sei_data;
69  /* Hand over exactly one payload and no extended parameter buffers. Assumes enc_ctrl->Payload has room for one entry and that the caller releases payload later -- neither is visible here, TODO confirm. */
70  enc_ctrl->NumExtParam = 0;
71  enc_ctrl->NumPayload = 1;
72  enc_ctrl->Payload[0] = payload;
73  }
74  return 0;
75 }
76 
78 {
79  QSVH264EncContext *q = avctx->priv_data;
80  /* Body of qsv_enc_init() (signature line 77 and line 81 are absent from this listing): forwards to ff_qsv_enc_init() with the embedded QSVEncContext and returns its result. NOTE(review): the index lists set_encode_ctrl_cb (qsvenc.h:171); the missing line 81 presumably installs qsv_h264_set_encode_ctrl there -- confirm against the upstream file. */
82  return ff_qsv_enc_init(avctx, &q->qsv);
83 }
84 
86  const AVFrame *frame, int *got_packet)
87 {
88  QSVH264EncContext *q = avctx->priv_data;
89  /* Body of qsv_enc_frame() (the line opening its signature, 85, is absent from this listing): passes pkt, frame and got_packet unchanged to ff_qsv_encode() together with the embedded QSVEncContext and returns its result. */
90  return ff_qsv_encode(avctx, &q->qsv, pkt, frame, got_packet);
91 }
92 
94 {
95  QSVH264EncContext *q = avctx->priv_data;
96  /* Body of qsv_enc_close() (signature line 93 is absent from this listing): forwards to ff_qsv_enc_close() with the embedded QSVEncContext and returns its result. */
97  return ff_qsv_enc_close(avctx, &q->qsv);
98 }
99 
100 #define OFFSET(x) offsetof(QSVH264EncContext, x) /* byte offset of member x inside the encoder's private context */
101 #define VE (AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM) /* flags shared by every option below; parenthesized so the expansion stays one operand in any expression */
102 static const AVOption options[] = {
104  /* AVOption table of the h264_qsv encoder; each entry stores into a field of the embedded QSVEncContext via OFFSET(qsv.*). NOTE(review): line 103 is absent from this listing; the index references QSV_COMMON_OPTS (qsvenc.h:69), which presumably belongs here -- confirm against the upstream file. */
105  { "cavlc", "Enable CAVLC", OFFSET(qsv.cavlc), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VE },
106  { "idr_interval", "Distance (in I-frames) between IDR frames", OFFSET(qsv.idr_interval), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE },
107  { "pic_timing_sei", "Insert picture timing SEI with pic_struct_syntax element", OFFSET(qsv.pic_timing_sei), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, VE },
108  { "single_sei_nal_unit", "Put all the SEI messages into one NALU", OFFSET(qsv.single_sei_nal_unit), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
109  { "max_dec_frame_buffering", "Maximum number of frames buffered in the DPB", OFFSET(qsv.max_dec_frame_buffering), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, UINT16_MAX, VE },
110  /* Look-ahead options; present only when QSV_HAVE_LA / QSV_HAVE_LA_DS are non-zero. */
111 #if QSV_HAVE_LA
112  { "look_ahead", "Use VBR algorithm with look ahead", OFFSET(qsv.look_ahead), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VE },
113  { "look_ahead_depth", "Depth of look ahead in number frames", OFFSET(qsv.look_ahead_depth), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 100, VE },
114 #endif
115 #if QSV_HAVE_LA_DS
116  { "look_ahead_downsampling", "Downscaling factor for the frames saved for the lookahead analysis", OFFSET(qsv.look_ahead_downsampling),
117  AV_OPT_TYPE_INT, { .i64 = MFX_LOOKAHEAD_DS_UNKNOWN }, MFX_LOOKAHEAD_DS_UNKNOWN, MFX_LOOKAHEAD_DS_4x, VE, "look_ahead_downsampling" }, /* upper bound is DS_4x so that the "4x" constant below falls inside the accepted range */
118  { "unknown" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_UNKNOWN }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
119  { "auto" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_UNKNOWN }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
120  { "off" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_OFF }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
121  { "2x" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_2x }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
122  { "4x" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_4x }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
123 #endif
124  /* Intra-refresh and recovery-point options; "none" and "vertical" are named values for int_ref_type. */
125  { "int_ref_type", "Intra refresh type", OFFSET(qsv.int_ref_type), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, UINT16_MAX, VE, "int_ref_type" },
126  { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, .flags = VE, "int_ref_type" },
127  { "vertical", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, .flags = VE, "int_ref_type" },
128  { "int_ref_cycle_size", "Number of frames in the intra refresh cycle", OFFSET(qsv.int_ref_cycle_size), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, UINT16_MAX, VE },
129  { "int_ref_qp_delta", "QP difference for the refresh MBs", OFFSET(qsv.int_ref_qp_delta), AV_OPT_TYPE_INT, { .i64 = INT16_MIN }, INT16_MIN, INT16_MAX, VE },
130  { "recovery_point_sei", "Insert recovery point SEI messages", OFFSET(qsv.recovery_point_sei), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
131  /* Trellis quantization is a flags option; the named constants are the MFX_TRELLIS_* values. */
132  { "trellis", "Trellis quantization", OFFSET(qsv.trellis), AV_OPT_TYPE_FLAGS, { .i64 = 0 }, 0, UINT_MAX, VE, "trellis" },
133  { "off", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TRELLIS_OFF }, .flags = VE, "trellis" },
134  { "I", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TRELLIS_I }, .flags = VE, "trellis" },
135  { "P", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TRELLIS_P }, .flags = VE, "trellis" },
136  { "B", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TRELLIS_B }, .flags = VE, "trellis" },
137  /* Profile selection by name; the values are the MFX_PROFILE_* constants. */
138  { "profile", NULL, OFFSET(qsv.profile), AV_OPT_TYPE_INT, { .i64 = MFX_PROFILE_UNKNOWN }, 0, INT_MAX, VE, "profile" },
139  { "unknown" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_UNKNOWN }, INT_MIN, INT_MAX, VE, "profile" },
140  { "baseline", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_AVC_BASELINE }, INT_MIN, INT_MAX, VE, "profile" },
141  { "main" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_AVC_MAIN }, INT_MIN, INT_MAX, VE, "profile" },
142  { "high" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_AVC_HIGH }, INT_MIN, INT_MAX, VE, "profile" },
143 
144  { "a53cc" , "Use A53 Closed Captions (if available)", OFFSET(qsv.a53_cc), AV_OPT_TYPE_INT, {.i64 = 1}, 0, 1, VE},
145 
146  { "aud", "Insert the Access Unit Delimiter NAL", OFFSET(qsv.aud), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VE},
147 
148 #if QSV_HAVE_MF
149  { "mfmode", "Multi-Frame Mode", OFFSET(qsv.mfmode), AV_OPT_TYPE_INT, { .i64 = MFX_MF_AUTO }, 0, INT_MAX, VE },
150 #endif
151  /* An all-NULL entry terminates the table. */
152  { NULL },
153 };
154 
155 static const AVClass class = { /* AVClass describing the encoder's private context; referenced by the codec definition's .priv_class */
156  .class_name = "h264_qsv encoder",
157  .item_name = av_default_item_name,
158  .option = options, /* the option table defined above. NOTE(review): line 159 is absent from this listing; the index references LIBAVUTIL_VERSION_INT, presumably a .version initializer -- confirm */
160 };
161 
163  { "b", "1M" }, /* entries of qsv_enc_defaults[] (declaration line 162 is absent from this listing): pairs of option name and default value as strings, used through the codec definition's .defaults */
164  { "refs", "0" },
165  // same as the x264 default
166  { "g", "250" },
167  { "bf", "3" },
168 #if FF_API_CODER_TYPE
169  { "coder", "-1" },
170 #endif
171 
172  { "flags", "+cgop" },
173 #if FF_API_PRIVATE_OPT
174  { "b_strategy", "-1" },
175 #endif
176  { NULL }, /* terminating entry */
177 };
178 
180  .name = "h264_qsv", /* initializers of the AVCodec ff_h264_qsv_encoder (declaration line 179 and line 183 are absent from this listing) */
181  .long_name = NULL_IF_CONFIG_SMALL("H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10 (Intel Quick Sync Video acceleration)"),
182  .priv_data_size = sizeof(QSVH264EncContext),
184  .id = AV_CODEC_ID_H264,
185  .init = qsv_enc_init,
186  .encode2 = qsv_enc_frame,
187  .close = qsv_enc_close,
188  .capabilities = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_HYBRID, /* DELAY: needs flushing with NULL input at the end; HYBRID: potentially, but not necessarily, hardware backed */
189  .pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_NV12, /* NOTE(review): lines 190-191 are absent from this listing; the index references AV_PIX_FMT_P010 and the QSV hardware format, presumably listed there -- confirm */
192  AV_PIX_FMT_NONE },
193  .priv_class = &class,
194  .defaults = qsv_enc_defaults,
195  .caps_internal = FF_CODEC_CAP_INIT_CLEANUP, /* close may be called for deallocation even if init returned a failure */
196  .wrapper_name = "qsv",
197 };
#define FF_CODEC_CAP_INIT_CLEANUP
The codec allows calling the close function for deallocation even if the init function returned a failure.
Definition: internal.h:48
int single_sei_nal_unit
Definition: qsvenc.h:148
#define NULL
Definition: coverity.c:32
This structure describes decoded (raw) audio or video data.
Definition: frame.h:218
AVOption.
Definition: opt.h:246
int int_ref_type
Definition: qsvenc.h:160
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35
int look_ahead_depth
Definition: qsvenc.h:139
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:191
int int_ref_qp_delta
Definition: qsvenc.h:162
static AVPacket pkt
AVCodec.
Definition: avcodec.h:3408
int look_ahead
Definition: qsvenc.h:138
#define AV_PIX_FMT_P010
Definition: pixfmt.h:413
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:72
#define AV_CODEC_CAP_DELAY
Encoder or decoder requires flushing with NULL input at the end in order to give the complete and correct output.
Definition: avcodec.h:984
int ff_qsv_encode(AVCodecContext *avctx, QSVEncContext *q, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: qsvenc.c:1208
#define av_cold
Definition: attributes.h:82
AVOptions.
static const AVCodecDefault qsv_enc_defaults[]
Definition: qsvenc_h264.c:162
static AVFrame * frame
#define QSV_COMMON_OPTS
Definition: qsvenc.h:69
int ff_qsv_enc_close(AVCodecContext *avctx, QSVEncContext *q)
Definition: qsvenc.c:1277
static const AVOption options[]
Definition: qsvenc_h264.c:102
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:186
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (first byte U and the following byte V)
Definition: pixfmt.h:85
const char * name
Name of the codec implementation.
Definition: avcodec.h:3415
int max_dec_frame_buffering
Definition: qsvenc.h:149
#define MFX_LOOKAHEAD_DS_UNKNOWN
Definition: qsvenc.h:63
AVCodec ff_h264_qsv_encoder
Definition: qsvenc_h264.c:179
int idr_interval
Definition: qsvenc.h:132
int a53_cc
Definition: qsvenc.h:165
#define MFX_LOOKAHEAD_DS_OFF
Definition: qsvenc.h:64
#define MFX_LOOKAHEAD_DS_2x
Definition: qsvenc.h:65
QSVEncContext qsv
Definition: qsvenc_h264.c:40
Libavcodec external API header.
static int qsv_h264_set_encode_ctrl(AVCodecContext *avctx, const AVFrame *frame, mfxEncodeCtrl *enc_ctrl)
Definition: qsvenc_h264.c:43
main external API structure.
Definition: avcodec.h:1518
int profile
Definition: qsvenc.h:133
#define AV_CODEC_CAP_HYBRID
Codec is potentially backed by a hardware implementation, but not necessarily.
Definition: avcodec.h:1063
Describe the class of an AVClass context structure.
Definition: log.h:67
int ff_qsv_enc_init(AVCodecContext *avctx, QSVEncContext *q)
Definition: qsvenc.c:851
cl_device_type type
HW acceleration through QSV, data[3] contains a pointer to the mfxFrameSurface1 structure.
Definition: pixfmt.h:218
static int qsv_enc_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: qsvenc_h264.c:85
static enum AVPixelFormat pix_fmts[]
Definition: libkvazaar.c:266
int int_ref_cycle_size
Definition: qsvenc.h:161
static av_cold int qsv_enc_init(AVCodecContext *avctx)
Definition: qsvenc_h264.c:77
common internal api header.
common internal and external API header
#define MFX_LOOKAHEAD_DS_4x
Definition: qsvenc.h:66
void * priv_data
Definition: avcodec.h:1545
#define VE
Definition: qsvenc_h264.c:101
int recovery_point_sei
Definition: qsvenc.h:163
#define OFFSET(x)
Definition: qsvenc_h264.c:100
int ff_alloc_a53_sei(const AVFrame *frame, size_t prefix_len, void **data, size_t *sei_size)
Check AVFrame for A53 side data and allocate and fill SEI message with A53 info.
Definition: utils.c:2135
int look_ahead_downsampling
Definition: qsvenc.h:140
static av_cold int qsv_enc_close(AVCodecContext *avctx)
Definition: qsvenc_h264.c:93
int trellis
Definition: qsvenc.h:150
AVPixelFormat
Pixel format.
Definition: pixfmt.h:60
This structure stores compressed data.
Definition: avcodec.h:1407
int pic_timing_sei
Definition: qsvenc.h:137
SetEncodeCtrlCB * set_encode_ctrl_cb
Definition: qsvenc.h:171