1 /*
2 * Intel MediaSDK QSV based H.264 encoder
3 *
4 * copyright (c) 2013 Yukinori Yamazoe
5 *
6 * This file is part of FFmpeg.
7 *
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
12 *
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
17 *
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21 */
22
23
#include <stdint.h>
#include <sys/types.h>

#include <mfx/mfxvideo.h>

#include "libavutil/common.h"
#include "libavutil/log.h"
#include "libavutil/mem.h"
#include "libavutil/opt.h"

#include "avcodec.h"
#include "codec_internal.h"
#include "qsv.h"
#include "qsv_internal.h"
#include "qsvenc.h"
#include "atsc_a53.h"
38
39 typedef struct QSVH264EncContext {
40 AVClass *class;
41 QSVEncContext qsv;
42 } QSVH264EncContext;
43
/**
 * Encode-control callback of the H.264 QSV encoder: attaches A53 closed
 * captions to the frame as a single SEI payload.
 *
 * Does nothing unless the a53cc option is enabled and a frame is supplied.
 * Otherwise ff_alloc_a53_sei() is asked for one buffer laid out as
 *
 *     [ mfxPayload ][ 2 byte SEI header ][ SEI data ]
 *
 * where the first two parts are the prefix requested here and the SEI data
 * is filled in by ff_alloc_a53_sei(). The buffer is then installed as the
 * only payload of enc_ctrl, and enc_ctrl->NumExtParam is reset to 0.
 *
 * The SEI header written here has exactly one size byte. Caption data that
 * cannot be described by that byte is dropped with a warning instead of
 * being emitted with a truncated size field.
 *
 * @param avctx    codec context; priv_data must be a QSVH264EncContext
 * @param frame    frame about to be encoded, may be NULL
 * @param enc_ctrl encode control structure receiving the payload
 * @return 0 on success (also when there is nothing to attach or the captions
 *         were dropped), otherwise the negative error code returned by
 *         ff_alloc_a53_sei()
 *
 * NOTE(review): the installed payload is not released in this file --
 * presumably the consumer of enc_ctrl frees it; confirm against the caller.
 */
static int qsv_h264_set_encode_ctrl(AVCodecContext *avctx,
                                    const AVFrame *frame, mfxEncodeCtrl *enc_ctrl)
{
    enum {
        SEI_PAYLOAD_TYPE  = 4,    /* written to the SEI header and mfxPayload.Type */
        SEI_HEADER_SIZE   = 2,    /* one payload type byte + one payload size byte */
        SEI_MAX_BYTE_SIZE = 0xFE, /* 0xFF in the size byte is a continuation marker
                                   * in the H.264 sei_message() syntax */
    };
    QSVH264EncContext *qh264 = avctx->priv_data;
    QSVEncContext *q = &qh264->qsv;
    void *buf = NULL;
    size_t sei_size = 0;
    mfxPayload *payload;
    mfxU8 *sei_data;
    int res;

    if (!q->a53_cc || !frame)
        return 0;

    /* A real void* temporary avoids punning an mfxPayload* through void**. */
    res = ff_alloc_a53_sei(frame, sizeof(*payload) + SEI_HEADER_SIZE,
                           &buf, &sei_size);
    if (res < 0 || !buf)
        return res;

    if (sei_size > SEI_MAX_BYTE_SIZE) {
        /* Casting to mfxU8 would silently truncate the size and make the SEI
         * header disagree with BufSize/NumBit below. */
        av_log(avctx, AV_LOG_WARNING,
               "A53 closed caption data is too large for a single SEI size byte, "
               "dropping it for this frame\n");
        /* Assumes the buffer comes from the libavutil allocator, as the
         * ff_alloc_a53_sei() contract describes. */
        av_free(buf);
        return 0;
    }

    payload  = buf;
    sei_data = (mfxU8 *)(payload + 1); /* header starts right after the struct */

    /* SEI header; the SEI data behind it was filled in by ff_alloc_a53_sei(). */
    sei_data[0] = SEI_PAYLOAD_TYPE;
    sei_data[1] = (mfxU8)sei_size;

    payload->BufSize = sei_size + SEI_HEADER_SIZE;
    payload->NumBit  = payload->BufSize * 8;
    payload->Type    = SEI_PAYLOAD_TYPE;
    payload->Data    = sei_data;

    enc_ctrl->NumExtParam = 0;
    enc_ctrl->NumPayload  = 1;
    enc_ctrl->Payload[0]  = payload;

    return 0;
}
77
qsv_enc_init(AVCodecContext * avctx)78 static av_cold int qsv_enc_init(AVCodecContext *avctx)
79 {
80 QSVH264EncContext *q = avctx->priv_data;
81
82 q->qsv.set_encode_ctrl_cb = qsv_h264_set_encode_ctrl;
83 return ff_qsv_enc_init(avctx, &q->qsv);
84 }
85
/**
 * Codec encode callback: forwards the frame to the shared QSV encoder.
 *
 * @param avctx      codec context; priv_data is a QSVH264EncContext
 * @param pkt        packet passed through to ff_qsv_encode()
 * @param frame      input frame passed through to ff_qsv_encode()
 * @param got_packet output flag passed through to ff_qsv_encode()
 * @return the value returned by ff_qsv_encode()
 */
static int qsv_enc_frame(AVCodecContext *avctx, AVPacket *pkt,
                         const AVFrame *frame, int *got_packet)
{
    QSVH264EncContext *priv = avctx->priv_data;
    QSVEncContext *enc = &priv->qsv;

    return ff_qsv_encode(avctx, enc, pkt, frame, got_packet);
}
93
qsv_enc_close(AVCodecContext * avctx)94 static av_cold int qsv_enc_close(AVCodecContext *avctx)
95 {
96 QSVH264EncContext *q = avctx->priv_data;
97
98 return ff_qsv_enc_close(avctx, &q->qsv);
99 }
100
101 #define OFFSET(x) offsetof(QSVH264EncContext, x)
102 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
103 static const AVOption options[] = {
104 QSV_COMMON_OPTS
105 QSV_OPTION_RDO
106 QSV_OPTION_MAX_FRAME_SIZE
107 QSV_OPTION_MAX_SLICE_SIZE
108 QSV_OPTION_BITRATE_LIMIT
109 QSV_OPTION_MBBRC
110 QSV_OPTION_EXTBRC
111 QSV_OPTION_ADAPTIVE_I
112 QSV_OPTION_ADAPTIVE_B
113 QSV_OPTION_P_STRATEGY
114 QSV_OPTION_B_STRATEGY
115 QSV_OPTION_DBLK_IDC
116 QSV_OPTION_LOW_DELAY_BRC
117 QSV_OPTION_MAX_MIN_QP
118
119 { "cavlc", "Enable CAVLC", OFFSET(qsv.cavlc), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE },
120 #if QSV_HAVE_VCM
121 { "vcm", "Use the video conferencing mode ratecontrol", OFFSET(qsv.vcm), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE },
122 #endif
123 { "idr_interval", "Distance (in I-frames) between IDR frames", OFFSET(qsv.idr_interval), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE },
124 { "pic_timing_sei", "Insert picture timing SEI with pic_struct_syntax element", OFFSET(qsv.pic_timing_sei), AV_OPT_TYPE_BOOL, { .i64 = 1 }, 0, 1, VE },
125 { "single_sei_nal_unit", "Put all the SEI messages into one NALU", OFFSET(qsv.single_sei_nal_unit), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
126 { "max_dec_frame_buffering", "Maximum number of frames buffered in the DPB", OFFSET(qsv.max_dec_frame_buffering), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, UINT16_MAX, VE },
127
128 { "look_ahead", "Use VBR algorithm with look ahead", OFFSET(qsv.look_ahead), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE },
129 { "look_ahead_depth", "Depth of look ahead in number frames", OFFSET(qsv.look_ahead_depth), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 100, VE },
130 { "look_ahead_downsampling", "Downscaling factor for the frames saved for the lookahead analysis", OFFSET(qsv.look_ahead_downsampling),
131 AV_OPT_TYPE_INT, { .i64 = MFX_LOOKAHEAD_DS_UNKNOWN }, MFX_LOOKAHEAD_DS_UNKNOWN, MFX_LOOKAHEAD_DS_4x, VE, "look_ahead_downsampling" },
132 { "unknown" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_UNKNOWN }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
133 { "auto" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_UNKNOWN }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
134 { "off" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_OFF }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
135 { "2x" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_2x }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
136 { "4x" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_LOOKAHEAD_DS_4x }, INT_MIN, INT_MAX, VE, "look_ahead_downsampling" },
137
138 { "int_ref_type", "Intra refresh type. B frames should be set to 0.", OFFSET(qsv.int_ref_type), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, UINT16_MAX, VE, "int_ref_type" },
139 { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 0 }, .flags = VE, "int_ref_type" },
140 { "vertical", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 1 }, .flags = VE, "int_ref_type" },
141 { "horizontal", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = 2 }, .flags = VE, "int_ref_type" },
142 { "int_ref_cycle_size", "Number of frames in the intra refresh cycle", OFFSET(qsv.int_ref_cycle_size), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, UINT16_MAX, VE },
143 { "int_ref_qp_delta", "QP difference for the refresh MBs", OFFSET(qsv.int_ref_qp_delta), AV_OPT_TYPE_INT, { .i64 = INT16_MIN }, INT16_MIN, INT16_MAX, VE },
144 { "recovery_point_sei", "Insert recovery point SEI messages", OFFSET(qsv.recovery_point_sei), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, 1, VE },
145 { "int_ref_cycle_dist", "Distance between the beginnings of the intra-refresh cycles in frames", OFFSET(qsv.int_ref_cycle_dist), AV_OPT_TYPE_INT, { .i64 = -1 }, -1, INT16_MAX, VE },
146 { "profile", NULL, OFFSET(qsv.profile), AV_OPT_TYPE_INT, { .i64 = MFX_PROFILE_UNKNOWN }, 0, INT_MAX, VE, "profile" },
147 { "unknown" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_UNKNOWN }, INT_MIN, INT_MAX, VE, "profile" },
148 { "baseline", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_AVC_BASELINE }, INT_MIN, INT_MAX, VE, "profile" },
149 { "main" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_AVC_MAIN }, INT_MIN, INT_MAX, VE, "profile" },
150 { "high" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_AVC_HIGH }, INT_MIN, INT_MAX, VE, "profile" },
151
152 { "a53cc" , "Use A53 Closed Captions (if available)", OFFSET(qsv.a53_cc), AV_OPT_TYPE_BOOL, {.i64 = 1}, 0, 1, VE},
153
154 { "aud", "Insert the Access Unit Delimiter NAL", OFFSET(qsv.aud), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE},
155
156 #if QSV_HAVE_MF
157 { "mfmode", "Multi-Frame Mode", OFFSET(qsv.mfmode), AV_OPT_TYPE_INT, { .i64 = MFX_MF_AUTO }, MFX_MF_DEFAULT, MFX_MF_AUTO, VE, "mfmode"},
158 { "off" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_MF_DISABLED }, INT_MIN, INT_MAX, VE, "mfmode" },
159 { "auto" , NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_MF_AUTO }, INT_MIN, INT_MAX, VE, "mfmode" },
160 #endif
161
162 { "repeat_pps", "repeat pps for every frame", OFFSET(qsv.repeat_pps), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE },
163
164 { NULL },
165 };
166
167 static const AVClass class = {
168 .class_name = "h264_qsv encoder",
169 .item_name = av_default_item_name,
170 .option = options,
171 .version = LIBAVUTIL_VERSION_INT,
172 };
173
174 static const FFCodecDefault qsv_enc_defaults[] = {
175 { "b", "1M" },
176 { "refs", "0" },
177 // same as the x264 default
178 { "g", "250" },
179 { "bf", "3" },
180 { "qmin", "-1" },
181 { "qmax", "-1" },
182 { "trellis", "-1" },
183 { "flags", "+cgop" },
184 { NULL },
185 };
186
187 const FFCodec ff_h264_qsv_encoder = {
188 .p.name = "h264_qsv",
189 .p.long_name = NULL_IF_CONFIG_SMALL("H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10 (Intel Quick Sync Video acceleration)"),
190 .priv_data_size = sizeof(QSVH264EncContext),
191 .p.type = AVMEDIA_TYPE_VIDEO,
192 .p.id = AV_CODEC_ID_H264,
193 .init = qsv_enc_init,
194 FF_CODEC_ENCODE_CB(qsv_enc_frame),
195 .close = qsv_enc_close,
196 .p.capabilities = AV_CODEC_CAP_DELAY | AV_CODEC_CAP_HYBRID,
197 .p.pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_NV12,
198 AV_PIX_FMT_P010,
199 AV_PIX_FMT_QSV,
200 AV_PIX_FMT_NONE },
201 .p.priv_class = &class,
202 .defaults = qsv_enc_defaults,
203 .caps_internal = FF_CODEC_CAP_INIT_CLEANUP,
204 .p.wrapper_name = "qsv",
205 .hw_configs = ff_qsv_enc_hw_configs,
206 };
207