FFmpeg
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Groups Pages
qsvenc_hevc.c
Go to the documentation of this file.
1 /*
2  * Intel MediaSDK QSV based HEVC encoder
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 
22 #include <stdint.h>
23 #include <sys/types.h>
24 
25 #include <mfx/mfxvideo.h>
26 
27 #include "libavutil/common.h"
28 #include "libavutil/opt.h"
29 
30 #include "avcodec.h"
31 #include "bytestream.h"
32 #include "get_bits.h"
33 #include "hevc.h"
34 #include "internal.h"
35 #include "qsv.h"
36 #include "qsv_internal.h"
37 #include "qsvenc.h"
38 
/**
 * Values accepted by the "load_plugin" option.
 *
 * qsv_enc_init() maps the two HEVC values to a plugin UID string; the
 * option table uses LOAD_PLUGIN_NONE and LOAD_PLUGIN_HEVC_HW as the lower
 * and upper bounds of the valid range, so the order here matters.
 */
enum LoadPlugin {
    LOAD_PLUGIN_NONE,    ///< leave load_plugins untouched
    LOAD_PLUGIN_HEVC_SW, ///< selects uid_hevcenc_sw in qsv_enc_init()
    LOAD_PLUGIN_HEVC_HW, ///< selects uid_hevcenc_hw in qsv_enc_init()
};
44 
45 typedef struct QSVHEVCEncContext {
46  AVClass *class;
50 
52 {
53  GetByteContext gbc;
54  PutByteContext pbc;
55 
56  GetBitContext gb;
57  HEVCNAL sps_nal = { NULL };
58  HEVCSPS sps = { 0 };
59  HEVCVPS vps = { 0 };
60  uint8_t vps_buf[128], vps_rbsp_buf[128];
61  uint8_t *new_extradata;
62  unsigned int sps_id;
63  int ret, i, type, vps_size;
64 
65  if (!avctx->extradata_size) {
66  av_log(avctx, AV_LOG_ERROR, "No extradata returned from libmfx\n");
67  return AVERROR_UNKNOWN;
68  }
69 
70  /* parse the SPS */
71  ret = ff_hevc_extract_rbsp(NULL, avctx->extradata + 4, avctx->extradata_size - 4, &sps_nal);
72  if (ret < 0) {
73  av_log(avctx, AV_LOG_ERROR, "Error unescaping the SPS buffer\n");
74  return ret;
75  }
76 
77  ret = init_get_bits8(&gb, sps_nal.data, sps_nal.size);
78  if (ret < 0) {
79  av_freep(&sps_nal.rbsp_buffer);
80  return ret;
81  }
82 
83  get_bits(&gb, 1);
84  type = get_bits(&gb, 6);
85  if (type != NAL_SPS) {
86  av_log(avctx, AV_LOG_ERROR, "Unexpected NAL type in the extradata: %d\n",
87  type);
88  av_freep(&sps_nal.rbsp_buffer);
89  return AVERROR_INVALIDDATA;
90  }
91  get_bits(&gb, 9);
92 
93  ret = ff_hevc_parse_sps(&sps, &gb, &sps_id, 0, NULL, avctx);
94  av_freep(&sps_nal.rbsp_buffer);
95  if (ret < 0) {
96  av_log(avctx, AV_LOG_ERROR, "Error parsing the SPS\n");
97  return ret;
98  }
99 
100  /* generate the VPS */
101  vps.vps_max_layers = 1;
103  memcpy(&vps.ptl, &sps.ptl, sizeof(vps.ptl));
105  for (i = 0; i < MAX_SUB_LAYERS; i++) {
109  }
110 
111  vps.vps_num_layer_sets = 1;
117 
118  /* generate the encoded RBSP form of the VPS */
119  ret = ff_hevc_encode_nal_vps(&vps, sps.vps_id, vps_rbsp_buf, sizeof(vps_rbsp_buf));
120  if (ret < 0) {
121  av_log(avctx, AV_LOG_ERROR, "Error writing the VPS\n");
122  return ret;
123  }
124 
125  /* escape and add the startcode */
126  bytestream2_init(&gbc, vps_rbsp_buf, ret);
127  bytestream2_init_writer(&pbc, vps_buf, sizeof(vps_buf));
128 
129  bytestream2_put_be32(&pbc, 1); // startcode
130  bytestream2_put_byte(&pbc, NAL_VPS << 1); // NAL
131  bytestream2_put_byte(&pbc, 1); // header
132 
133  while (bytestream2_get_bytes_left(&gbc)) {
134  uint32_t b = bytestream2_peek_be24(&gbc);
135  if (b <= 3) {
136  bytestream2_put_be24(&pbc, 3);
137  bytestream2_skip(&gbc, 2);
138  } else
139  bytestream2_put_byte(&pbc, bytestream2_get_byte(&gbc));
140  }
141 
142  vps_size = bytestream2_tell_p(&pbc);
143  new_extradata = av_mallocz(vps_size + avctx->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
144  if (!new_extradata)
145  return AVERROR(ENOMEM);
146  memcpy(new_extradata, vps_buf, vps_size);
147  memcpy(new_extradata + vps_size, avctx->extradata, avctx->extradata_size);
148 
149  av_freep(&avctx->extradata);
150  avctx->extradata = new_extradata;
151  avctx->extradata_size += vps_size;
152 
153  return 0;
154 }
155 
157 {
158  QSVHEVCEncContext *q = avctx->priv_data;
159  int ret;
160 
161  if (q->load_plugin != LOAD_PLUGIN_NONE) {
162  static const char *uid_hevcenc_sw = "2fca99749fdb49aeb121a5b63ef568f7";
163  static const char *uid_hevcenc_hw = "6fadc791a0c2eb479ab6dcd5ea9da347";
164 
165  if (q->qsv.load_plugins[0]) {
166  av_log(avctx, AV_LOG_WARNING,
167  "load_plugins is not empty, but load_plugin is not set to 'none'."
168  "The load_plugin value will be ignored.\n");
169  } else {
171 
173  q->qsv.load_plugins = av_strdup(uid_hevcenc_sw);
174  else
175  q->qsv.load_plugins = av_strdup(uid_hevcenc_hw);
176 
177  if (!q->qsv.load_plugins)
178  return AVERROR(ENOMEM);
179  }
180  }
181 
182  ret = ff_qsv_enc_init(avctx, &q->qsv);
183  if (ret < 0)
184  return ret;
185 
186  ret = generate_fake_vps(&q->qsv, avctx);
187  if (ret < 0) {
188  ff_qsv_enc_close(avctx, &q->qsv);
189  return ret;
190  }
191 
192  return 0;
193 }
194 
196  const AVFrame *frame, int *got_packet)
197 {
198  QSVHEVCEncContext *q = avctx->priv_data;
199 
200  return ff_qsv_encode(avctx, &q->qsv, pkt, frame, got_packet);
201 }
202 
204 {
205  QSVHEVCEncContext *q = avctx->priv_data;
206 
207  return ff_qsv_enc_close(avctx, &q->qsv);
208 }
209 
210 #define OFFSET(x) offsetof(QSVHEVCEncContext, x)
211 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
212 static const AVOption options[] = {
213  { "async_depth", "Maximum processing parallelism", OFFSET(qsv.async_depth), AV_OPT_TYPE_INT, { .i64 = ASYNC_DEPTH_DEFAULT }, 0, INT_MAX, VE },
214  { "avbr_accuracy", "Accuracy of the AVBR ratecontrol", OFFSET(qsv.avbr_accuracy), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE },
215  { "avbr_convergence", "Convergence of the AVBR ratecontrol", OFFSET(qsv.avbr_convergence), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE },
216 
217  { "load_plugin", "A user plugin to load in an internal session", OFFSET(load_plugin), AV_OPT_TYPE_INT, { .i64 = LOAD_PLUGIN_HEVC_SW }, LOAD_PLUGIN_NONE, LOAD_PLUGIN_HEVC_HW, VE, "load_plugin" },
218  { "none", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_NONE }, 0, 0, VE, "load_plugin" },
219  { "hevc_sw", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_SW }, 0, 0, VE, "load_plugin" },
220  { "hevc_hw", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = LOAD_PLUGIN_HEVC_HW }, 0, 0, VE, "load_plugin" },
221 
222  { "load_plugins", "A :-separate list of hexadecimal plugin UIDs to load in an internal session",
223  OFFSET(qsv.load_plugins), AV_OPT_TYPE_STRING, { .str = "" }, 0, 0, VE },
224 
225  { "profile", NULL, OFFSET(qsv.profile), AV_OPT_TYPE_INT, { .i64 = MFX_PROFILE_UNKNOWN }, 0, INT_MAX, VE, "profile" },
226  { "unknown", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_UNKNOWN }, INT_MIN, INT_MAX, VE, "profile" },
227  { "main", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_MAIN }, INT_MIN, INT_MAX, VE, "profile" },
228  { "main10", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_MAIN10 }, INT_MIN, INT_MAX, VE, "profile" },
229  { "mainsp", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_PROFILE_HEVC_MAINSP }, INT_MIN, INT_MAX, VE, "profile" },
230 
231  { "preset", NULL, OFFSET(qsv.preset), AV_OPT_TYPE_INT, { .i64 = MFX_TARGETUSAGE_BALANCED }, 0, 7, VE, "preset" },
232  { "fast", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TARGETUSAGE_BEST_SPEED }, INT_MIN, INT_MAX, VE, "preset" },
233  { "medium", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TARGETUSAGE_BALANCED }, INT_MIN, INT_MAX, VE, "preset" },
234  { "slow", NULL, 0, AV_OPT_TYPE_CONST, { .i64 = MFX_TARGETUSAGE_BEST_QUALITY }, INT_MIN, INT_MAX, VE, "preset" },
235 
236  { NULL },
237 };
238 
239 static const AVClass class = {
240  .class_name = "hevc_qsv encoder",
241  .item_name = av_default_item_name,
242  .option = options,
244 };
245 
247  { "b", "1M" },
248  { "refs", "0" },
249  // same as the x264 default
250  { "g", "250" },
251  { "bf", "3" },
252 
253  { "flags", "+cgop" },
254  { NULL },
255 };
256 
258  .name = "hevc_qsv",
259  .long_name = NULL_IF_CONFIG_SMALL("HEVC (Intel Quick Sync Video acceleration)"),
260  .priv_data_size = sizeof(QSVHEVCEncContext),
262  .id = AV_CODEC_ID_HEVC,
263  .init = qsv_enc_init,
264  .encode2 = qsv_enc_frame,
265  .close = qsv_enc_close,
266  .capabilities = AV_CODEC_CAP_DELAY,
267  .pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_NV12,
269  AV_PIX_FMT_NONE },
270  .priv_class = &class,
271  .defaults = qsv_enc_defaults,
272 };
#define NULL
Definition: coverity.c:32
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
AVCodec ff_hevc_qsv_encoder
Definition: qsvenc_hevc.c:257
int ff_hevc_encode_nal_vps(HEVCVPS *vps, unsigned int id, uint8_t *buf, int buf_size)
Definition: hevc_ps_enc.c:66
This structure describes decoded (raw) audio or video data.
Definition: frame.h:171
AVOption.
Definition: opt.h:255
int vui_num_ticks_poc_diff_one_minus1
Definition: hevc.h:337
int max_dec_pic_buffering
Definition: hevc.h:418
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:260
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182
#define LIBAVUTIL_VERSION_INT
Definition: version.h:62
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35
int vps_num_ticks_poc_diff_one
vps_num_ticks_poc_diff_one_minus1 + 1
Definition: hevc.h:387
VUI vui
Definition: hevc.h:423
const char * b
Definition: vf_curves.c:109
static av_always_inline void bytestream2_init_writer(PutByteContext *p, uint8_t *buf, int buf_size)
Definition: bytestream.h:143
uint32_t vui_time_scale
Definition: hevc.h:335
static int generate_fake_vps(QSVEncContext *q, AVCodecContext *avctx)
Definition: qsvenc_hevc.c:51
static av_always_inline void bytestream2_init(GetByteContext *g, const uint8_t *buf, int buf_size)
Definition: bytestream.h:133
int max_latency_increase
Definition: hevc.h:420
static AVPacket pkt
AVCodec.
Definition: avcodec.h:3472
Definition: h264.h:118
static int qsv_enc_frame(AVCodecContext *avctx, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: qsvenc_hevc.c:195
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:72
#define AV_CODEC_CAP_DELAY
Encoder or decoder requires flushing with NULL input at the end in order to give the complete and correct output.
Definition: avcodec.h:882
int ff_qsv_encode(AVCodecContext *avctx, QSVEncContext *q, AVPacket *pkt, const AVFrame *frame, int *got_packet)
Definition: qsvenc.c:417
uint8_t
#define av_cold
Definition: attributes.h:74
unsigned int vps_num_reorder_pics[MAX_SUB_LAYERS]
Definition: hevc.h:379
AVOptions.
const uint8_t * data
Definition: hevc.h:754
uint8_t vps_timing_info_present_flag
Definition: hevc.h:383
uint8_t * rbsp_buffer
Definition: hevc.h:750
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:1617
int vps_max_sub_layers
vps_max_temporal_layers_minus1 + 1
Definition: hevc.h:374
static AVFrame * frame
#define OFFSET(x)
Definition: qsvenc_hevc.c:210
bitstream reader API header.
int ff_qsv_enc_close(AVCodecContext *avctx, QSVEncContext *q)
Definition: qsvenc.c:536
#define av_log(a,...)
QSVEncContext qsv
Definition: qsvenc_hevc.c:47
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
int vps_max_layers
Definition: hevc.h:373
av_default_item_name
#define AVERROR(e)
Definition: error.h:43
static av_always_inline void bytestream2_skip(GetByteContext *g, unsigned int size)
Definition: bytestream.h:164
int vui_timing_info_present_flag
Definition: hevc.h:333
char * load_plugins
Definition: qsvenc.h:74
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:175
static av_always_inline unsigned int bytestream2_get_bytes_left(GetByteContext *g)
Definition: bytestream.h:154
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (first byte U and the following byte V)
Definition: pixfmt.h:91
const char * name
Name of the codec implementation.
Definition: avcodec.h:3479
int vui_poc_proportional_to_timing_flag
Definition: hevc.h:336
static av_always_inline int bytestream2_tell_p(PutByteContext *p)
Definition: bytestream.h:193
Libavcodec external API header.
uint32_t vps_num_units_in_tick
Definition: hevc.h:384
#define ASYNC_DEPTH_DEFAULT
Definition: qsv_internal.h:46
int vps_num_layer_sets
vps_num_layer_sets_minus1 + 1
Definition: hevc.h:382
static const AVCodecDefault qsv_enc_defaults[]
Definition: qsvenc_hevc.c:246
uint8_t vps_poc_proportional_to_timing_flag
Definition: hevc.h:386
int size
Definition: hevc.h:753
unsigned vps_id
Definition: hevc.h:399
PTL ptl
Definition: hevc.h:376
uint32_t vps_time_scale
Definition: hevc.h:385
Definition: hevc.h:398
Definition: hevc.h:371
static av_cold int qsv_enc_close(AVCodecContext *avctx)
Definition: qsvenc_hevc.c:203
int ff_hevc_extract_rbsp(HEVCContext *s, const uint8_t *src, int length, HEVCNAL *nal)
Extract the raw (unescaped) HEVC bitstream.
Definition: hevc_parse.c:32
Definition: hevc.h:749
char * av_strdup(const char *s)
Duplicate the string s.
Definition: mem.c:267
PTL ptl
Definition: hevc.h:424
int max_sub_layers
Definition: hevc.h:416
static int init_get_bits8(GetBitContext *s, const uint8_t *buffer, int byte_size)
Initialize GetBitContext.
Definition: get_bits.h:441
main external API structure.
Definition: avcodec.h:1502
Definition: hevc.h:110
uint32_t vui_num_units_in_tick
Definition: hevc.h:334
GLint GLenum type
Definition: opengl_enc.c:105
int extradata_size
Definition: avcodec.h:1618
Describe the class of an AVClass context structure.
Definition: log.h:67
int ff_qsv_enc_init(AVCodecContext *avctx, QSVEncContext *q)
Definition: qsvenc.c:235
#define MAX_SUB_LAYERS
7.4.2.1
Definition: hevc.h:48
HW acceleration through QSV, data[3] contains a pointer to the mfxFrameSurface1 structure.
Definition: pixfmt.h:261
static enum AVPixelFormat pix_fmts[]
Definition: libkvazaar.c:209
common internal api header.
common internal and external API header
#define AVERROR_UNKNOWN
Unknown error, typically from an external library.
Definition: error.h:71
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
Definition: avcodec.h:636
void * priv_data
Definition: avcodec.h:1544
unsigned int vps_max_dec_pic_buffering[MAX_SUB_LAYERS]
Definition: hevc.h:378
unsigned int vps_max_latency_increase[MAX_SUB_LAYERS]
Definition: hevc.h:380
int ff_hevc_parse_sps(HEVCSPS *sps, GetBitContext *gb, unsigned int *sps_id, int apply_defdispwin, AVBufferRef **vps_list, AVCodecContext *avctx)
Parse the SPS from the bitstream into the provided HEVCSPS struct.
Definition: hevc_ps.c:796
static av_cold int qsv_enc_init(AVCodecContext *avctx)
Definition: qsvenc_hevc.c:156
#define VE
Definition: qsvenc_hevc.c:211
#define av_freep(p)
int num_reorder_pics
Definition: hevc.h:419
struct HEVCSPS::@50 temporal_layer[MAX_SUB_LAYERS]
AVPixelFormat
Pixel format.
Definition: pixfmt.h:61
This structure stores compressed data.
Definition: avcodec.h:1400
void * av_mallocz(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if available on the CPU) and zero all the bytes of the block.
Definition: mem.c:252
LoadPlugin
Definition: qsvdec_h2645.c:38
int vps_sub_layer_ordering_info_present_flag
Definition: hevc.h:377
static const AVOption options[]
Definition: qsvenc_hevc.c:212