FFmpeg
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Groups Pages
libopenh264enc.c
Go to the documentation of this file.
1 /*
2  * OpenH264 video encoder
3  * Copyright (C) 2014 Martin Storsjo
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include <wels/codec_api.h>
23 #include <wels/codec_ver.h>
24 
25 #include "libavutil/attributes.h"
26 #include "libavutil/common.h"
27 #include "libavutil/opt.h"
28 #include "libavutil/internal.h"
29 #include "libavutil/intreadwrite.h"
30 #include "libavutil/mathematics.h"
31 
32 #include "avcodec.h"
33 #include "internal.h"
34 #include "libopenh264.h"
35 
/* When building against OpenH264 older than 1.6, alias SM_SIZELIMITED_SLICE to
 * SM_DYN_SLICE so the rest of this file can use a single name. */
36 #if !OPENH264_VER_AT_LEAST(1, 6)
37 #define SM_SIZELIMITED_SLICE SM_DYN_SLICE
38 #endif
39 
/* Private encoder state, stored in AVCodecContext.priv_data.
 * NOTE(review): this listing skips embedded lines 43-44 and 46-47. The option
 * table references slice_mode, loopfilter, max_nal_size and skip_frames through
 * OFFSET(), so those fields are presumably declared on the missing lines --
 * confirm against the original file. */
40 typedef struct SVCContext {
41  const AVClass *av_class;
42  ISVCEncoder *encoder; /* OpenH264 encoder handle: created in init, destroyed in close */
45  char *profile; /* "profile" option string; defaults to NULL */
48  int skipped; /* number of frames the encoder skipped; reported on close */
49  int cabac; /* "cabac" option, 0 or 1 */
50 } SVCContext;
51 
52 #define OFFSET(x) offsetof(SVCContext, x)
53 #define VE AV_OPT_FLAG_VIDEO_PARAM | AV_OPT_FLAG_ENCODING_PARAM
54 static const AVOption options[] = {
55 #if OPENH264_VER_AT_LEAST(1, 6)
56  { "slice_mode", "set slice mode", OFFSET(slice_mode), AV_OPT_TYPE_INT, { .i64 = SM_FIXEDSLCNUM_SLICE }, SM_SINGLE_SLICE, SM_RESERVED, VE, "slice_mode" },
57 #else
58  { "slice_mode", "set slice mode", OFFSET(slice_mode), AV_OPT_TYPE_INT, { .i64 = SM_AUTO_SLICE }, SM_SINGLE_SLICE, SM_RESERVED, VE, "slice_mode" },
59 #endif
60  { "fixed", "a fixed number of slices", 0, AV_OPT_TYPE_CONST, { .i64 = SM_FIXEDSLCNUM_SLICE }, 0, 0, VE, "slice_mode" },
61 #if OPENH264_VER_AT_LEAST(1, 6)
62  { "dyn", "Size limited (compatibility name)", 0, AV_OPT_TYPE_CONST, { .i64 = SM_SIZELIMITED_SLICE }, 0, 0, VE, "slice_mode" },
63  { "sizelimited", "Size limited", 0, AV_OPT_TYPE_CONST, { .i64 = SM_SIZELIMITED_SLICE }, 0, 0, VE, "slice_mode" },
64 #else
65  { "rowmb", "one slice per row of macroblocks", 0, AV_OPT_TYPE_CONST, { .i64 = SM_ROWMB_SLICE }, 0, 0, VE, "slice_mode" },
66  { "auto", "automatic number of slices according to number of threads", 0, AV_OPT_TYPE_CONST, { .i64 = SM_AUTO_SLICE }, 0, 0, VE, "slice_mode" },
67  { "dyn", "Dynamic slicing", 0, AV_OPT_TYPE_CONST, { .i64 = SM_DYN_SLICE }, 0, 0, VE, "slice_mode" },
68 #endif
69  { "loopfilter", "enable loop filter", OFFSET(loopfilter), AV_OPT_TYPE_INT, { .i64 = 1 }, 0, 1, VE },
70  { "profile", "set profile restrictions", OFFSET(profile), AV_OPT_TYPE_STRING, { .str = NULL }, 0, 0, VE },
71  { "max_nal_size", "set maximum NAL size in bytes", OFFSET(max_nal_size), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, INT_MAX, VE },
72  { "allow_skip_frames", "allow skipping frames to hit the target bitrate", OFFSET(skip_frames), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, VE },
73  { "cabac", "Enable cabac", OFFSET(cabac), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, VE },
74  { NULL }
75 };
76 
/* AVClass describing the encoder's private context; the codec entry points to
 * it through .priv_class.
 * NOTE(review): embedded line 78, which would hold the initializers, is missing
 * from this listing -- confirm against the original file. */
77 static const AVClass class = {
79 };
80 
/* Body of the encoder close callback. The cross-reference list names it
 * svc_encode_close(AVCodecContext *avctx); the signature on embedded line 81
 * is missing from this listing.
 * Destroys the OpenH264 encoder if one was created and reports how many
 * frames were skipped during encoding. Always returns 0. */
82 {
83  SVCContext *s = avctx->priv_data;
84 
/* s->encoder is only non-NULL once WelsCreateSVCEncoder() has succeeded. */
85  if (s->encoder)
86  WelsDestroySVCEncoder(s->encoder);
87  if (s->skipped > 0)
88  av_log(avctx, AV_LOG_WARNING, "%d frames skipped\n", s->skipped);
89  return 0;
90 }
91 
/* Body of the encoder init callback. The cross-reference list names it
 * svc_encode_init(AVCodecContext *avctx); the signature on embedded line 92
 * is missing from this listing.
 * Creates the OpenH264 encoder, routes its log output through
 * ff_libopenh264_trace_callback, fills SEncParamExt from avctx and the private
 * options, initializes the encoder, optionally exports the parameter sets as
 * extradata, and attaches CPB side data.
 * Returns 0 on success or a negative AVERROR code.
 * NOTE(review): the error returns below do not destroy s->encoder themselves;
 * presumably cleanup is left to the close callback -- confirm that the codec
 * sets FF_CODEC_CAP_INIT_CLEANUP (embedded line 297 is not visible here). */
93 {
94  SVCContext *s = avctx->priv_data;
95  SEncParamExt param = { 0 };
96  int err;
97  int log_level;
98  WelsTraceCallback callback_function;
99  AVCPBProperties *props;
100 
101  if ((err = ff_libopenh264_check_version(avctx)) < 0)
102  return err;
103 
104  if (WelsCreateSVCEncoder(&s->encoder)) {
105  av_log(avctx, AV_LOG_ERROR, "Unable to create encoder\n");
106  return AVERROR_UNKNOWN;
107  }
108 
109  // Pass all libopenh264 messages to our callback, to allow ourselves to filter them.
110  log_level = WELS_LOG_DETAIL;
111  (*s->encoder)->SetOption(s->encoder, ENCODER_OPTION_TRACE_LEVEL, &log_level);
112 
113  // Set the logging callback function to one that uses av_log() (implemented in libopenh264.c).
114  callback_function = (WelsTraceCallback) ff_libopenh264_trace_callback;
115  (*s->encoder)->SetOption(s->encoder, ENCODER_OPTION_TRACE_CALLBACK, &callback_function);
116 
117  // Set the AVCodecContext as the libopenh264 callback context so that it can be passed to av_log().
118  (*s->encoder)->SetOption(s->encoder, ENCODER_OPTION_TRACE_CALLBACK_CONTEXT, &avctx);
119 
120  (*s->encoder)->GetDefaultParams(s->encoder, &param);
121 
/* Fall back to the generic coder_type setting when the private "cabac" option
 * is left at 0.
 * NOTE(review): embedded lines 123 and 126 are missing from this listing;
 * presumably the deprecation-warning guard macros -- confirm. */
122 #if FF_API_CODER_TYPE
124  if (!s->cabac)
125  s->cabac = avctx->coder_type == FF_CODER_TYPE_AC;
127 #endif
128 
/* The maximum frame rate is taken as the reciprocal of the codec time base. */
129  param.fMaxFrameRate = 1/av_q2d(avctx->time_base);
130  param.iPicWidth = avctx->width;
131  param.iPicHeight = avctx->height;
132  param.iTargetBitrate = avctx->bit_rate;
/* The maximum bitrate is never set below the target bitrate. */
133  param.iMaxBitrate = FFMAX(avctx->rc_max_rate, avctx->bit_rate);
134  param.iRCMode = RC_QUALITY_MODE;
135  param.iTemporalLayerNum = 1;
136  param.iSpatialLayerNum = 1;
137  param.bEnableDenoise = 0;
138  param.bEnableBackgroundDetection = 1;
139  param.bEnableAdaptiveQuant = 1;
140  param.bEnableFrameSkip = s->skip_frames;
141  param.bEnableLongTermReference = 0;
142  param.iLtrMarkPeriod = 30;
143  param.uiIntraPeriod = avctx->gop_size;
/* The field controlling SPS/PPS id handling was renamed in OpenH264 1.4. */
144 #if OPENH264_VER_AT_LEAST(1, 4)
145  param.eSpsPpsIdStrategy = CONSTANT_ID;
146 #else
147  param.bEnableSpsPpsIdAddition = 0;
148 #endif
149  param.bPrefixNalAddingCtrl = 0;
150  param.iLoopFilterDisableIdc = !s->loopfilter;
151  param.iEntropyCodingModeFlag = 0;
152  param.iMultipleThreadIdc = avctx->thread_count;
/* Entropy coding mode 1 is selected by profile "main", or by the cabac option
 * when no profile string was given; any other profile string leaves it at 0. */
153  if (s->profile && !strcmp(s->profile, "main"))
154  param.iEntropyCodingModeFlag = 1;
155  else if (!s->profile && s->cabac)
156  param.iEntropyCodingModeFlag = 1;
157 
/* Only one spatial layer is configured; it mirrors the global settings. */
158  param.sSpatialLayers[0].iVideoWidth = param.iPicWidth;
159  param.sSpatialLayers[0].iVideoHeight = param.iPicHeight;
160  param.sSpatialLayers[0].fFrameRate = param.fMaxFrameRate;
161  param.sSpatialLayers[0].iSpatialBitrate = param.iTargetBitrate;
162  param.sSpatialLayers[0].iMaxSpatialBitrate = param.iMaxBitrate;
163 
/* A fixed slice count and a NAL size limit cannot be requested together. */
164  if ((avctx->slices > 1) && (s->max_nal_size)) {
165  av_log(avctx, AV_LOG_ERROR,
166  "Invalid combination -slices %d and -max_nal_size %d.\n",
167  avctx->slices, s->max_nal_size);
168  return AVERROR(EINVAL);
169  }
170 
171  if (avctx->slices > 1)
172  s->slice_mode = SM_FIXEDSLCNUM_SLICE;
173 
/* NOTE(review): embedded line 175, the body of this if, is missing from this
 * listing; presumably it switches slice_mode to SM_SIZELIMITED_SLICE --
 * confirm against the original file. */
174  if (s->max_nal_size)
176 
/* The slice configuration fields moved in OpenH264 1.6. */
177 #if OPENH264_VER_AT_LEAST(1, 6)
178  param.sSpatialLayers[0].sSliceArgument.uiSliceMode = s->slice_mode;
179  param.sSpatialLayers[0].sSliceArgument.uiSliceNum = avctx->slices;
180 #else
181  param.sSpatialLayers[0].sSliceCfg.uiSliceMode = s->slice_mode;
182  param.sSpatialLayers[0].sSliceCfg.sSliceArgument.uiSliceNum = avctx->slices;
183 #endif
184 
/* Size-limited slicing requires a non-zero max_nal_size. */
185  if (s->slice_mode == SM_SIZELIMITED_SLICE) {
186  if (s->max_nal_size){
187  param.uiMaxNalSize = s->max_nal_size;
188 #if OPENH264_VER_AT_LEAST(1, 6)
189  param.sSpatialLayers[0].sSliceArgument.uiSliceSizeConstraint = s->max_nal_size;
190 #else
191  param.sSpatialLayers[0].sSliceCfg.sSliceArgument.uiSliceSizeConstraint = s->max_nal_size;
192 #endif
193  } else {
194  av_log(avctx, AV_LOG_ERROR, "Invalid -max_nal_size, "
195  "specify a valid max_nal_size to use -slice_mode dyn\n");
196  return AVERROR(EINVAL);
197  }
198  }
199 
200  if ((*s->encoder)->InitializeExt(s->encoder, &param) != cmResultSuccess) {
201  av_log(avctx, AV_LOG_ERROR, "Initialize failed\n");
202  return AVERROR_UNKNOWN;
203  }
204 
/* With global headers, the encoder's parameter sets are copied into extradata;
 * size is the sum of the NAL lengths in layer 0. */
205  if (avctx->flags & AV_CODEC_FLAG_GLOBAL_HEADER) {
206  SFrameBSInfo fbi = { 0 };
207  int i, size = 0;
208  (*s->encoder)->EncodeParameterSets(s->encoder, &fbi);
209  for (i = 0; i < fbi.sLayerInfo[0].iNalCount; i++)
210  size += fbi.sLayerInfo[0].pNalLengthInByte[i];
/* NOTE(review): embedded line 211 is missing from this listing; presumably it
 * allocates avctx->extradata (size plus padding) -- confirm. */
212  if (!avctx->extradata)
213  return AVERROR(ENOMEM);
214  avctx->extradata_size = size;
215  memcpy(avctx->extradata, fbi.sLayerInfo[0].pBsBuf, size);
216  }
217 
/* Export the configured bitrates as CPB side data. */
218  props = ff_add_cpb_side_data(avctx);
219  if (!props)
220  return AVERROR(ENOMEM);
221  props->max_bitrate = param.iMaxBitrate;
222  props->avg_bitrate = param.iTargetBitrate;
223 
224  return 0;
225 }
226 
227 static int svc_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
228  const AVFrame *frame, int *got_packet)
229 {
230  SVCContext *s = avctx->priv_data;
231  SFrameBSInfo fbi = { 0 };
232  int i, ret;
233  int encoded;
234  SSourcePicture sp = { 0 };
235  int size = 0, layer, first_layer = 0;
236  int layer_size[MAX_LAYER_NUM_OF_FRAME] = { 0 };
237 
238  sp.iColorFormat = videoFormatI420;
239  for (i = 0; i < 3; i++) {
240  sp.iStride[i] = frame->linesize[i];
241  sp.pData[i] = frame->data[i];
242  }
243  sp.iPicWidth = avctx->width;
244  sp.iPicHeight = avctx->height;
245 
246  encoded = (*s->encoder)->EncodeFrame(s->encoder, &sp, &fbi);
247  if (encoded != cmResultSuccess) {
248  av_log(avctx, AV_LOG_ERROR, "EncodeFrame failed\n");
249  return AVERROR_UNKNOWN;
250  }
251  if (fbi.eFrameType == videoFrameTypeSkip) {
252  s->skipped++;
253  av_log(avctx, AV_LOG_DEBUG, "frame skipped\n");
254  return 0;
255  }
256  first_layer = 0;
257  // Normal frames are returned with one single layer, while IDR
258  // frames have two layers, where the first layer contains the SPS/PPS.
259  // If using global headers, don't include the SPS/PPS in the returned
260  // packet - thus, only return one layer.
261  if (avctx->flags & AV_CODEC_FLAG_GLOBAL_HEADER)
262  first_layer = fbi.iLayerNum - 1;
263 
264  for (layer = first_layer; layer < fbi.iLayerNum; layer++) {
265  for (i = 0; i < fbi.sLayerInfo[layer].iNalCount; i++)
266  layer_size[layer] += fbi.sLayerInfo[layer].pNalLengthInByte[i];
267  size += layer_size[layer];
268  }
269  av_log(avctx, AV_LOG_DEBUG, "%d slices\n", fbi.sLayerInfo[fbi.iLayerNum - 1].iNalCount);
270 
271  if ((ret = ff_alloc_packet2(avctx, avpkt, size, size))) {
272  av_log(avctx, AV_LOG_ERROR, "Error getting output packet\n");
273  return ret;
274  }
275  size = 0;
276  for (layer = first_layer; layer < fbi.iLayerNum; layer++) {
277  memcpy(avpkt->data + size, fbi.sLayerInfo[layer].pBsBuf, layer_size[layer]);
278  size += layer_size[layer];
279  }
280  avpkt->pts = frame->pts;
281  if (fbi.eFrameType == videoFrameTypeIDR)
282  avpkt->flags |= AV_PKT_FLAG_KEY;
283  *got_packet = 1;
284  return 0;
285 }
286 
/* Codec registration entry for the libopenh264 H.264 encoder.
 * NOTE(review): embedded lines 287, 293 and 297 are missing from this listing;
 * presumably the declaration "AVCodec ff_libopenh264_encoder = {", the .init
 * callback and the internal capability flags -- confirm against the original
 * file. */
288  .name = "libopenh264",
289  .long_name = NULL_IF_CONFIG_SMALL("OpenH264 H.264 / AVC / MPEG-4 AVC / MPEG-4 part 10"),
290  .type = AVMEDIA_TYPE_VIDEO,
291  .id = AV_CODEC_ID_H264,
292  .priv_data_size = sizeof(SVCContext),
294  .encode2 = svc_encode_frame,
295  .close = svc_encode_close,
296  .capabilities = AV_CODEC_CAP_AUTO_THREADS,
/* Only planar YUV 4:2:0 input is accepted; the list ends with AV_PIX_FMT_NONE. */
298  .pix_fmts = (const enum AVPixelFormat[]){ AV_PIX_FMT_YUV420P,
299  AV_PIX_FMT_NONE },
300  .priv_class = &class,
301 };
#define FF_CODEC_CAP_INIT_CLEANUP
The codec allows calling the close function for deallocation even if the init function returned a failure.
Definition: internal.h:48
void ff_libopenh264_trace_callback(void *ctx, int level, const char *msg)
Definition: libopenh264.c:41
#define NULL
Definition: coverity.c:32
const char * s
Definition: avisynth_c.h:768
This structure describes decoded (raw) audio or video data.
Definition: frame.h:187
AVOption.
Definition: opt.h:246
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182
int64_t bit_rate
the average bitrate
Definition: avcodec.h:1797
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35
int max_bitrate
Maximum bitrate of the stream, in bits per second.
Definition: avcodec.h:1351
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if available on the CPU) and zero all the bytes of the block.
Definition: mem.c:222
#define AV_CODEC_CAP_AUTO_THREADS
Codec supports avctx->thread_count == 0 (auto).
Definition: avcodec.h:1069
AVCodec.
Definition: avcodec.h:3681
Macro definitions for various function/variable attributes.
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avcodec.h:1869
#define FF_CODEC_CAP_INIT_THREADSAFE
The codec does not modify any global variables in the init function, allowing to call the init function without locking any global mutexes.
Definition: internal.h:40
#define av_cold
Definition: attributes.h:82
AVOptions.
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:271
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:1847
static AVFrame * frame
uint8_t * data
Definition: avcodec.h:1657
static double av_q2d(AVRational a)
Convert an AVRational to a double.
Definition: rational.h:104
#define OFFSET(x)
#define sp
Definition: regdef.h:63
ptrdiff_t size
Definition: opengl_enc.c:101
ISVCEncoder * encoder
#define av_log(a,...)
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
Definition: avcodec.h:1689
static const AVOption options[]
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
av_default_item_name
#define AVERROR(e)
Definition: error.h:43
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:179
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:197
const AVClass * av_class
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:1827
const char * name
Name of the codec implementation.
Definition: avcodec.h:3688
static av_cold int svc_encode_close(AVCodecContext *avctx)
#define FFMAX(a, b)
Definition: common.h:94
int flags
A combination of AV_PKT_FLAG values.
Definition: avcodec.h:1663
static av_cold int svc_encode_init(AVCodecContext *avctx)
common internal API header
#define VE
int width
picture width / height.
Definition: avcodec.h:1919
attribute_deprecated int coder_type
Definition: avcodec.h:2785
int thread_count
Thread count; used to decide how many independent tasks should be passed to execute().
Definition: avcodec.h:3161
This structure describes the bitrate properties of an encoded bitstream.
Definition: avcodec.h:1346
Libavcodec external API header.
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:218
main external API structure.
Definition: avcodec.h:1732
#define FF_CODER_TYPE_AC
Definition: avcodec.h:2775
char * profile
int extradata_size
Definition: avcodec.h:1848
Describe the class of an AVClass context structure.
Definition: log.h:67
static int svc_encode_frame(AVCodecContext *avctx, AVPacket *avpkt, const AVFrame *frame, int *got_packet)
#define SM_SIZELIMITED_SLICE
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int64_t min_size)
Check AVPacket size and/or allocate data.
Definition: utils.c:1736
static enum AVPixelFormat pix_fmts[]
Definition: libkvazaar.c:262
mfxU16 profile
Definition: qsvenc.c:44
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:201
#define AV_CODEC_FLAG_GLOBAL_HEADER
Place global headers in extradata instead of every keyframe.
Definition: avcodec.h:917
int gop_size
the number of pictures in a group of pictures, or 0 for intra_only
Definition: avcodec.h:1945
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:62
#define FF_DISABLE_DEPRECATION_WARNINGS
Definition: internal.h:83
common internal api header.
common internal and external API header
#define AVERROR_UNKNOWN
Unknown error, typically from an external library.
Definition: error.h:71
AVCPBProperties * ff_add_cpb_side_data(AVCodecContext *avctx)
Add a CPB properties side data to an encoding context.
Definition: utils.c:4122
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding.
Definition: avcodec.h:769
int slices
Number of slices.
Definition: avcodec.h:2485
void * priv_data
Definition: avcodec.h:1774
#define FF_ENABLE_DEPRECATION_WARNINGS
Definition: internal.h:84
int avg_bitrate
Average bitrate of the stream, in bits per second.
Definition: avcodec.h:1361
int ff_libopenh264_check_version(void *logctx)
Definition: libopenh264.c:49
AVCodec ff_libopenh264_encoder
AVPixelFormat
Pixel format.
Definition: pixfmt.h:60
This structure stores compressed data.
Definition: avcodec.h:1634
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will be presented to the user.
Definition: avcodec.h:1650
int64_t rc_max_rate
maximum bitrate
Definition: avcodec.h:2732