FFmpeg
nvdec_h264.c
Go to the documentation of this file.
1 /*
2  * MPEG-4 Part 10 / AVC / H.264 HW decode acceleration through NVDEC
3  *
4  * Copyright (c) 2016 Anton Khirnov
5  *
6  * This file is part of FFmpeg.
7  *
8  * FFmpeg is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU Lesser General Public
10  * License as published by the Free Software Foundation; either
11  * version 2.1 of the License, or (at your option) any later version.
12  *
13  * FFmpeg is distributed in the hope that it will be useful,
14  * but WITHOUT ANY WARRANTY; without even the implied warranty of
15  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16  * Lesser General Public License for more details.
17  *
18  * You should have received a copy of the GNU Lesser General Public
19  * License along with FFmpeg; if not, write to the Free Software
20  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
21  */
22 
23 #include <stdint.h>
24 #include <string.h>
25 
26 #include "libavutil/mem.h"
27 #include "avcodec.h"
28 #include "nvdec.h"
29 #include "decode.h"
30 #include "internal.h"
31 #include "h264dec.h"
32 #include "hwaccel_internal.h"
33 
34 static void dpb_add(const H264Context *h, CUVIDH264DPBENTRY *dst, const H264Picture *src,
35  int frame_idx)
36 {
37  FrameDecodeData *fdd = (FrameDecodeData*)src->f->private_ref->data;
38  const NVDECFrame *cf = fdd->hwaccel_priv;
39 
40  dst->PicIdx = cf ? cf->idx : -1;
41  dst->FrameIdx = frame_idx;
42  dst->is_long_term = src->long_ref;
43  dst->not_existing = 0;
44  dst->used_for_reference = src->reference & 3;
45  dst->FieldOrderCnt[0] = src->field_poc[0];
46  dst->FieldOrderCnt[1] = src->field_poc[1];
47 }
48 
50  const uint8_t *buffer, uint32_t size)
51 {
52  const H264Context *h = avctx->priv_data;
53  const PPS *pps = h->ps.pps;
54  const SPS *sps = h->ps.sps;
55 
57  CUVIDPICPARAMS *pp = &ctx->pic_params;
58  CUVIDH264PICPARAMS *ppc = &pp->CodecSpecific.h264;
59  FrameDecodeData *fdd;
60  NVDECFrame *cf;
61 
62  int i, dpb_size, ret;
63 
64  ret = ff_nvdec_start_frame(avctx, h->cur_pic_ptr->f);
65  if (ret < 0)
66  return ret;
67 
68  fdd = (FrameDecodeData*)h->cur_pic_ptr->f->private_ref->data;
69  cf = (NVDECFrame*)fdd->hwaccel_priv;
70 
71  *pp = (CUVIDPICPARAMS) {
72  .PicWidthInMbs = h->mb_width,
73  .FrameHeightInMbs = h->mb_height,
74  .CurrPicIdx = cf->idx,
75  .field_pic_flag = FIELD_PICTURE(h),
76  .bottom_field_flag = h->picture_structure == PICT_BOTTOM_FIELD,
77  .second_field = FIELD_PICTURE(h) && !h->first_field,
78  .ref_pic_flag = h->nal_ref_idc != 0,
79  .intra_pic_flag = 1,
80 
81  .CodecSpecific.h264 = {
82  .log2_max_frame_num_minus4 = sps->log2_max_frame_num - 4,
83  .pic_order_cnt_type = sps->poc_type,
84  .log2_max_pic_order_cnt_lsb_minus4 = FFMAX(sps->log2_max_poc_lsb - 4, 0),
85  .delta_pic_order_always_zero_flag = sps->delta_pic_order_always_zero_flag,
86  .frame_mbs_only_flag = sps->frame_mbs_only_flag,
87  .direct_8x8_inference_flag = sps->direct_8x8_inference_flag,
88  .num_ref_frames = sps->ref_frame_count,
89  .residual_colour_transform_flag = sps->residual_color_transform_flag,
90  .bit_depth_luma_minus8 = sps->bit_depth_luma - 8,
91  .bit_depth_chroma_minus8 = sps->bit_depth_chroma - 8,
92  .qpprime_y_zero_transform_bypass_flag = sps->transform_bypass,
93 
94  .entropy_coding_mode_flag = pps->cabac,
95  .pic_order_present_flag = pps->pic_order_present,
96  .num_ref_idx_l0_active_minus1 = pps->ref_count[0] - 1,
97  .num_ref_idx_l1_active_minus1 = pps->ref_count[1] - 1,
98  .weighted_pred_flag = pps->weighted_pred,
99  .weighted_bipred_idc = pps->weighted_bipred_idc,
100  .pic_init_qp_minus26 = pps->init_qp - 26,
101  .deblocking_filter_control_present_flag = pps->deblocking_filter_parameters_present,
102  .redundant_pic_cnt_present_flag = pps->redundant_pic_cnt_present,
103  .transform_8x8_mode_flag = pps->transform_8x8_mode,
104  .MbaffFrameFlag = sps->mb_aff && !FIELD_PICTURE(h),
105  .constrained_intra_pred_flag = pps->constrained_intra_pred,
106  .chroma_qp_index_offset = pps->chroma_qp_index_offset[0],
107  .second_chroma_qp_index_offset = pps->chroma_qp_index_offset[1],
108  .ref_pic_flag = h->nal_ref_idc != 0,
109  .frame_num = h->poc.frame_num,
110  .CurrFieldOrderCnt[0] = h->cur_pic_ptr->field_poc[0],
111  .CurrFieldOrderCnt[1] = h->cur_pic_ptr->field_poc[1],
112  },
113  };
114 
115  memcpy(ppc->WeightScale4x4, pps->scaling_matrix4, sizeof(ppc->WeightScale4x4));
116  memcpy(ppc->WeightScale8x8[0], pps->scaling_matrix8[0], sizeof(ppc->WeightScale8x8[0]));
117  memcpy(ppc->WeightScale8x8[1], pps->scaling_matrix8[3], sizeof(ppc->WeightScale8x8[0]));
118 
119  dpb_size = 0;
120  for (i = 0; i < h->short_ref_count; i++)
121  dpb_add(h, &ppc->dpb[dpb_size++], h->short_ref[i], h->short_ref[i]->frame_num);
122  for (i = 0; i < 16; i++) {
123  if (h->long_ref[i])
124  dpb_add(h, &ppc->dpb[dpb_size++], h->long_ref[i], i);
125  }
126 
127  for (i = dpb_size; i < FF_ARRAY_ELEMS(ppc->dpb); i++)
128  ppc->dpb[i].PicIdx = -1;
129 
130  return 0;
131 }
132 
133 static int nvdec_h264_decode_slice(AVCodecContext *avctx, const uint8_t *buffer,
134  uint32_t size)
135 {
137  CUVIDPICPARAMS *pp = &ctx->pic_params;
138  const H264Context *h = avctx->priv_data;
139  const H264SliceContext *sl = &h->slice_ctx[0];
140  void *tmp;
141 
142  tmp = av_fast_realloc(ctx->bitstream_internal, &ctx->bitstream_allocated,
143  ctx->bitstream_len + size + 3);
144  if (!tmp)
145  return AVERROR(ENOMEM);
146  ctx->bitstream = ctx->bitstream_internal = tmp;
147 
148  tmp = av_fast_realloc(ctx->slice_offsets, &ctx->slice_offsets_allocated,
149  (ctx->nb_slices + 1) * sizeof(*ctx->slice_offsets));
150  if (!tmp)
151  return AVERROR(ENOMEM);
152  ctx->slice_offsets = tmp;
153 
154  AV_WB24(ctx->bitstream_internal + ctx->bitstream_len, 1);
155  memcpy(ctx->bitstream_internal + ctx->bitstream_len + 3, buffer, size);
156  ctx->slice_offsets[ctx->nb_slices] = ctx->bitstream_len ;
157  ctx->bitstream_len += size + 3;
158  ctx->nb_slices++;
159 
161  pp->intra_pic_flag = 0;
162 
163  return 0;
164 }
165 
167  AVBufferRef *hw_frames_ctx)
168 {
169  const H264Context *h = avctx->priv_data;
170  const SPS *sps = h->ps.sps;
171  return ff_nvdec_frame_params(avctx, hw_frames_ctx, sps->ref_frame_count + sps->num_reorder_frames, 0);
172 }
173 
175  .p.name = "h264_nvdec",
176  .p.type = AVMEDIA_TYPE_VIDEO,
177  .p.id = AV_CODEC_ID_H264,
178  .p.pix_fmt = AV_PIX_FMT_CUDA,
179  .start_frame = nvdec_h264_start_frame,
180  .end_frame = ff_nvdec_end_frame,
181  .decode_slice = nvdec_h264_decode_slice,
182  .frame_params = nvdec_h264_frame_params,
183  .init = ff_nvdec_decode_init,
184  .uninit = ff_nvdec_decode_uninit,
185  .priv_data_size = sizeof(NVDECContext),
186 };
AV_PIX_FMT_CUDA
@ AV_PIX_FMT_CUDA
HW acceleration through CUDA.
Definition: pixfmt.h:260
AVERROR
Filter design: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats is set. For video, that means pixel format. For audio, that means channel layout, sample format and sample rate. The lists are not just lists; they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions.
FFHWAccel::p
AVHWAccel p
The public AVHWAccel.
Definition: hwaccel_internal.h:38
FrameDecodeData
This struct stores per-frame lavc-internal data and is attached to it via private_ref.
Definition: decode.h:33
tmp
static uint8_t tmp[11]
Definition: aes_ctr.c:28
internal.h
PICT_BOTTOM_FIELD
#define PICT_BOTTOM_FIELD
Definition: mpegutils.h:32
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
H264SliceContext
Definition: h264dec.h:180
FFHWAccel
Definition: hwaccel_internal.h:34
ff_nvdec_start_frame
int ff_nvdec_start_frame(AVCodecContext *avctx, AVFrame *frame)
Definition: nvdec.c:561
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
av_fast_realloc
void * av_fast_realloc(void *ptr, unsigned int *size, size_t min_size)
Reallocate the given buffer if it is not large enough, otherwise do nothing.
Definition: mem.c:497
FIELD_PICTURE
#define FIELD_PICTURE(h)
Definition: h264dec.h:67
NVDECFrame
Definition: nvdec.h:44
ctx
AVFormatContext * ctx
Definition: movenc.c:49
decode.h
H264SliceContext::slice_type
int slice_type
Definition: h264dec.h:186
AV_CODEC_ID_H264
@ AV_CODEC_ID_H264
Definition: codec_id.h:79
dpb_size
int dpb_size
Definition: h264_levels.c:111
hwaccel_internal.h
ff_nvdec_decode_init
int ff_nvdec_decode_init(AVCodecContext *avctx)
Definition: nvdec.c:327
SPS
Sequence parameter set.
Definition: h264_ps.h:44
AVCodecContext::internal
struct AVCodecInternal * internal
Private context used for internal data.
Definition: avcodec.h:486
AV_PICTURE_TYPE_SI
@ AV_PICTURE_TYPE_SI
Switching Intra.
Definition: avutil.h:283
AV_PICTURE_TYPE_I
@ AV_PICTURE_TYPE_I
Intra.
Definition: avutil.h:279
PPS
Picture parameter set.
Definition: h264_ps.h:110
dpb_add
static void dpb_add(const H264Context *h, CUVIDH264DPBENTRY *dst, const H264Picture *src, int frame_idx)
Definition: nvdec_h264.c:34
AVCodecInternal::hwaccel_priv_data
void * hwaccel_priv_data
hwaccel-specific private data
Definition: internal.h:130
dst
uint8_t ptrdiff_t const uint8_t ptrdiff_t int intptr_t intptr_t int int16_t * dst
Definition: dsp.h:83
NVDECFrame::idx
unsigned int idx
Definition: nvdec.h:45
size
int size
Definition: twinvq_data.h:10344
AV_WB24
#define AV_WB24(p, d)
Definition: intreadwrite.h:446
nvdec.h
ff_nvdec_decode_uninit
int ff_nvdec_decode_uninit(AVCodecContext *avctx)
Definition: nvdec.c:259
nvdec_h264_start_frame
static int nvdec_h264_start_frame(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
Definition: nvdec_h264.c:49
nvdec_h264_frame_params
static int nvdec_h264_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
Definition: nvdec_h264.c:166
AVHWAccel::name
const char * name
Name of the hardware accelerated codec.
Definition: avcodec.h:2121
h264dec.h
H264Context
H264Context.
Definition: h264dec.h:340
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
ff_nvdec_end_frame
int ff_nvdec_end_frame(AVCodecContext *avctx)
Definition: nvdec.c:633
avcodec.h
nvdec_h264_decode_slice
static int nvdec_h264_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
Definition: nvdec_h264.c:133
ret
ret
Definition: filter_design.txt:187
sps
static int FUNC() sps(CodedBitstreamContext *ctx, RWContext *rw, H264RawSPS *current)
Definition: cbs_h264_syntax_template.c:260
AVCodecContext
main external API structure.
Definition: avcodec.h:451
buffer
The frame and frame reference mechanism is intended to avoid, as much as possible, expensive copies of that data while still allowing the filters to produce correct results. The data is stored in buffers represented by AVFrame structures. Several references can point to the same frame buffer.
Definition: filter_design.txt:49
ff_nvdec_frame_params
int ff_nvdec_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx, int dpb_size, int supports_444)
Definition: nvdec.c:695
H264Picture
Definition: h264dec.h:114
pps
uint64_t pps
Definition: dovi_rpuenc.c:35
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
mem.h
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:478
ff_h264_nvdec_hwaccel
const FFHWAccel ff_h264_nvdec_hwaccel
Definition: nvdec_h264.c:174
FrameDecodeData::hwaccel_priv
void * hwaccel_priv
Per-frame private data for hwaccels.
Definition: decode.h:51
h
h
Definition: vp9dsp_template.c:2070
NVDECContext
Definition: nvdec.h:52
src
#define src
Definition: vp8dsp.c:248