FFmpeg
nvdec_vp9.c
Go to the documentation of this file.
/*
 * VP9 HW decode acceleration through NVDEC
 *
 * Copyright (c) 2016 Timo Rothenpieler
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
22 
23 #include "libavutil/pixdesc.h"
24 
25 #include "avcodec.h"
26 #include "nvdec.h"
27 #include "decode.h"
28 #include "hwaccel_internal.h"
29 #include "internal.h"
30 #include "vp9shared.h"
31 
32 static int nvdec_vp9_start_frame(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
33 {
34  VP9SharedContext *h = avctx->priv_data;
35  const AVPixFmtDescriptor *pixdesc = av_pix_fmt_desc_get(avctx->sw_pix_fmt);
36 
38  CUVIDPICPARAMS *pp = &ctx->pic_params;
39  CUVIDVP9PICPARAMS *ppc = &pp->CodecSpecific.vp9;
40  FrameDecodeData *fdd;
41  NVDECFrame *cf;
42  AVFrame *cur_frame = h->frames[CUR_FRAME].tf.f;
43 
44  int ret, i;
45 
46  ret = ff_nvdec_start_frame(avctx, cur_frame);
47  if (ret < 0)
48  return ret;
49 
50  fdd = (FrameDecodeData*)cur_frame->private_ref->data;
51  cf = (NVDECFrame*)fdd->hwaccel_priv;
52 
53  *pp = (CUVIDPICPARAMS) {
54  .PicWidthInMbs = (cur_frame->width + 15) / 16,
55  .FrameHeightInMbs = (cur_frame->height + 15) / 16,
56  .CurrPicIdx = cf->idx,
57 
58  .CodecSpecific.vp9 = {
59  .width = cur_frame->width,
60  .height = cur_frame->height,
61 
62  .LastRefIdx = ff_nvdec_get_ref_idx(h->refs[h->h.refidx[0]].f),
63  .GoldenRefIdx = ff_nvdec_get_ref_idx(h->refs[h->h.refidx[1]].f),
64  .AltRefIdx = ff_nvdec_get_ref_idx(h->refs[h->h.refidx[2]].f),
65 
66  .profile = h->h.profile,
67  .frameContextIdx = h->h.framectxid,
68  .frameType = !h->h.keyframe,
69  .showFrame = !h->h.invisible,
70  .errorResilient = h->h.errorres,
71  .frameParallelDecoding = h->h.parallelmode,
72  .subSamplingX = pixdesc->log2_chroma_w,
73  .subSamplingY = pixdesc->log2_chroma_h,
74  .intraOnly = h->h.intraonly,
75  .allow_high_precision_mv = h->h.keyframe ? 0 : h->h.highprecisionmvs,
76  .refreshEntropyProbs = h->h.refreshctx,
77 
78  .bitDepthMinus8Luma = pixdesc->comp[0].depth - 8,
79  .bitDepthMinus8Chroma = pixdesc->comp[1].depth - 8,
80 
81  .loopFilterLevel = h->h.filter.level,
82  .loopFilterSharpness = h->h.filter.sharpness,
83  .modeRefLfEnabled = h->h.lf_delta.enabled,
84 
85  .log2_tile_columns = h->h.tiling.log2_tile_cols,
86  .log2_tile_rows = h->h.tiling.log2_tile_rows,
87 
88  .segmentEnabled = h->h.segmentation.enabled,
89  .segmentMapUpdate = h->h.segmentation.update_map,
90  .segmentMapTemporalUpdate = h->h.segmentation.temporal,
91  .segmentFeatureMode = h->h.segmentation.absolute_vals,
92 
93  .qpYAc = h->h.yac_qi,
94  .qpYDc = h->h.ydc_qdelta,
95  .qpChDc = h->h.uvdc_qdelta,
96  .qpChAc = h->h.uvac_qdelta,
97 
98  .resetFrameContext = h->h.resetctx,
99  .mcomp_filter_type = h->h.filtermode ^ (h->h.filtermode <= 1),
100 
101  .frameTagSize = h->h.uncompressed_header_size,
102  .offsetToDctParts = h->h.compressed_header_size,
103 
104  .refFrameSignBias[0] = 0,
105  }
106  };
107 
108  for (i = 0; i < 2; i++)
109  ppc->mbModeLfDelta[i] = h->h.lf_delta.mode[i];
110 
111  for (i = 0; i < 4; i++)
112  ppc->mbRefLfDelta[i] = h->h.lf_delta.ref[i];
113 
114  for (i = 0; i < 7; i++)
115  ppc->mb_segment_tree_probs[i] = h->h.segmentation.prob[i];
116 
117  for (i = 0; i < 3; i++) {
118  ppc->activeRefIdx[i] = h->h.refidx[i];
119  ppc->segment_pred_probs[i] = h->h.segmentation.pred_prob[i];
120  ppc->refFrameSignBias[i + 1] = h->h.signbias[i];
121  }
122 
123  for (i = 0; i < 8; i++) {
124  ppc->segmentFeatureEnable[i][0] = h->h.segmentation.feat[i].q_enabled;
125  ppc->segmentFeatureEnable[i][1] = h->h.segmentation.feat[i].lf_enabled;
126  ppc->segmentFeatureEnable[i][2] = h->h.segmentation.feat[i].ref_enabled;
127  ppc->segmentFeatureEnable[i][3] = h->h.segmentation.feat[i].skip_enabled;
128 
129  ppc->segmentFeatureData[i][0] = h->h.segmentation.feat[i].q_val;
130  ppc->segmentFeatureData[i][1] = h->h.segmentation.feat[i].lf_val;
131  ppc->segmentFeatureData[i][2] = h->h.segmentation.feat[i].ref_val;
132  ppc->segmentFeatureData[i][3] = 0;
133  }
134 
135  switch (avctx->colorspace) {
136  default:
138  ppc->colorSpace = 0;
139  break;
140  case AVCOL_SPC_BT470BG:
141  ppc->colorSpace = 1;
142  break;
143  case AVCOL_SPC_BT709:
144  ppc->colorSpace = 2;
145  break;
146  case AVCOL_SPC_SMPTE170M:
147  ppc->colorSpace = 3;
148  break;
149  case AVCOL_SPC_SMPTE240M:
150  ppc->colorSpace = 4;
151  break;
153  ppc->colorSpace = 5;
154  break;
155  case AVCOL_SPC_RESERVED:
156  ppc->colorSpace = 6;
157  break;
158  case AVCOL_SPC_RGB:
159  ppc->colorSpace = 7;
160  break;
161  }
162 
163  return 0;
164 }
165 
167  AVBufferRef *hw_frames_ctx)
168 {
169  // VP9 uses a fixed size pool of 8 possible reference frames
170  return ff_nvdec_frame_params(avctx, hw_frames_ctx, 8, 0);
171 }
172 
174  .p.name = "vp9_nvdec",
175  .p.type = AVMEDIA_TYPE_VIDEO,
176  .p.id = AV_CODEC_ID_VP9,
177  .p.pix_fmt = AV_PIX_FMT_CUDA,
178  .start_frame = nvdec_vp9_start_frame,
179  .end_frame = ff_nvdec_simple_end_frame,
180  .decode_slice = ff_nvdec_simple_decode_slice,
181  .frame_params = nvdec_vp9_frame_params,
182  .init = ff_nvdec_decode_init,
183  .uninit = ff_nvdec_decode_uninit,
184  .priv_data_size = sizeof(NVDECContext),
185 };
AV_PIX_FMT_CUDA
@ AV_PIX_FMT_CUDA
HW acceleration through CUDA.
Definition: pixfmt.h:253
AVCodecContext::colorspace
enum AVColorSpace colorspace
YUV colorspace type.
Definition: avcodec.h:1029
nvdec_vp9_start_frame
static int nvdec_vp9_start_frame(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
Definition: nvdec_vp9.c:32
av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2964
AVBufferRef::data
uint8_t * data
The data buffer.
Definition: buffer.h:90
ff_nvdec_get_ref_idx
int ff_nvdec_get_ref_idx(AVFrame *frame)
Definition: nvdec.c:747
FFHWAccel::p
AVHWAccel p
The public AVHWAccel.
Definition: hwaccel_internal.h:38
FrameDecodeData
This struct stores per-frame lavc-internal data and is attached to it via private_ref.
Definition: decode.h:33
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:340
pixdesc.h
AVFrame::width
int width
Definition: frame.h:412
internal.h
AVComponentDescriptor::depth
int depth
Number of bits in the component.
Definition: pixdesc.h:57
AVCOL_SPC_RGB
@ AVCOL_SPC_RGB
order of coefficients is actually GBR, also IEC 61966-2-1 (sRGB), YZX and ST 428-1
Definition: pixfmt.h:600
AVCOL_SPC_BT470BG
@ AVCOL_SPC_BT470BG
also ITU-R BT601-6 625 / ITU-R BT1358 625 / ITU-R BT1700 625 PAL & SECAM / IEC 61966-2-4 xvYCC601
Definition: pixfmt.h:605
AVCOL_SPC_RESERVED
@ AVCOL_SPC_RESERVED
reserved for future use by ITU-T and ISO/IEC just like 15-255 are
Definition: pixfmt.h:603
FFHWAccel
Definition: hwaccel_internal.h:34
ff_nvdec_start_frame
int ff_nvdec_start_frame(AVCodecContext *avctx, AVFrame *frame)
Definition: nvdec.c:561
vp9shared.h
VP9SharedContext
Definition: vp9shared.h:164
AVCOL_SPC_SMPTE170M
@ AVCOL_SPC_SMPTE170M
also ITU-R BT601-6 525 / ITU-R BT1358 525 / ITU-R BT1700 NTSC / functionally identical to above
Definition: pixfmt.h:606
AV_CODEC_ID_VP9
@ AV_CODEC_ID_VP9
Definition: codec_id.h:220
NVDECFrame
Definition: nvdec.h:44
ctx
AVFormatContext * ctx
Definition: movenc.c:48
decode.h
AVPixFmtDescriptor::log2_chroma_w
uint8_t log2_chroma_w
Amount to shift the luma width right to find the chroma width.
Definition: pixdesc.h:80
ff_nvdec_simple_end_frame
int ff_nvdec_simple_end_frame(AVCodecContext *avctx)
Definition: nvdec.c:663
hwaccel_internal.h
ff_nvdec_decode_init
int ff_nvdec_decode_init(AVCodecContext *avctx)
Definition: nvdec.c:325
AVCodecContext::internal
struct AVCodecInternal * internal
Private context used for internal data.
Definition: avcodec.h:476
nvdec_vp9_frame_params
static int nvdec_vp9_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx)
Definition: nvdec_vp9.c:166
AVCodecInternal::hwaccel_priv_data
void * hwaccel_priv_data
hwaccel-specific private data
Definition: internal.h:124
for
for(k=2;k<=8;++k)
Definition: h264pred_template.c:425
NVDECFrame::idx
unsigned int idx
Definition: nvdec.h:45
size
int size
Definition: twinvq_data.h:10344
nvdec.h
ff_nvdec_decode_uninit
int ff_nvdec_decode_uninit(AVCodecContext *avctx)
Definition: nvdec.c:257
AVFrame::private_ref
AVBufferRef * private_ref
AVBufferRef for internal use by a single libav* library.
Definition: frame.h:797
AVHWAccel::name
const char * name
Name of the hardware accelerated codec.
Definition: avcodec.h:2135
AVCOL_SPC_SMPTE240M
@ AVCOL_SPC_SMPTE240M
derived from 170M primaries and D65 white point, 170M is derived from BT470 System M's primaries
Definition: pixfmt.h:607
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AVCOL_SPC_BT2020_NCL
@ AVCOL_SPC_BT2020_NCL
ITU-R BT2020 non-constant luminance system.
Definition: pixfmt.h:610
AVCOL_SPC_UNSPECIFIED
@ AVCOL_SPC_UNSPECIFIED
Definition: pixfmt.h:602
avcodec.h
ret
ret
Definition: filter_design.txt:187
AVCodecContext
main external API structure.
Definition: avcodec.h:441
AVFrame::height
int height
Definition: frame.h:412
ff_nvdec_simple_decode_slice
int ff_nvdec_simple_decode_slice(AVCodecContext *avctx, const uint8_t *buffer, uint32_t size)
Definition: nvdec.c:673
buffer
The frame and frame reference mechanism is intended to avoid, as much as possible, expensive copies of that data while still allowing the filters to produce correct results. The data is stored in buffers represented by AVFrame structures. Several references can point to the same frame buffer.
Definition: filter_design.txt:49
ff_nvdec_frame_params
int ff_nvdec_frame_params(AVCodecContext *avctx, AVBufferRef *hw_frames_ctx, int dpb_size, int supports_444)
Definition: nvdec.c:695
AVPixFmtDescriptor::comp
AVComponentDescriptor comp[4]
Parameters that describe how pixels are packed.
Definition: pixdesc.h:105
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
CUR_FRAME
#define CUR_FRAME
Definition: vp9shared.h:168
AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:69
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:468
FrameDecodeData::hwaccel_priv
void * hwaccel_priv
Per-frame private data for hwaccels.
Definition: decode.h:51
h
h
Definition: vp9dsp_template.c:2038
AVCodecContext::sw_pix_fmt
enum AVPixelFormat sw_pix_fmt
Nominal unaccelerated pixel format, see AV_PIX_FMT_xxx.
Definition: avcodec.h:1810
NVDECContext
Definition: nvdec.h:52
AVCOL_SPC_BT709
@ AVCOL_SPC_BT709
also ITU-R BT1361 / IEC 61966-2-4 xvYCC709 / derived in SMPTE RP 177 Annex B
Definition: pixfmt.h:601
AVPixFmtDescriptor::log2_chroma_h
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
Definition: pixdesc.h:89
ff_vp9_nvdec_hwaccel
const FFHWAccel ff_vp9_nvdec_hwaccel
Definition: nvdec_vp9.c:173