[FFmpeg-devel] [PATCH v2 2/2] lavc/vaapi_av1: Avoid sending the same slice buffer multiple times

Neal Gompa ngompa13 at gmail.com
Mon May 27 23:00:40 EEST 2024


On Wed, May 8, 2024 at 3:13 AM David Rosca <nowrep at gmail.com> wrote:
>
> When there are multiple tiles in one slice buffer, use multiple slice
> params so that the same slice buffer is not sent multiple times, which
> would increase the bitstream size the driver needs to upload to hw.
> ---
> v2: Avoid allocating on every slice.
>
>  libavcodec/vaapi_av1.c | 47 +++++++++++++++++++++++++++++-------------
>  1 file changed, 33 insertions(+), 14 deletions(-)
>
> diff --git a/libavcodec/vaapi_av1.c b/libavcodec/vaapi_av1.c
> index 4a90db1e09..4ee33a3ae3 100644
> --- a/libavcodec/vaapi_av1.c
> +++ b/libavcodec/vaapi_av1.c
> @@ -19,6 +19,7 @@
>   */
>
>  #include "libavutil/frame.h"
> +#include "libavutil/mem.h"
>  #include "hwaccel_internal.h"
>  #include "vaapi_decode.h"
>  #include "internal.h"
> @@ -42,6 +43,9 @@ typedef struct VAAPIAV1DecContext {
>      */
>      VAAPIAV1FrameRef ref_tab[AV1_NUM_REF_FRAMES];
>      AVFrame *tmp_frame;
> +
> +    int nb_slice_params;
> +    VASliceParameterBufferAV1 *slice_params;
>  } VAAPIAV1DecContext;
>
>  static VASurfaceID vaapi_av1_surface_id(AV1Frame *vf)
> @@ -97,6 +101,8 @@ static int vaapi_av1_decode_uninit(AVCodecContext *avctx)
>      for (int i = 0; i < FF_ARRAY_ELEMS(ctx->ref_tab); i++)
>          av_frame_free(&ctx->ref_tab[i].frame);
>
> +    av_freep(&ctx->slice_params);
> +
>      return ff_vaapi_decode_uninit(avctx);
>  }
>
> @@ -393,13 +399,24 @@ static int vaapi_av1_decode_slice(AVCodecContext *avctx,
>  {
>      const AV1DecContext *s = avctx->priv_data;
>      VAAPIDecodePicture *pic = s->cur_frame.hwaccel_picture_private;
> -    VASliceParameterBufferAV1 slice_param;
> -    int err = 0;
> +    VAAPIAV1DecContext *ctx = avctx->internal->hwaccel_priv_data;
> +    int err, nb_params;
> +
> +    nb_params = s->tg_end - s->tg_start + 1;
> +    if (ctx->nb_slice_params < nb_params) {
> +        ctx->slice_params = av_realloc_array(ctx->slice_params,
> +                                             nb_params,
> +                                             sizeof(*ctx->slice_params));
> +        if (!ctx->slice_params) {
> +            ctx->nb_slice_params = 0;
> +            err = AVERROR(ENOMEM);
> +            goto fail;
> +        }
> +        ctx->nb_slice_params = nb_params;
> +    }
>
>      for (int i = s->tg_start; i <= s->tg_end; i++) {
> -        memset(&slice_param, 0, sizeof(VASliceParameterBufferAV1));
> -
> -        slice_param = (VASliceParameterBufferAV1) {
> +        ctx->slice_params[i - s->tg_start] = (VASliceParameterBufferAV1) {
>              .slice_data_size   = s->tile_group_info[i].tile_size,
>              .slice_data_offset = s->tile_group_info[i].tile_offset,
>              .slice_data_flag   = VA_SLICE_DATA_FLAG_ALL,
> @@ -408,18 +425,20 @@ static int vaapi_av1_decode_slice(AVCodecContext *avctx,
>              .tg_start          = s->tg_start,
>              .tg_end            = s->tg_end,
>          };
> -
> -        err = ff_vaapi_decode_make_slice_buffer(avctx, pic, &slice_param, 1,
> -                                                sizeof(VASliceParameterBufferAV1),
> -                                                buffer,
> -                                                size);
> -        if (err) {
> -            ff_vaapi_decode_cancel(avctx, pic);
> -            return err;
> -        }
>      }
>
> +    err = ff_vaapi_decode_make_slice_buffer(avctx, pic, ctx->slice_params, nb_params,
> +                                            sizeof(VASliceParameterBufferAV1),
> +                                            buffer,
> +                                            size);
> +    if (err)
> +        goto fail;
> +
>      return 0;
> +
> +fail:
> +    ff_vaapi_decode_cancel(avctx, pic);
> +    return err;
>  }
>
>  const FFHWAccel ff_av1_vaapi_hwaccel = {
> --
> 2.45.0
>

LGTM and works fine with my AMD GPU.

Reviewed-by: Neal Gompa <ngompa13 at gmail.com>



-- 
真実はいつも一つ!/ Always, there's only one truth!


More information about the ffmpeg-devel mailing list