[FFmpeg-devel] [PATCH 2/2] add libyami.cpp for h264 decoding by libyami

Fri Jan 9 09:15:13 CET 2015

From: "Zhao, Halley" <halley.zhao at intel.com>

- multi-threaded decoding is not supported; it is unnecessary for hw
  decoding
- create a decode thread that interfaces with the yami decoder, decoupling
  frame input from frame output
- the output frame type (raw data | drm handle | dmabuf) is specified
  in avctx->coder_type during init
- the yami frame is assigned to AVFrame->buf[0] and yami_recycle_frame()
  is registered as the AVBufferRef free callback, so the frame is recycled
  when the AVFrame/AVBufferRef is unref'ed.
---
 libavcodec/libyami.cpp | 386 +++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 386 insertions(+)
 create mode 100644 libavcodec/libyami.cpp

diff --git a/libavcodec/libyami.cpp b/libavcodec/libyami.cpp
new file mode 100644
index 0000000..e944cde
--- /dev/null
+++ b/libavcodec/libyami.cpp
@@ -0,0 +1,386 @@
+/*
+ * libyami.cpp -- h264 decoder uses libyami
+ *
+ *  Copyright (C) 2014 Intel Corporation
+ *    Author: Zhao Halley<halley.zhao at intel.com>
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include <pthread.h>
+#include <unistd.h>
+#include <assert.h>
+#include <deque>
+extern "C" {
+#include "avcodec.h"
+#include "libavutil/imgutils.h"
+#include "internal.h"
+}
+#include "VideoDecoderHost.h"
+
+using namespace YamiMediaCodec;
+#ifndef VA_FOURCC_I420
+#define VA_FOURCC_I420 VA_FOURCC('I','4','2','0')
+#endif
+#define PRINT_DECODE_THREAD(format, ...)  av_log(avctx, AV_LOG_VERBOSE, "## decode thread ## line:%4d " format, __LINE__, ##__VA_ARGS__) /* verbose log helper; expects a variable named avctx in scope at the call site */
+
+typedef enum { // life-cycle state of the decode thread, kept in YamiContext::decode_status
+    DECODE_THREAD_NOT_INIT = 0, // initial value from yami_init(); yami_decode_frame() also resets GOT_EOS to it
+    DECODE_THREAD_RUNING,       // set by yami_decode_frame() right before it creates the decode thread
+    DECODE_THREAD_GOT_EOS,      // set on an empty packet while RUNING, and by yami_close(); decodeThread() leaves its loop on it once the queue is empty
+    DECODE_THREAD_EXIT,         // set by decodeThread() just before it returns
+} DecodeThreadStatus;
+
+struct YamiContext { // private decoder state, reached through avctx->priv_data
+    AVCodecContext *avctx; // NOTE(review): not assigned or read anywhere in the code shown here
+    pthread_mutex_t mutex_; // mutex for decoder->getOutput() and YamiContext itself update (decode_status, etc)
+
+    IVideoDecoder *decoder; // created in yami_init(), stopped and released in yami_close()
+    VideoDataMemoryType output_type; // chosen from avctx->coder_type in yami_init()
+    const VideoFormatInfo *format_info; // set by decodeThread() on DECODE_FORMAT_CHANGE; tested against NULL by yami_decode_frame()
+    pthread_t decode_thread_id; // written by pthread_create() in yami_decode_frame()
+    std::deque<VideoDecodeBuffer*> *in_queue; // buffers pushed by yami_decode_frame() and popped by decodeThread()
+    pthread_mutex_t in_mutex; // mutex for in_queue
+    pthread_cond_t in_cond;   // decode thread condition wait
+    DecodeThreadStatus decode_status; // life-cycle state of the decode thread
+
+    // debug use
+    int decode_count; // incremented once per yami_decode_frame() call
+    int decode_count_yami; // incremented by decodeThread() per processed buffer
+    int render_count; // incremented per frame returned by yami_decode_frame()
+};
+
+/* Create and start the libyami H.264 decoder and initialise the shared decoding state.
+ * Returns 0 on success or a negative AVERROR code; nothing stays allocated on failure. */
+static av_cold int yami_init(AVCodecContext *avctx)
+{
+    YamiContext *s = (YamiContext*)avctx->priv_data;
+    av_log(avctx, AV_LOG_VERBOSE, "yami_init\n");
+    // validate the requested output type first, so that a bad value needs no cleanup
+    switch (avctx->coder_type) {
+    case 0:
+        s->output_type = VIDEO_DATA_MEMORY_TYPE_RAW_POINTER;
+        break;
+    case 1:
+        s->output_type = VIDEO_DATA_MEMORY_TYPE_DRM_NAME;
+        break;
+    case 2:
+        s->output_type = VIDEO_DATA_MEMORY_TYPE_DMA_BUF;
+        break;
+    default:
+        av_log(avctx, AV_LOG_ERROR, "unknown output frame type: %d\n", avctx->coder_type);
+        return AVERROR(EINVAL);
+    }
+
+    s->decoder = createVideoDecoder("video/h264");
+    if (!s->decoder) {
+        av_log(avctx, AV_LOG_ERROR, "fail to create libyami h264 decoder\n");
+        return AVERROR_EXTERNAL;
+    }
+
+    NativeDisplay native_display;
+    native_display.type = NATIVE_DISPLAY_DRM;
+    native_display.handle = 0;
+    s->decoder->setNativeDisplay(&native_display);
+
+    VideoConfigBuffer config_buffer;
+    memset(&config_buffer, 0, sizeof(config_buffer));
+    if (avctx->extradata && avctx->extradata_size && avctx->extradata[0] == 1) {
+        config_buffer.data = avctx->extradata;
+        config_buffer.size = avctx->extradata_size;
+    }
+    config_buffer.profile = VAProfileNone;
+    if (s->decoder->start(&config_buffer) != DECODE_SUCCESS) {
+        av_log(avctx, AV_LOG_ERROR, "yami h264 decoder fail to start\n");
+        releaseVideoDecoder(s->decoder); // do not leak the decoder created above
+        s->decoder = NULL;
+        return AVERROR_EXTERNAL;
+    }
+
+    s->in_queue = new std::deque<VideoDecodeBuffer*>;
+    pthread_mutex_init(&s->mutex_, NULL);
+    pthread_mutex_init(&s->in_mutex, NULL);
+    pthread_cond_init(&s->in_cond, NULL);
+    s->decode_status = DECODE_THREAD_NOT_INIT;
+    s->format_info = NULL; // no format reported yet; yami_decode_frame() tests this against NULL
+    s->decode_count = s->decode_count_yami = s->render_count = 0;
+    return 0;
+}
+
+/* Decode-thread entry point (arg is the AVCodecContext): feeds the buffers queued by
+ * yami_decode_frame() to the yami decoder until the queue is empty and the status is
+ * DECODE_THREAD_GOT_EOS, then sets DECODE_THREAD_EXIT and returns NULL. */
+static void* decodeThread(void *arg)
+{
+    AVCodecContext *avctx = (AVCodecContext*)arg;
+    YamiContext *s = (YamiContext*)avctx->priv_data;
+
+    while (1) {
+        VideoDecodeBuffer *in_buffer = NULL;
+        // deque one input buffer
+        PRINT_DECODE_THREAD("decode thread runs one cycle start ... \n");
+        pthread_mutex_lock(&s->in_mutex);
+            if (s->in_queue->empty()) {
+                if (s->decode_status == DECODE_THREAD_GOT_EOS) {
+                    pthread_mutex_unlock(&s->in_mutex);
+                    break;
+                }
+                PRINT_DECODE_THREAD("decode thread wait because s->in_queue is empty\n");
+                pthread_cond_wait(&s->in_cond, &s->in_mutex); // wait if no todo frame is available
+            }
+            if (s->in_queue->empty()) { // may wake up from EOS/Close (or spuriously): re-check from the top
+                pthread_mutex_unlock(&s->in_mutex);
+                continue;
+            }
+            PRINT_DECODE_THREAD("s->in_queue->size()=%d\n", (int)s->in_queue->size()); // size_t does not match "%ld" everywhere; at most 4 entries are queued
+            in_buffer = s->in_queue->front();
+            s->in_queue->pop_front();
+        pthread_mutex_unlock(&s->in_mutex);
+        // decode one input buffer
+        PRINT_DECODE_THREAD("try to process one input buffer, in_buffer->data=%p, in_buffer->size=%d\n", in_buffer->data, in_buffer->size);
+        Decode_Status status = s->decoder->decode(in_buffer);
+        PRINT_DECODE_THREAD("decode() status=%d, decode_count_yami=%d\n", status, s->decode_count_yami);
+        if (DECODE_FORMAT_CHANGE == status) {
+            const VideoFormatInfo *info = s->decoder->getFormatInfo();
+            PRINT_DECODE_THREAD("decode format change %dx%d\n", info->width, info->height);
+            // update avctx first, publish format_info last: yami_decode_frame() gates on format_info, then uses avctx->width/height
+            avctx->width = info->width;
+            avctx->height = info->height;
+            avctx->pix_fmt = AV_PIX_FMT_YUV420P;
+            s->format_info = info;
+            // resend the buffer
+            status = s->decoder->decode(in_buffer);
+            PRINT_DECODE_THREAD("decode() status=%d\n",status);
+        }
+        s->decode_count_yami++;
+        av_free(in_buffer);
+    }
+
+    PRINT_DECODE_THREAD("decode thread exit\n");
+    pthread_mutex_lock(&s->mutex_);
+    s->decode_status = DECODE_THREAD_EXIT;
+    pthread_mutex_unlock(&s->mutex_);
+    return NULL;
+}
+
+/* AVBufferRef free callback: returns the yami frame in data to the decoder, then frees it. */
+static void yami_recycle_frame(void *opaque, uint8_t *data)
+{
+    AVCodecContext *avctx = (AVCodecContext*)opaque;
+    YamiContext *s = (YamiContext*)avctx->priv_data;
+    if (s->decoder) { // XXX, use shared pointer for s
+        pthread_mutex_lock(&s->mutex_);
+        s->decoder->renderDone((VideoFrameRawData*)data);
+        pthread_mutex_unlock(&s->mutex_);
+        av_log(avctx, AV_LOG_DEBUG, "recycle previous frame: %p\n", data);
+    }
+    av_free(data); // the descriptor was allocated by yami_decode_frame() and nothing else frees it
+}
+
+/* Queue avpkt for the decode thread (an empty packet signals EOS) and try to fetch one
+ * decoded frame into data; *got_frame is set to 1 only when data was filled.
+ * Returns avpkt->size, or a negative AVERROR code on failure. */
+static int yami_decode_frame(AVCodecContext *avctx, void *data /* output frame */,
+                                    int *got_frame, AVPacket *avpkt /* input compressed data*/)
+{
+    YamiContext *s = (YamiContext*)avctx->priv_data;
+    Decode_Status status = RENDER_NO_AVAILABLE_FRAME;
+    AVFrame  *frame = (AVFrame*)data;
+    const int zero_copy = s->output_type == VIDEO_DATA_MEMORY_TYPE_DRM_NAME || s->output_type == VIDEO_DATA_MEMORY_TYPE_DMA_BUF;
+    int queued = 0, queue_size = 0;
+
+    av_log(avctx, AV_LOG_VERBOSE, "yami_decode_frame\n");
+    *got_frame = 0;
+    // The decode thread reads the buffer after this call has returned, when the caller may already have
+    // released avpkt: copy the payload right behind the descriptor so that one av_free() releases both.
+    VideoDecodeBuffer *in_buffer = (VideoDecodeBuffer*)av_mallocz(sizeof(*in_buffer) + FFMAX(avpkt->size, 0) + FF_INPUT_BUFFER_PADDING_SIZE);
+    if (!in_buffer)
+        return AVERROR(ENOMEM);
+    if (avpkt->data && avpkt->size > 0) {
+        in_buffer->data = (uint8_t*)(in_buffer + 1);
+        memcpy(in_buffer->data, avpkt->data, avpkt->size);
+        in_buffer->size = avpkt->size;
+    }
+    in_buffer->timeStamp = avpkt->pts;
+    while (s->decode_status < DECODE_THREAD_GOT_EOS) { // we need enque eos buffer more than once
+        pthread_mutex_lock(&s->in_mutex);
+        queue_size = (int)s->in_queue->size(); // sampled under the lock, also for the log below
+        if (queue_size < 4) {
+            s->in_queue->push_back(in_buffer);
+            queued = 1;
+            av_log(avctx, AV_LOG_VERBOSE, "wakeup decode thread ...\n");
+            pthread_cond_signal(&s->in_cond);
+        }
+        pthread_mutex_unlock(&s->in_mutex);
+        if (queued)
+            break;
+        av_log(avctx, AV_LOG_DEBUG, "s->in_queue->size()=%d, s->decode_count=%d, s->decode_count_yami=%d, too many buffer are under decoding, wait ...\n",
+               queue_size, s->decode_count, s->decode_count_yami);
+        usleep(10000);
+    }
+    if (!queued)
+        av_free(in_buffer); // never handed to the decode thread, so it is still owned here
+    s->decode_count++;
+
+    // decode thread status update
+    pthread_mutex_lock(&s->mutex_);
+    switch (s->decode_status) {
+    case DECODE_THREAD_NOT_INIT:
+    case DECODE_THREAD_EXIT:
+        if (avpkt->data && avpkt->size) {
+            s->decode_status = DECODE_THREAD_RUNING;
+            pthread_create(&s->decode_thread_id, NULL, &decodeThread, avctx); // NOTE(review): the result is not checked
+        }
+        break;
+    case DECODE_THREAD_RUNING:
+        if (!avpkt->data || ! avpkt->size)
+            s->decode_status = DECODE_THREAD_GOT_EOS; // call releaseLock for seek
+        break;
+    case DECODE_THREAD_GOT_EOS:
+        s->decode_status = DECODE_THREAD_NOT_INIT;
+        break;
+    default:
+        break;
+    }
+    pthread_mutex_unlock(&s->mutex_);
+
+    // get an output buffer from yami; the descriptor is freed on every path that returns no frame
+    VideoFrameRawData *yami_frame = (VideoFrameRawData*)av_mallocz(sizeof(*yami_frame));
+    if (!yami_frame)
+        return AVERROR(ENOMEM);
+    do {
+        if (!s->format_info) { // NOTE(review): keeps polling while RUNING until the decode thread reports a format
+            usleep(10000);
+            continue;
+        }
+        yami_frame->memoryType = s->output_type;
+        yami_frame->fourcc = zero_copy ? VA_FOURCC_BGRX : VA_FOURCC_I420;
+        yami_frame->width = s->format_info->width;
+        yami_frame->height = s->format_info->height;
+        pthread_mutex_lock(&s->mutex_);
+        status = s->decoder->getOutput(yami_frame); // do not use draining flag here, both draining here and in decode thread will cause race condition
+        pthread_mutex_unlock(&s->mutex_);
+        av_log(avctx, AV_LOG_DEBUG, "getoutput() status=%d\n",status);
+        if (status == RENDER_SUCCESS)
+            break;
+        if (s->decode_status != DECODE_THREAD_GOT_EOS) {
+            av_free(yami_frame);
+            return avpkt->size;
+        }
+        usleep(10000);
+    } while (s->decode_status == DECODE_THREAD_RUNING);
+    if (status != RENDER_SUCCESS) {
+        av_log(avctx, AV_LOG_VERBOSE, "after processed EOS, return\n");
+        av_free(yami_frame);
+        return avpkt->size;
+    }
+
+    // wrap the frame: from here on, unref'ing yami_ref hands it back through yami_recycle_frame()
+    AVBufferRef *yami_ref = av_buffer_create((uint8_t*)yami_frame, sizeof(*yami_frame), yami_recycle_frame, avctx, 0);
+    if (!yami_ref) {
+        pthread_mutex_lock(&s->mutex_);
+        s->decoder->renderDone(yami_frame);
+        pthread_mutex_unlock(&s->mutex_);
+        av_free(yami_frame);
+        return AVERROR(ENOMEM);
+    }
+    if (zero_copy) {
+        // expose handle and pitch; the yami frame stays checked out until buf[0] is unref'ed
+        frame->data[0] = (uint8_t*)yami_frame->handle;
+        frame->data[1] = (uint8_t*)(uintptr_t)yami_frame->pitch[0];
+        frame->extended_data = frame->data;
+        frame->buf[0] = yami_ref;
+    } else {
+        // copy the planes into a buffer owned by frame, then give the yami frame back right away
+        const uint8_t *yamidata = reinterpret_cast<const uint8_t*>(yami_frame->handle);
+        const uint8_t *src_data[4] = { yamidata + yami_frame->offset[0], yamidata + yami_frame->offset[1], yamidata + yami_frame->offset[2], NULL };
+        int src_linesize[4] = { (int)yami_frame->pitch[0], (int)yami_frame->pitch[1], (int)yami_frame->pitch[2], 0 };
+        int ret = ff_get_buffer(avctx, frame, AV_GET_BUFFER_FLAG_REF);
+        if (ret >= 0) {
+            frame->pts = yami_frame->timeStamp;
+            frame->key_frame = yami_frame->flags & IS_SYNC_FRAME;
+            av_image_copy(frame->data, frame->linesize, src_data, src_linesize, avctx->pix_fmt, avctx->width, avctx->height);
+        }
+        av_buffer_unref(&yami_ref);
+        if (ret < 0)
+            return ret;
+    }
+    *got_frame = 1;
+    s->render_count++;
+    av_log(avctx, AV_LOG_VERBOSE, "decode_count_yami=%d, decode_count=%d, render_count=%d\n", s->decode_count_yami, s->decode_count, s->render_count);
+    return avpkt->size;
+}
+
+/* Stop the decode thread if one exists, then release the decoder, the queue and the locks. Returns 0. */
+static av_cold int yami_close(AVCodecContext *avctx)
+{
+    YamiContext *s = (YamiContext*)avctx->priv_data;
+    // wait decode thread exit -- but only when one can exist: NOT_INIT with no format ever reported means
+    // that none was created (yami_decode_frame() polls until format_info is set after starting a thread)
+    pthread_mutex_lock(&s->mutex_);
+    while ((s->decode_status != DECODE_THREAD_NOT_INIT || s->format_info) && s->decode_status != DECODE_THREAD_EXIT) {
+        s->decode_status = DECODE_THREAD_GOT_EOS; // potential race condition on s->decode_status
+        pthread_mutex_unlock(&s->mutex_);
+        pthread_cond_signal(&s->in_cond);
+        usleep(10000);
+        pthread_mutex_lock(&s->mutex_);
+    }
+    pthread_mutex_unlock(&s->mutex_);
+    if (s->decoder) {
+        s->decoder->stop();
+        releaseVideoDecoder(s->decoder);
+        s->decoder = NULL;
+    }
+    for (; !s->in_queue->empty(); s->in_queue->pop_front())
+        av_free(s->in_queue->front()); // buffers still queued were never handed to the decoder
+    pthread_mutex_destroy(&s->mutex_); // initialised in yami_init() like the two objects below
+    pthread_mutex_destroy(&s->in_mutex);
+    pthread_cond_destroy(&s->in_cond);
+    delete s->in_queue;
+    av_log(avctx, AV_LOG_VERBOSE, "yami_close\n");
+    return 0;
+}
+
+AVCodec ff_libyami_h264_decoder = { // codec descriptor wiring the yami_* callbacks of this file; NOTE(review): designated initializers in C++ depend on compiler support -- confirm
+    .name                   = "libyami_h264",
+    .long_name              = NULL_IF_CONFIG_SMALL("libyami H.264"),
+    .type                   = AVMEDIA_TYPE_VIDEO,
+    .id                     = AV_CODEC_ID_H264,
+    .capabilities           = CODEC_CAP_DELAY, // it is not necessary to support multi-threads
+    .supported_framerates   = NULL,
+    .pix_fmts               = NULL, // no list advertised; decodeThread() sets avctx->pix_fmt to AV_PIX_FMT_YUV420P
+    .supported_samplerates  = NULL,
+    .sample_fmts            = NULL,
+    .channel_layouts        = NULL,
+#if FF_API_LOWRES
+    .max_lowres             = 0,
+#endif
+    .priv_class             = NULL,
+    .profiles               = NULL,
+    .priv_data_size         = sizeof(YamiContext), // the yami_* callbacks cast avctx->priv_data to YamiContext
+    .next                   = NULL,
+    .init_thread_copy       = NULL,
+    .update_thread_context  = NULL,
+    .defaults               = NULL,
+    .init_static_data       = NULL,
+    .init                   = yami_init, // creates and starts the yami decoder
+    .encode_sub             = NULL,
+    .encode2                = NULL,
+    .decode                 = yami_decode_frame, // queues one packet and returns at most one frame
+    .close                  = yami_close, // stops the decode thread and releases the decoder
+    .flush                  = NULL, // TODO, add it
+};
-- 
1.8.3.2