/* doxygen/trunk/zmbvenc_8c_source.html */

/*

 * Zip Motion Blocks Video (ZMBV) encoder

 * Copyright (c) 2006 Konstantin Shishkov

 *

 * This file is part of FFmpeg.

 *

 * FFmpeg is free software; you can redistribute it and/or

 * modify it under the terms of the GNU Lesser General Public

 * License as published by the Free Software Foundation; either

 * version 2.1 of the License, or (at your option) any later version.

 *

 * FFmpeg is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

 * Lesser General Public License for more details.

 *

 * You should have received a copy of the GNU Lesser General Public

 * License along with FFmpeg; if not, write to the Free Software

 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

 */


/**

 * @file

 * Zip Motion Blocks Video encoder

 */


#include <stddef.h>


#include "libavutil/intreadwrite.h"

#include "libavutil/mem.h"

#include "avcodec.h"

#include "codec_internal.h"

#include "encode.h"

#include "zlib_wrapper.h"


#include <zlib.h>


/* Frame header flags */

#define ZMBV_KEYFRAME 1

#define ZMBV_DELTAPAL 2


/* Motion block width/height (maximum allowed value is 255)

 * Note: histogram datatype in block_cmp() must be big enough to hold values

 * up to (4 * ZMBV_BLOCK * ZMBV_BLOCK)

 */

#define ZMBV_BLOCK 16


/*
 * Pixel format codes stored in the "format" byte of a keyframe header.
 * The numeric values are written to the bitstream, so they are spelled
 * out explicitly.  encode_init() in this file only ever selects the
 * 8, 15, 16, 24 and 32 bpp codes.
 */
enum ZmbvFormat {
    ZMBV_FMT_NONE  = 0, /* no format */
    ZMBV_FMT_1BPP  = 1, /* not selected by this encoder */
    ZMBV_FMT_2BPP  = 2, /* not selected by this encoder */
    ZMBV_FMT_4BPP  = 3, /* not selected by this encoder */
    ZMBV_FMT_8BPP  = 4, /* AV_PIX_FMT_PAL8, 1 byte per pixel */
    ZMBV_FMT_15BPP = 5, /* AV_PIX_FMT_RGB555LE, 2 bytes per pixel */
    ZMBV_FMT_16BPP = 6, /* AV_PIX_FMT_RGB565LE, 2 bytes per pixel */
    ZMBV_FMT_24BPP = 7, /* AV_PIX_FMT_BGR24, 3 bytes per pixel (only with ZMBV_ENABLE_24BPP) */
    ZMBV_FMT_32BPP = 8, /* AV_PIX_FMT_BGR0, 4 bytes per pixel */
};


/**
 * Private state of the ZMBV encoder (lives in AVCodecContext.priv_data).
 */
typedef struct ZmbvEncContext {
    AVCodecContext *avctx;  ///< codec context this state belongs to (set in encode_init())

    int lrange;             ///< motion search extent in the negative direction
    int urange;             ///< motion search extent in the positive direction
    uint8_t *comp_buf;      ///< output buffer for deflate
    uint8_t *work_buf;      ///< uncompressed frame payload that is fed to deflate
    uint8_t pal[768];       ///< current palette as 256 three-byte entries
    uint32_t pal2[256];     ///< copy of the input frame's 32-bit palette, for quick comparisons
    uint8_t *prev;          ///< first pixel of the previous frame, inside prev_buf
    uint8_t *prev_buf;      ///< padded allocation that backs prev
    int pstride;            ///< line size of the previous-frame buffer in bytes
    int comp_size;          ///< size of comp_buf in bytes
    int keyint;             ///< keyframe interval, taken from AVCodecContext.keyint_min
    int curfrm;             ///< frame counter inside the interval; 0 makes the next frame a keyframe
    int bypp;               ///< bytes per pixel of the input format
    enum ZmbvFormat fmt;    ///< format code written into keyframe headers
    FFZStream zstream;      ///< zlib deflate state

    /** Entropy score for every possible histogram count, see block_cmp() */
    int score_tab[ZMBV_BLOCK * ZMBV_BLOCK * 4 + 1];
} ZmbvEncContext;


/**
 * Score how well one block predicts another.
 *
 * A histogram of the byte-wise XOR of both blocks is built and the
 * per-count entries of c->score_tab are summed up; lower is better.
 * XXX should be optimized and moved to DSPContext
 *
 * @param c       encoder context (provides bypp and score_tab)
 * @param src     top-left byte of the first block
 * @param stride  line size of the first block's buffer, in bytes
 * @param src2    top-left byte of the second block
 * @param stride2 line size of the second block's buffer, in bytes
 * @param bw      block width in pixels
 * @param bh      block height in rows
 * @param xored   set to 0 if both blocks are identical, to 1 otherwise
 * @return 0 for identical blocks, otherwise the summed score
 */
static inline int block_cmp(ZmbvEncContext *c, const uint8_t *src, int stride,
                            const uint8_t *src2, int stride2, int bw, int bh,
                            int *xored)
{
    /* A counter never exceeds 4 * ZMBV_BLOCK * ZMBV_BLOCK, so 16 bits suffice */
    uint16_t counts[256] = {0};
    const int row_bytes = bw * c->bypp;
    int row, col, value;
    int differs;
    int score = 0;

    /* Count how often each byte value occurs in src[] ^ src2[] */
    for (row = 0; row < bh; row++) {
        for (col = 0; col < row_bytes; col++)
            counts[src[col] ^ src2[col]]++;
        src  += stride;
        src2 += stride2;
    }

    /* Any nonzero XOR byte means that the blocks are not the same */
    differs = counts[0] < row_bytes * bh;
    *xored  = differs;
    if (!differs)
        return 0;

    /* Accumulate the entropy contribution of every byte value */
    for (value = 0; value < 256; value++)
        score += c->score_tab[counts[value]];

    return score;
}


/**
 * Pick a motion vector for one block by exhaustive search.
 *
 * Candidates are tried in this order: the zero vector, the vector passed
 * in through mx/my, then every offset from -lrange to urange in both
 * directions, row by row.  A candidate only replaces the current choice if
 * its block_cmp() score is strictly lower; the search stops as soon as a
 * score of 0 is reached.
 * TODO make better ME decisions
 *
 * @param c       encoder context
 * @param src     top-left byte of the block in the current frame
 * @param sstride line size of the current frame, in bytes
 * @param prev    byte at the same position in the previous frame; the buffer
 *                must be readable for every offset inside the search range
 * @param pstride line size of the previous frame buffer, in bytes
 * @param x       block column in pixels, used to clip the block width
 * @param y       block row in pixels, used to clip the block height
 * @param mx      in: horizontal vector of the preceding block,
 *                out: chosen horizontal vector
 * @param my      in: vertical vector of the preceding block,
 *                out: chosen vertical vector
 * @param xored   out: nonzero if the chosen prediction is not exact
 * @return score of the chosen candidate (0 is the best possible)
 */
static int zmbv_me(ZmbvEncContext *c, const uint8_t *src, int sstride, const uint8_t *prev,
                   int pstride, int x, int y, int *mx, int *my, int *xored)
{
    const int pred_x = *mx;
    const int pred_y = *my;
    const int blk_w  = FFMIN(ZMBV_BLOCK, c->avctx->width - x);
    const int blk_h  = FFMIN(ZMBV_BLOCK, c->avctx->height - y);
    const uint8_t *ref;
    int best, cand, cand_xored;
    int off_x, off_y;

    /* Zero vector first */
    best = block_cmp(c, src, sstride, prev, pstride, blk_w, blk_h, xored);
    *mx = 0;
    *my = 0;
    if (best == 0)
        return 0;

    /* Then the vector of the preceding block, unless it is the zero vector */
    if (pred_x != 0 || pred_y != 0) {
        ref  = prev + pred_x * c->bypp + pred_y * pstride;
        cand = block_cmp(c, src, sstride, ref, pstride, blk_w, blk_h, &cand_xored);
        if (cand < best) {
            best   = cand;
            *mx    = pred_x;
            *my    = pred_y;
            *xored = cand_xored;
            if (best == 0)
                return 0;
        }
    }

    /* Finally every remaining offset, top-to-bottom, left-to-right */
    for (off_y = -c->lrange; off_y <= c->urange; off_y++) {
        for (off_x = -c->lrange; off_x <= c->urange; off_x++) {
            if (off_x == 0 && off_y == 0)
                continue; /* zero vector was scored above */
            if (off_x == pred_x && off_y == pred_y)
                continue; /* so was the preceding block's vector */

            ref  = prev + off_x * c->bypp + off_y * pstride;
            cand = block_cmp(c, src, sstride, ref, pstride, blk_w, blk_h, &cand_xored);
            if (cand >= best)
                continue;

            best   = cand;
            *mx    = off_x;
            *my    = off_y;
            *xored = cand_xored;
            if (best == 0)
                return 0;
        }
    }

    return best;
}


/**
 * Encode one frame into a ZMBV packet.
 *
 * Uncompressed payload assembled in c->work_buf:
 *  - keyframe: for PAL8 the 768-byte palette, then all image rows;
 *  - delta frame: for PAL8 with a changed palette the 768-byte XOR against
 *    the previous palette, then a table with two bytes per block (padded to
 *    a multiple of 4 bytes), then the XOR residual of every block whose
 *    prediction is not exact.
 * The payload is deflated with Z_SYNC_FLUSH; the deflate stream is carried
 * over from frame to frame and only reset on keyframes.
 *
 * Packet layout: one flags byte, on keyframes six header bytes (version
 * high/low, compression, format, block width, block height), then the
 * deflate output.
 *
 * @param avctx      codec context
 * @param pkt        packet that receives the encoded frame
 * @param pict       input frame
 * @param got_packet set to 1 on success
 * @return 0 on success, a negative error code otherwise
 *         (AVERROR_EXTERNAL when zlib fails)
 */
static int encode_frame(AVCodecContext *avctx, AVPacket *pkt,
                        const AVFrame *pict, int *got_packet)
{
    ZmbvEncContext * const c = avctx->priv_data;
    z_stream  *const zstream = &c->zstream.zstream;
    const AVFrame * const p = pict;
    const uint8_t *src;
    uint8_t *prev, *buf;
    uint32_t *palptr;
    int keyframe, chpal;
    int fl;
    int work_size = 0, pkt_size;
    int i, j, ret;

    /* The frame at position 0 of each interval is a keyframe */
    keyframe = !c->curfrm;
    c->curfrm++;
    if (c->curfrm == c->keyint)
        c->curfrm = 0;

    /* A palette delta is only sent on non-key PAL8 frames whose palette changed */
    palptr = (avctx->pix_fmt == AV_PIX_FMT_PAL8) ? (uint32_t *)p->data[1] : NULL;
    chpal = !keyframe && palptr && memcmp(palptr, c->pal2, sizeof(c->pal2));

    src = p->data[0];
    prev = c->prev;
    if (chpal) {
        uint8_t tpal[3];
        for (i = 0; i < 256; i++) {
            AV_WB24(tpal, palptr[i]);
            c->work_buf[work_size++] = tpal[0] ^ c->pal[i * 3 + 0];
            c->work_buf[work_size++] = tpal[1] ^ c->pal[i * 3 + 1];
            c->work_buf[work_size++] = tpal[2] ^ c->pal[i * 3 + 2];
            c->pal[i * 3 + 0] = tpal[0];
            c->pal[i * 3 + 1] = tpal[1];
            c->pal[i * 3 + 2] = tpal[2];
        }
        memcpy(c->pal2, palptr, sizeof(c->pal2));
    }
    if (keyframe) {
        if (palptr) {
            for (i = 0; i < 256; i++)
                AV_WB24(c->pal + (i * 3), palptr[i]);
            memcpy(c->work_buf, c->pal, sizeof(c->pal));
            memcpy(c->pal2, palptr, sizeof(c->pal2));
            work_size = sizeof(c->pal);
        }
        /* Store the picture row by row without line padding */
        for (i = 0; i < avctx->height; i++) {
            memcpy(c->work_buf + work_size, src, avctx->width * c->bypp);
            src += p->linesize[0];
            work_size += avctx->width * c->bypp;
        }
    } else {
        int x, y, bw, bh, bh2, bw2, xored, mv_size;
        const uint8_t *tsrc, *tprev;
        uint8_t *mv;
        /* The vector of each block seeds the search of the next one */
        int mx = 0, my = 0;

        bw = (avctx->width + ZMBV_BLOCK - 1) / ZMBV_BLOCK;
        bh = (avctx->height + ZMBV_BLOCK - 1) / ZMBV_BLOCK;
        /* Two bytes per block, table size rounded up to a multiple of 4 */
        mv_size = (bw * bh * 2 + 3) & ~3;
        mv = c->work_buf + work_size;
        memset(mv, 0, mv_size);
        work_size += mv_size;
        /* for now just XOR'ing */
        for (y = 0; y < avctx->height; y += ZMBV_BLOCK) {
            bh2 = FFMIN(avctx->height - y, ZMBV_BLOCK);
            for (x = 0; x < avctx->width; x += ZMBV_BLOCK, mv += 2) {
                bw2 = FFMIN(avctx->width - x, ZMBV_BLOCK);

                tsrc = src + x * c->bypp;
                tprev = prev + x * c->bypp;

                zmbv_me(c, tsrc, p->linesize[0], tprev, c->pstride, x, y, &mx, &my, &xored);
                /* Bit 0 of the first byte flags that a residual follows */
                mv[0] = (mx * 2) | !!xored;
                mv[1] = my * 2;
                tprev += mx * c->bypp + my * c->pstride;
                if (xored) {
                    for (j = 0; j < bh2; j++) {
                        for (i = 0; i < bw2 * c->bypp; i++)
                            c->work_buf[work_size++] = tsrc[i] ^ tprev[i];
                        tsrc += p->linesize[0];
                        tprev += c->pstride;
                    }
                }
            }
            src += p->linesize[0] * ZMBV_BLOCK;
            prev += c->pstride * ZMBV_BLOCK;
        }
    }

    /* save the previous frame */
    src = p->data[0];
    prev = c->prev;
    for (i = 0; i < avctx->height; i++) {
        memcpy(prev, src, avctx->width * c->bypp);
        prev += c->pstride;
        src += p->linesize[0];
    }

    /* Keyframes start a fresh deflate stream */
    if (keyframe) {
        ret = deflateReset(zstream);
        if (ret != Z_OK) {
            av_log(avctx, AV_LOG_ERROR, "Error resetting compressor: %d\n", ret);
            return AVERROR_EXTERNAL;
        }
    }

    zstream->next_in   = c->work_buf;
    zstream->avail_in  = work_size;
    zstream->total_in  = 0;

    zstream->next_out  = c->comp_buf;
    zstream->avail_out = c->comp_size;
    /* Zeroed so that total_out is the size of this frame's output alone */
    zstream->total_out = 0;
    ret = deflate(zstream, Z_SYNC_FLUSH);
    if (ret != Z_OK) {
        av_log(avctx, AV_LOG_ERROR, "Error compressing data\n");
        return AVERROR_EXTERNAL;
    }

    /* One flags byte, plus six header bytes on keyframes */
    pkt_size = zstream->total_out + 1 + 6 * keyframe;
    if ((ret = ff_get_encode_buffer(avctx, pkt, pkt_size, 0)) < 0)
        return ret;
    buf = pkt->data;

    fl = (keyframe ? ZMBV_KEYFRAME : 0) | (chpal ? ZMBV_DELTAPAL : 0);
    *buf++ = fl;
    if (keyframe) {
        *buf++ = 0; // hi ver
        *buf++ = 1; // lo ver
        *buf++ = 1; // comp
        *buf++ = c->fmt; // format
        *buf++ = ZMBV_BLOCK; // block width
        *buf++ = ZMBV_BLOCK; // block height
        pkt->flags |= AV_PKT_FLAG_KEY;
    }
    memcpy(buf, c->comp_buf, zstream->total_out);

    *got_packet = 1;

    return 0;
}


/**
 * Free the buffers owned by the encoder context and shut down its
 * deflate stream.
 *
 * @return always 0
 */
static av_cold int encode_end(AVCodecContext *avctx)
{
    ZmbvEncContext *const enc = avctx->priv_data;

    av_freep(&enc->prev_buf);
    av_freep(&enc->work_buf);
    av_freep(&enc->comp_buf);

    ff_deflate_end(&enc->zstream);

    return 0;
}


/**
 * Set up the ZMBV encoder.
 *
 * Selects the format code and bytes per pixel for the input pixel format,
 * fills the block score table, reads the keyframe interval, motion search
 * range and compression level from avctx, allocates the work, compression
 * and previous-frame buffers and initialises the deflate stream.
 *
 * @return the result of ff_deflate_init() if everything before it
 *         succeeded, AVERROR(EINVAL) for a compression level above 9,
 *         AVERROR(ENOMEM) if a buffer cannot be allocated
 */
static av_cold int encode_init(AVCodecContext *avctx)
{
    ZmbvEncContext * const c = avctx->priv_data;
    int level = 9;
    int n, block_bytes;
    int blocks_w, blocks_h;
    int left_pad, prev_size, prev_offset;

    switch (avctx->pix_fmt) {
    case AV_PIX_FMT_PAL8:
        c->fmt  = ZMBV_FMT_8BPP;
        c->bypp = 1;
        break;
    case AV_PIX_FMT_RGB555LE:
        c->fmt  = ZMBV_FMT_15BPP;
        c->bypp = 2;
        break;
    case AV_PIX_FMT_RGB565LE:
        c->fmt  = ZMBV_FMT_16BPP;
        c->bypp = 2;
        break;
#ifdef ZMBV_ENABLE_24BPP
    case AV_PIX_FMT_BGR24:
        c->fmt  = ZMBV_FMT_24BPP;
        c->bypp = 3;
        break;
#endif //ZMBV_ENABLE_24BPP
    case AV_PIX_FMT_BGR0:
        c->fmt  = ZMBV_FMT_32BPP;
        c->bypp = 4;
        break;
    }

    /* Entropy-based score table for comparing blocks, indexed by how often
     * a byte value occurs in a block.  It covers blocks of up to
     * (ZMBV_BLOCK * ZMBV_BLOCK * bypp) bytes; entry 0 is left untouched.
     * Scores are nonnegative, lower is better.
     */
    block_bytes = ZMBV_BLOCK * ZMBV_BLOCK * c->bypp;
    for (n = 1; n <= block_bytes; n++)
        c->score_tab[n] = -n * log2(n / (double)block_bytes) * 256;

    c->avctx  = avctx;
    c->curfrm = 0;
    c->keyint = avctx->keyint_min;

    /* Motion search range: 8 unless me_range is set; the largest
     * supported distance is -64..63 */
    if (avctx->me_range > 0) {
        c->lrange = FFMIN(avctx->me_range, 64);
        c->urange = FFMIN(avctx->me_range, 63);
    } else {
        c->lrange = 8;
        c->urange = 8;
    }

    if (avctx->compression_level >= 0)
        level = avctx->compression_level;
    if (level < 0 || level > 9) {
        av_log(avctx, AV_LOG_ERROR, "Compression level should be 0-9, not %i\n", level);
        return AVERROR(EINVAL);
    }

    /* Work buffer: all pixels, 1024 bytes of headroom (more than the
     * 768-byte palette block), two bytes per motion block and 4 bytes for
     * rounding up the vector table */
    blocks_w = (avctx->width + ZMBV_BLOCK - 1) / ZMBV_BLOCK;
    blocks_h = (avctx->height + ZMBV_BLOCK - 1) / ZMBV_BLOCK;
    c->comp_size = avctx->width * c->bypp * avctx->height + 1024 +
                   blocks_w * blocks_h * 2 + 4;
    c->work_buf = av_malloc(c->comp_size);
    if (!c->work_buf) {
        av_log(avctx, AV_LOG_ERROR, "Can't allocate work buffer.\n");
        return AVERROR(ENOMEM);
    }

    /* Compression buffer: conservative upper bound taken from zlib v1.2.1
     * source via lcl.c */
    c->comp_size = c->comp_size + ((c->comp_size + 7) >> 3) +
                   ((c->comp_size + 63) >> 6) + 11;
    c->comp_buf = av_malloc(c->comp_size);
    if (!c->comp_buf) {
        av_log(avctx, AV_LOG_ERROR, "Can't allocate compression buffer.\n");
        return AVERROR(ENOMEM);
    }

    /* Previous-frame buffer, padded so that motion estimation may read
     * outside of the picture:
     * - `lrange` rows above and `urange` rows below the picture;
     * - every line widened by `lrange` pixels and rounded up to a multiple
     *   of 16 bytes;
     * - `lrange` pixels, rounded up to a multiple of 16 bytes, in front of
     *   the first line.
     */
    left_pad    = FFALIGN(c->lrange * c->bypp, 16);
    c->pstride  = FFALIGN((avctx->width + c->lrange) * c->bypp, 16);
    prev_size   = left_pad + c->pstride * (c->lrange + avctx->height + c->urange);
    prev_offset = left_pad + c->pstride * c->lrange;
    c->prev_buf = av_mallocz(prev_size);
    if (!c->prev_buf) {
        av_log(avctx, AV_LOG_ERROR, "Can't allocate picture.\n");
        return AVERROR(ENOMEM);
    }
    c->prev = c->prev_buf + prev_offset;

    return ff_deflate_init(&c->zstream, level, avctx);
}


/* Codec descriptor that ties the ZMBV encoder callbacks in this file together */
const FFCodec ff_zmbv_encoder = {
    /* public part */
    .p.name         = "zmbv",
    CODEC_LONG_NAME("Zip Motion Blocks Video"),
    .p.type         = AVMEDIA_TYPE_VIDEO,
    .p.id           = AV_CODEC_ID_ZMBV,
    .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_ENCODER_REORDERED_OPAQUE,
    /* accepted input formats, one per case handled in encode_init() */
    .p.pix_fmts     = (const enum AVPixelFormat[]) {
        AV_PIX_FMT_PAL8,
        AV_PIX_FMT_RGB555LE,
        AV_PIX_FMT_RGB565LE,
#ifdef ZMBV_ENABLE_24BPP
        AV_PIX_FMT_BGR24,
#endif //ZMBV_ENABLE_24BPP
        AV_PIX_FMT_BGR0,
        AV_PIX_FMT_NONE
    },

    /* private state and callbacks */
    .priv_data_size = sizeof(ZmbvEncContext),
    .caps_internal  = FF_CODEC_CAP_INIT_CLEANUP,
    .init           = encode_init,
    FF_CODEC_ENCODE_CB(encode_frame),
    .close          = encode_end,
};