doxygen/trunk/westwood__vqa_8c_source.html

/*

 * Westwood Studios VQA Format Demuxer

 * Copyright (c) 2003 Mike Melanson <melanson@pcisys.net>

 * Copyright (c) 2021 Pekka Väänänen <pekka.vaananen@iki.fi>

 *

 * This file is part of FFmpeg.

 *

 * FFmpeg is free software; you can redistribute it and/or

 * modify it under the terms of the GNU Lesser General Public

 * License as published by the Free Software Foundation; either

 * version 2.1 of the License, or (at your option) any later version.

 *

 * FFmpeg is distributed in the hope that it will be useful,

 * but WITHOUT ANY WARRANTY; without even the implied warranty of

 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

 * Lesser General Public License for more details.

 *

 * You should have received a copy of the GNU Lesser General Public

 * License along with FFmpeg; if not, write to the Free Software

 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

 */


/**

 * @file

 * Westwood Studios VQA file demuxer

 * by Mike Melanson (melanson@pcisys.net)

 * for more information on the Westwood file formats, visit:

 *   http://www.pcisys.net/~melanson/codecs/

 *   http://www.geocities.com/SiliconValley/8682/aud3.txt

 */


#include "libavutil/intreadwrite.h"

#include "avformat.h"

#include "avio_internal.h"

#include "demux.h"

#include "internal.h"


#define FORM_TAG MKBETAG('F', 'O', 'R', 'M')

#define WVQA_TAG MKBETAG('W', 'V', 'Q', 'A')

#define VQHD_TAG MKBETAG('V', 'Q', 'H', 'D')

#define FINF_TAG MKBETAG('F', 'I', 'N', 'F')

#define SND0_TAG MKBETAG('S', 'N', 'D', '0')

#define SND1_TAG MKBETAG('S', 'N', 'D', '1')

#define SND2_TAG MKBETAG('S', 'N', 'D', '2')

#define VQFR_TAG MKBETAG('V', 'Q', 'F', 'R')

#define VQFL_TAG MKBETAG('V', 'Q', 'F', 'L')


/* don't know what these tags are for, but acknowledge their existence */

#define CINF_TAG MKBETAG('C', 'I', 'N', 'F')

#define CINH_TAG MKBETAG('C', 'I', 'N', 'H')

#define CIND_TAG MKBETAG('C', 'I', 'N', 'D')

#define LINF_TAG MKBETAG('L', 'I', 'N', 'F')

#define PINF_TAG MKBETAG('P', 'I', 'N', 'F')

#define PINH_TAG MKBETAG('P', 'I', 'N', 'H')

#define PIND_TAG MKBETAG('P', 'I', 'N', 'D')

#define CMDS_TAG MKBETAG('C', 'M', 'D', 'S')

#define SN2J_TAG MKBETAG('S', 'N', '2', 'J')

#define VIEW_TAG MKBETAG('V', 'I', 'E', 'W')

#define ZBUF_TAG MKBETAG('Z', 'B', 'U', 'F')


#define VQA_HEADER_SIZE 0x2A

#define VQA_PREAMBLE_SIZE 8


typedef struct WsVqaDemuxContext {

    int version;

    int bps;

    int channels;

    int sample_rate;

    int audio_stream_index;

    int video_stream_index;

    int64_t vqfl_chunk_pos;

    int vqfl_chunk_size;

} WsVqaDemuxContext;


static int wsvqa_probe(const AVProbeData *p)

{

    /* need 12 bytes to qualify */

    if (p->buf_size < 12)

        return 0;


    /* check for the VQA signatures */

    if ((AV_RB32(&p->buf[0]) != FORM_TAG) ||

        (AV_RB32(&p->buf[8]) != WVQA_TAG))

        return 0;


    return AVPROBE_SCORE_MAX;

}


static int wsvqa_read_header(AVFormatContext *s)

{

    WsVqaDemuxContext *wsvqa = s->priv_data;

    AVIOContext *pb = s->pb;

    AVStream *st;

    uint8_t *header;

    uint8_t scratch[VQA_PREAMBLE_SIZE];

    uint32_t chunk_tag;

    uint32_t chunk_size;

    int fps, ret;


    /* initialize the video decoder stream */

    st = avformat_new_stream(s, NULL);

    if (!st)

        return AVERROR(ENOMEM);

    st->start_time = 0;

    wsvqa->video_stream_index = st->index;

    st->codecpar->codec_type = AVMEDIA_TYPE_VIDEO;

    st->codecpar->codec_id = AV_CODEC_ID_WS_VQA;

    st->codecpar->codec_tag = 0;  /* no fourcc */


    /* skip to the start of the VQA header */

    avio_seek(pb, 20, SEEK_SET);


    /* the VQA header needs to go to the decoder */

    if ((ret = ff_get_extradata(s, st->codecpar, pb, VQA_HEADER_SIZE)) < 0)

        return ret;

    header = st->codecpar->extradata;

    st->codecpar->width = AV_RL16(&header[6]);

    st->codecpar->height = AV_RL16(&header[8]);

    fps = header[12];

    st->nb_frames =

    st->duration  = AV_RL16(&header[4]);

    if (fps < 1 || fps > 30) {

        av_log(s, AV_LOG_ERROR, "invalid fps: %d\n", fps);

        return AVERROR_INVALIDDATA;

    }

    avpriv_set_pts_info(st, 64, 1, fps);


    wsvqa->version      = AV_RL16(&header[ 0]);

    wsvqa->sample_rate  = AV_RL16(&header[24]);

    wsvqa->channels     = header[26];

    wsvqa->bps          = header[27];

    wsvqa->audio_stream_index = -1;

    wsvqa->vqfl_chunk_pos     = 0;

    wsvqa->vqfl_chunk_size    = 0;


    s->ctx_flags |= AVFMTCTX_NOHEADER;


    /* there are 0 or more chunks before the FINF chunk; iterate until

     * FINF has been skipped and the file will be ready to be demuxed */

    do {

        if ((ret = ffio_read_size(pb, scratch, VQA_PREAMBLE_SIZE)) < 0)

            return ret;

        chunk_tag = AV_RB32(&scratch[0]);

        chunk_size = AV_RB32(&scratch[4]);


        /* catch any unknown header tags, for curiosity */

        switch (chunk_tag) {

        case CINF_TAG:

        case CINH_TAG:

        case CIND_TAG:

        case LINF_TAG:

        case PINF_TAG:

        case PINH_TAG:

        case PIND_TAG:

        case FINF_TAG:

        case CMDS_TAG:

        case VIEW_TAG:

        case ZBUF_TAG:

            break;


        default:

            av_log(s, AV_LOG_ERROR, " note: unknown chunk seen (%s)\n",

                   av_fourcc2str(chunk_tag));

            break;

        }


        avio_skip(pb, chunk_size);

    } while (chunk_tag != FINF_TAG);


    return 0;

}


static int wsvqa_read_packet(AVFormatContext *s,

                             AVPacket *pkt)

{

    WsVqaDemuxContext *wsvqa = s->priv_data;

    AVIOContext *pb = s->pb;

    int ret = -1;

    uint8_t preamble[VQA_PREAMBLE_SIZE];

    uint32_t chunk_type;

    int chunk_size;

    unsigned skip_byte;


    while (avio_read(pb, preamble, VQA_PREAMBLE_SIZE) == VQA_PREAMBLE_SIZE) {

        chunk_type = AV_RB32(&preamble[0]);

        chunk_size = AV_RB32(&preamble[4]);


        if (chunk_size < 0)

            return AVERROR_INVALIDDATA;

        skip_byte = chunk_size & 0x01;


        if (chunk_type == VQFL_TAG) {

            /* Each VQFL chunk carries only a codebook update inside which must be applied

             * before the next VQFR is rendered. That's why we stash the VQFL offset here

             * so it can be combined with the next VQFR packet. This way each packet

             * includes a whole frame as expected. */

            wsvqa->vqfl_chunk_pos = avio_tell(pb);

            if (chunk_size > 3 * (1 << 20))

                return AVERROR_INVALIDDATA;

            wsvqa->vqfl_chunk_size = chunk_size;

            /* We need a big seekback buffer because there can be SNxx, VIEW and ZBUF

             * chunks (<512 KiB total) in the stream before we read VQFR (<256 KiB) and

             * seek back here. */

            ret = ffio_ensure_seekback(pb, wsvqa->vqfl_chunk_size + (512 + 256) * 1024);

            avio_skip(pb, chunk_size + skip_byte);

            if (ret < 0)

                return ret;

            continue;

        } else if ((chunk_type == SND0_TAG) || (chunk_type == SND1_TAG) ||

            (chunk_type == SND2_TAG) || (chunk_type == VQFR_TAG)) {


            ret= av_get_packet(pb, pkt, chunk_size);

            if (ret<0)

                return AVERROR_INVALIDDATA;


            switch (chunk_type) {

            case SND0_TAG:

            case SND1_TAG:

            case SND2_TAG:

                if (wsvqa->audio_stream_index == -1) {

                    AVStream *st = avformat_new_stream(s, NULL);

                    if (!st)

                        return AVERROR(ENOMEM);


                    wsvqa->audio_stream_index = st->index;

                    if (!wsvqa->sample_rate)

                        wsvqa->sample_rate = 22050;

                    if (!wsvqa->channels)

                        wsvqa->channels = 1;

                    if (!wsvqa->bps)

                        wsvqa->bps = 8;

                    st->codecpar->sample_rate = wsvqa->sample_rate;

                    st->codecpar->bits_per_coded_sample = wsvqa->bps;

                    av_channel_layout_default(&st->codecpar->ch_layout, wsvqa->channels);

                    st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;


                    avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);


                    switch (chunk_type) {

                    case SND0_TAG:

                        if (wsvqa->bps == 16)

                            st->codecpar->codec_id = AV_CODEC_ID_PCM_S16LE;

                        else

                            st->codecpar->codec_id = AV_CODEC_ID_PCM_U8;

                        break;

                    case SND1_TAG:

                        st->codecpar->codec_id = AV_CODEC_ID_WESTWOOD_SND1;

                        break;

                    case SND2_TAG:

                        st->codecpar->codec_id = AV_CODEC_ID_ADPCM_IMA_WS;

                        if ((ret = ff_alloc_extradata(st->codecpar, 2)) < 0)

                            return ret;

                        AV_WL16(st->codecpar->extradata, wsvqa->version);

                        break;

                    }

                }


                pkt->stream_index = wsvqa->audio_stream_index;

                switch (chunk_type) {

                case SND1_TAG:

                    /* unpacked size is stored in header */

                    if(pkt->data)

                        pkt->duration = AV_RL16(pkt->data) / wsvqa->channels;

                    break;

                case SND2_TAG:

                    /* 2 samples/byte, 1 or 2 samples per frame depending on stereo */

                    pkt->duration = (chunk_size * 2LL) / wsvqa->channels;

                    break;

                }

                break;

            case VQFR_TAG:

                /* if a new codebook is available inside an earlier a VQFL chunk then

                 * append it to 'pkt' */

                if (wsvqa->vqfl_chunk_size > 0) {

                    int64_t ret64, current_pos = pkt->pos;


                    if ((ret64 = avio_seek(pb, wsvqa->vqfl_chunk_pos, SEEK_SET)) < 0)

                        return (int)ret64;


                    /* the decoder expects chunks to be 16-bit aligned */

                    if (wsvqa->vqfl_chunk_size % 2 == 1)

                        wsvqa->vqfl_chunk_size++;


                    if (av_append_packet(pb, pkt, wsvqa->vqfl_chunk_size) < 0)

                        return AVERROR_INVALIDDATA;


                    if ((ret64 = avio_seek(pb, current_pos, SEEK_SET)) < 0)

                        return (int)ret64;


                    wsvqa->vqfl_chunk_pos = 0;

                    wsvqa->vqfl_chunk_size = 0;

                }


                pkt->stream_index = wsvqa->video_stream_index;

                pkt->duration = 1;

                break;

            }


            /* stay on 16-bit alignment */

            if (skip_byte)

                avio_skip(pb, 1);


            return ret;

        } else {

            switch(chunk_type){

            case CMDS_TAG:

            case SN2J_TAG:

            case VIEW_TAG:

            case ZBUF_TAG:

                break;

            default:

                av_log(s, AV_LOG_INFO, "Skipping unknown chunk %s\n",

                       av_fourcc2str(av_bswap32(chunk_type)));

            }

            avio_skip(pb, chunk_size + skip_byte);

        }

    }


    return ret;

}


const FFInputFormat ff_wsvqa_demuxer = {

    .p.name         = "wsvqa",

    .p.long_name    = NULL_IF_CONFIG_SMALL("Westwood Studios VQA"),

    .priv_data_size = sizeof(WsVqaDemuxContext),

    .read_probe     = wsvqa_probe,

    .read_header    = wsvqa_read_header,

    .read_packet    = wsvqa_read_packet,

};