FFmpeg
takdec.c
Go to the documentation of this file.
1 /*
2  * Raw TAK demuxer
3  * Copyright (c) 2012 Paul B Mahol
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/crc.h"
23 
24 #define BITSTREAM_READER_LE
25 #include "libavcodec/tak.h"
26 
27 #include "apetag.h"
28 #include "avformat.h"
29 #include "avio_internal.h"
30 #include "internal.h"
31 #include "rawdec.h"
32 
33 typedef struct TAKDemuxContext {
34  AVClass *class;
37  int64_t data_end;
39 
40 static int tak_probe(const AVProbeData *p)
41 {
42  if (!memcmp(p->buf, "tBaK", 4))
44  return 0;
45 }
46 
47 static unsigned long tak_check_crc(unsigned long checksum, const uint8_t *buf,
48  unsigned int len)
49 {
50  return av_crc(av_crc_get_table(AV_CRC_24_IEEE), checksum, buf, len);
51 }
52 
54 {
56  AVIOContext *pb = s->pb;
57  GetBitContext gb;
58  AVStream *st;
59  uint8_t *buffer = NULL;
60  int ret;
61 
62  st = avformat_new_stream(s, 0);
63  if (!st)
64  return AVERROR(ENOMEM);
65 
69 
70  tc->mlast_frame = 0;
71  if (avio_rl32(pb) != MKTAG('t', 'B', 'a', 'K')) {
72  avio_seek(pb, -4, SEEK_CUR);
73  return 0;
74  }
75 
76  while (!avio_feof(pb)) {
77  enum TAKMetaDataType type;
78  int size;
79 
80  type = avio_r8(pb) & 0x7f;
81  size = avio_rl24(pb);
82 
83  switch (type) {
85  if (st->codecpar->extradata)
86  return AVERROR_INVALIDDATA;
89  if (size <= 3)
90  return AVERROR_INVALIDDATA;
91 
92  buffer = av_malloc(size - 3 + AV_INPUT_BUFFER_PADDING_SIZE);
93  if (!buffer)
94  return AVERROR(ENOMEM);
95  memset(buffer + size - 3, 0, AV_INPUT_BUFFER_PADDING_SIZE);
96 
97  ffio_init_checksum(pb, tak_check_crc, 0xCE04B7U);
98  if (avio_read(pb, buffer, size - 3) != size - 3) {
99  av_freep(&buffer);
100  return AVERROR(EIO);
101  }
102  if (ffio_get_checksum(s->pb) != avio_rb24(pb)) {
103  av_log(s, AV_LOG_ERROR, "%d metadata block CRC error.\n", type);
104  if (s->error_recognition & AV_EF_EXPLODE) {
105  av_freep(&buffer);
106  return AVERROR_INVALIDDATA;
107  }
108  }
109 
110  break;
111  case TAK_METADATA_MD5: {
112  uint8_t md5[16];
113  int i;
114 
115  if (size != 19)
116  return AVERROR_INVALIDDATA;
117  ffio_init_checksum(pb, tak_check_crc, 0xCE04B7U);
118  avio_read(pb, md5, 16);
119  if (ffio_get_checksum(s->pb) != avio_rb24(pb)) {
120  av_log(s, AV_LOG_ERROR, "MD5 metadata block CRC error.\n");
122  return AVERROR_INVALIDDATA;
123  }
124 
125  av_log(s, AV_LOG_VERBOSE, "MD5=");
126  for (i = 0; i < 16; i++)
127  av_log(s, AV_LOG_VERBOSE, "%02x", md5[i]);
128  av_log(s, AV_LOG_VERBOSE, "\n");
129  break;
130  }
131  case TAK_METADATA_END: {
132  int64_t curpos = avio_tell(pb);
133 
134  if (pb->seekable & AVIO_SEEKABLE_NORMAL) {
135  ff_ape_parse_tag(s);
136  avio_seek(pb, curpos, SEEK_SET);
137  }
138 
139  tc->data_end += curpos;
140  return 0;
141  }
142  default:
143  ret = avio_skip(pb, size);
144  if (ret < 0)
145  return ret;
146  }
147 
148  if (type == TAK_METADATA_STREAMINFO) {
149  TAKStreamInfo ti;
150 
151  ret = avpriv_tak_parse_streaminfo(&ti, buffer, size -3);
152  if (ret < 0)
153  goto end;
154  if (ti.samples > 0)
155  st->duration = ti.samples;
157  if (ti.ch_layout)
159  st->codecpar->sample_rate = ti.sample_rate;
160  st->codecpar->channels = ti.channels;
161  st->start_time = 0;
162  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
163  st->codecpar->extradata = buffer;
164  st->codecpar->extradata_size = size - 3;
165  buffer = NULL;
166  } else if (type == TAK_METADATA_LAST_FRAME) {
167  if (size != 11) {
168  ret = AVERROR_INVALIDDATA;
169  goto end;
170  }
171  init_get_bits8(&gb, buffer, size - 3);
172  tc->mlast_frame = 1;
175  av_freep(&buffer);
176  } else if (type == TAK_METADATA_ENCODER) {
177  init_get_bits8(&gb, buffer, size - 3);
178  av_log(s, AV_LOG_VERBOSE, "encoder version: %0X\n",
180  av_freep(&buffer);
181  }
182  }
183 
184  return AVERROR_EOF;
185 end:
186  av_freep(&buffer);
187  return ret;
188 }
189 
191 {
193  int ret;
194 
195  if (tc->mlast_frame) {
196  AVIOContext *pb = s->pb;
197  int64_t size, left;
198 
199  left = tc->data_end - avio_tell(pb);
200  size = FFMIN(left, 1024);
201  if (size <= 0)
202  return AVERROR_EOF;
203 
204  ret = av_get_packet(pb, pkt, size);
205  if (ret < 0)
206  return ret;
207 
208  pkt->stream_index = 0;
209  } else {
210  ret = ff_raw_read_partial_packet(s, pkt);
211  }
212 
213  return ret;
214 }
215 
218  .name = "tak",
219  .long_name = NULL_IF_CONFIG_SMALL("raw TAK"),
220  .priv_data_size = sizeof(TAKDemuxContext),
225  .extensions = "tak",
226  .raw_codec_id = AV_CODEC_ID_TAK,
227  .priv_class = &tak_demuxer_class,
228 };
#define NULL
Definition: coverity.c:32
Bytestream IO Context.
Definition: avio.h:161
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
int channels
Definition: tak.h:133
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:379
void avpriv_set_pts_info(AVStream *s, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: utils.c:4892
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: avcodec.h:3957
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:246
#define tc
Definition: regdef.h:69
uint64_t ch_layout
Definition: tak.h:138
GLint GLenum type
Definition: opengl_enc.c:104
int raw_packet_size
Definition: takdec.c:35
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:334
static AVPacket pkt
TAKMetaDataType
Definition: tak.h:104
Format I/O context.
Definition: avformat.h:1358
static int tak_probe(const AVProbeData *p)
Definition: takdec.c:40
uint8_t
#define av_malloc(s)
static av_cold int end(AVCodecContext *avctx)
Definition: avrndec.c:90
enum AVStreamParseType need_parsing
Definition: avformat.h:1099
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: utils.c:4465
int64_t data_end
Definition: takdec.c:37
Public header for CRC hash function implementation.
struct AVMD5 * md5
Definition: movenc.c:56
#define AVERROR_EOF
End of file.
Definition: error.h:55
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:192
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:310
ptrdiff_t size
Definition: opengl_enc.c:100
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:557
full parsing and repack with timestamp and position generation by parser for raw this assumes that ea...
Definition: avformat.h:804
uint64_t channel_layout
Audio only.
Definition: avcodec.h:4059
#define av_log(a,...)
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:650
static uint64_t get_bits64(GetBitContext *s, int n)
Read 0-64 bits.
Definition: get_bits.h:572
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:259
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:772
int ff_raw_read_partial_packet(AVFormatContext *s, AVPacket *pkt)
Definition: rawdec.c:35
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:186
enum AVMediaType codec_type
General type of the encoded data.
Definition: avcodec.h:3953
static int raw_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: takdec.c:190
int64_t ff_ape_parse_tag(AVFormatContext *s)
Read and parse an APE tag.
Definition: apetag.c:118
#define FF_RAW_DEMUXER_CLASS(name)
Definition: rawdec.h:55
int extradata_size
Size of the extradata content in bytes.
Definition: avcodec.h:3975
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:641
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:448
int bps
Definition: tak.h:134
int64_t samples
Definition: tak.h:139
void ffio_init_checksum(AVIOContext *s, unsigned long(*update_checksum)(unsigned long c, const uint8_t *p, unsigned int len), unsigned long checksum)
Definition: aviobuf.c:629
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:260
unsigned int avio_rb24(AVIOContext *s)
Definition: aviobuf.c:796
#define FFMIN(a, b)
Definition: common.h:96
uint32_t av_crc(const AVCRC *ctx, uint32_t crc, const uint8_t *buffer, size_t length)
Calculate the CRC of a block.
Definition: crc.c:392
AVInputFormat ff_tak_demuxer
Definition: takdec.c:217
#define s(width, name)
Definition: cbs_vp9.c:257
#define AV_EF_EXPLODE
abort decoding on minor error detection
Definition: avcodec.h:2705
static volatile int checksum
Definition: adler32.c:30
#define TAK_LAST_FRAME_SIZE_BITS
Definition: tak.h:44
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:530
Stream structure.
Definition: avformat.h:881
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_reading.c:42
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:40
AVIOContext * pb
I/O context.
Definition: avformat.h:1400
static int init_get_bits8(GetBitContext *s, const uint8_t *buffer, int byte_size)
Initialize GetBitContext.
Definition: get_bits.h:677
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2]...the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so...,+,-,+,-,+,+,-,+,-,+,...hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32-hcoeff[1]-hcoeff[2]-...a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2}an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||.........intra?||||:Block01:yes no||||:Block02:.................||||:Block03::y DC::ref index:||||:Block04::cb DC::motion x:||||.........:cr DC::motion 
y:||||.................|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------------------------------|||Y subbands||Cb subbands||Cr subbands||||------||------||------|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||------||------||------||||------||------||------|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||------||------||------||||------||------||------|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||------||------||------||||------||------||------|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------------------------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction------------|\Dequantization-------------------\||Reference frames|\IDWT|--------------|Motion\|||Frame 0||Frame 1||Compensation.OBMC v-------|--------------|--------------.\------> Frame n output Frame Frame<----------------------------------/|...|-------------------Range Coder:============Binary Range Coder:-------------------The implemented range coder is an adapted version based upon"Range encoding: an algorithm for removing redundancy from a digitised message."by G.N.N.Martin.The symbols encoded by the Snow range coder are bits(0|1).The associated probabilities are not fix but change depending on the symbol mix seen so far.bit seen|new state---------+-----------------------------------------------0|256-state_transition_table[256-old_state];1|state_transition_table[old_state];state_transition_table={0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 
106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:-------------------------FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector Prediction:=========================1.the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:206
void * buf
Definition: avisynth_c.h:766
Describe the class of an AVClass context structure.
Definition: log.h:67
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:468
TAK (Tom's lossless Audio Kompressor) decoder/demuxer common functions.
unsigned long ffio_get_checksum(AVIOContext *s)
Definition: aviobuf.c:621
int mlast_frame
Definition: takdec.c:36
static unsigned long tak_check_crc(unsigned long checksum, const uint8_t *buf, unsigned int len)
Definition: takdec.c:47
static int tak_read_header(AVFormatContext *s)
Definition: takdec.c:53
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:456
This structure contains the data a format has to probe a file.
Definition: avformat.h:446
static unsigned int get_bits_long(GetBitContext *s, int n)
Read 0-32 bits.
Definition: get_bits.h:546
int sample_rate
Definition: tak.h:132
#define flags(name, subs,...)
Definition: cbs_av1.c:561
static int read_probe(const AVProbeData *pd)
Definition: jvdec.c:55
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:930
const AVCRC * av_crc_get_table(AVCRCId crc_id)
Get an initialized standard CRC table.
Definition: crc.c:374
int sample_rate
Audio only.
Definition: avcodec.h:4067
Main libavformat public API header.
int64_t start_time
Decoding: pts of the first frame of the stream in presentation order, in stream time base...
Definition: avformat.h:920
int error_recognition
Error recognition; higher values will detect more errors but may misdetect some more or less valid pa...
Definition: avformat.h:1625
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
Definition: avcodec.h:790
int len
void * priv_data
Format private data.
Definition: avformat.h:1386
int bits_per_coded_sample
The number of bits per sample in the codedwords.
Definition: avcodec.h:3999
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: avcodec.h:3971
int channels
Audio only.
Definition: avcodec.h:4063
int avpriv_tak_parse_streaminfo(TAKStreamInfo *s, const uint8_t *buf, int size)
Parse the Streaminfo metadata block.
Definition: tak.c:128
#define av_freep(p)
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:654
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1028
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:361
#define TAK_ENCODER_VERSION_BITS
Definition: tak.h:47
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:764
int stream_index
Definition: avcodec.h:1479
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later.That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another.Frame references ownership and permissions
#define TAK_LAST_FRAME_POS_BITS
Definition: tak.h:43
#define MKTAG(a, b, c, d)
Definition: common.h:366
This structure stores compressed data.
Definition: avcodec.h:1454
GLuint buffer
Definition: opengl_enc.c:101