FFmpeg
takdec.c
Go to the documentation of this file.
1 /*
2  * Raw TAK demuxer
3  * Copyright (c) 2012 Paul B Mahol
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/crc.h"
23 
24 #define BITSTREAM_READER_LE
25 #include "libavcodec/tak.h"
26 
27 #include "apetag.h"
28 #include "avformat.h"
29 #include "avio_internal.h"
30 #include "internal.h"
31 #include "rawdec.h"
32 
/**
 * Private state of the raw TAK demuxer.
 */
typedef struct TAKDemuxContext {
    /* Set to 1 by the header reader once a LAST_FRAME metadata block has been
     * parsed; the packet reader then limits its reads to data_end. */
    int     mlast_frame;
    /* Byte position at which packet data ends. Computed from the LAST_FRAME
     * metadata block and offset by the stream position of the END block. */
    int64_t data_end;
} TAKDemuxContext;
37 
38 static int tak_probe(const AVProbeData *p)
39 {
40  if (!memcmp(p->buf, "tBaK", 4))
42  return 0;
43 }
44 
45 static unsigned long tak_check_crc(unsigned long checksum, const uint8_t *buf,
46  unsigned int len)
47 {
48  return av_crc(av_crc_get_table(AV_CRC_24_IEEE), checksum, buf, len);
49 }
50 
52 {
54  AVIOContext *pb = s->pb;
55  GetBitContext gb;
56  AVStream *st;
57  uint8_t *buffer = NULL;
58  int ret;
59 
60  st = avformat_new_stream(s, 0);
61  if (!st)
62  return AVERROR(ENOMEM);
63 
67 
68  tc->mlast_frame = 0;
69  if (avio_rl32(pb) != MKTAG('t', 'B', 'a', 'K')) {
70  avio_seek(pb, -4, SEEK_CUR);
71  return 0;
72  }
73 
74  while (!avio_feof(pb)) {
75  enum TAKMetaDataType type;
76  int size;
77 
78  type = avio_r8(pb) & 0x7f;
79  size = avio_rl24(pb);
80 
81  switch (type) {
85  if (size <= 3)
86  return AVERROR_INVALIDDATA;
87 
88  buffer = av_malloc(size - 3 + AV_INPUT_BUFFER_PADDING_SIZE);
89  if (!buffer)
90  return AVERROR(ENOMEM);
91  memset(buffer + size - 3, 0, AV_INPUT_BUFFER_PADDING_SIZE);
92 
93  ffio_init_checksum(pb, tak_check_crc, 0xCE04B7U);
94  if (avio_read(pb, buffer, size - 3) != size - 3) {
95  av_freep(&buffer);
96  return AVERROR(EIO);
97  }
98  if (ffio_get_checksum(s->pb) != avio_rb24(pb)) {
99  av_log(s, AV_LOG_ERROR, "%d metadata block CRC error.\n", type);
100  if (s->error_recognition & AV_EF_EXPLODE) {
101  av_freep(&buffer);
102  return AVERROR_INVALIDDATA;
103  }
104  }
105 
106  break;
107  case TAK_METADATA_MD5: {
108  uint8_t md5[16];
109  int i;
110 
111  if (size != 19)
112  return AVERROR_INVALIDDATA;
113  ffio_init_checksum(pb, tak_check_crc, 0xCE04B7U);
114  avio_read(pb, md5, 16);
115  if (ffio_get_checksum(s->pb) != avio_rb24(pb)) {
116  av_log(s, AV_LOG_ERROR, "MD5 metadata block CRC error.\n");
118  return AVERROR_INVALIDDATA;
119  }
120 
121  av_log(s, AV_LOG_VERBOSE, "MD5=");
122  for (i = 0; i < 16; i++)
123  av_log(s, AV_LOG_VERBOSE, "%02x", md5[i]);
124  av_log(s, AV_LOG_VERBOSE, "\n");
125  break;
126  }
127  case TAK_METADATA_END: {
128  int64_t curpos = avio_tell(pb);
129 
130  if (pb->seekable & AVIO_SEEKABLE_NORMAL) {
131  ff_ape_parse_tag(s);
132  avio_seek(pb, curpos, SEEK_SET);
133  }
134 
135  tc->data_end += curpos;
136  return 0;
137  }
138  default:
139  ret = avio_skip(pb, size);
140  if (ret < 0)
141  return ret;
142  }
143 
144  if (type == TAK_METADATA_STREAMINFO) {
145  TAKStreamInfo ti;
146 
147  ret = avpriv_tak_parse_streaminfo(&ti, buffer, size -3);
148  if (ret < 0)
149  return AVERROR_INVALIDDATA;
150  if (ti.samples > 0)
151  st->duration = ti.samples;
153  if (ti.ch_layout)
155  st->codecpar->sample_rate = ti.sample_rate;
156  st->codecpar->channels = ti.channels;
157  st->start_time = 0;
158  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
159  st->codecpar->extradata = buffer;
160  st->codecpar->extradata_size = size - 3;
161  buffer = NULL;
162  } else if (type == TAK_METADATA_LAST_FRAME) {
163  if (size != 11)
164  return AVERROR_INVALIDDATA;
165  init_get_bits8(&gb, buffer, size - 3);
166  tc->mlast_frame = 1;
169  av_freep(&buffer);
170  } else if (type == TAK_METADATA_ENCODER) {
171  init_get_bits8(&gb, buffer, size - 3);
172  av_log(s, AV_LOG_VERBOSE, "encoder version: %0X\n",
174  av_freep(&buffer);
175  }
176  }
177 
178  return AVERROR_EOF;
179 }
180 
182 {
184  int ret;
185 
186  if (tc->mlast_frame) {
187  AVIOContext *pb = s->pb;
188  int64_t size, left;
189 
190  left = tc->data_end - avio_tell(pb);
191  size = FFMIN(left, 1024);
192  if (size <= 0)
193  return AVERROR_EOF;
194 
195  ret = av_get_packet(pb, pkt, size);
196  if (ret < 0)
197  return ret;
198 
199  pkt->stream_index = 0;
200  } else {
201  ret = ff_raw_read_partial_packet(s, pkt);
202  }
203 
204  return ret;
205 }
206 
208  .name = "tak",
209  .long_name = NULL_IF_CONFIG_SMALL("raw TAK"),
210  .priv_data_size = sizeof(TAKDemuxContext),
215  .extensions = "tak",
216  .raw_codec_id = AV_CODEC_ID_TAK,
217 };
#define NULL
Definition: coverity.c:32
Bytestream IO Context.
Definition: avio.h:161
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
int channels
Definition: tak.h:133
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:379
void avpriv_set_pts_info(AVStream *s, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: utils.c:4882
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: avcodec.h:3953
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:246
#define tc
Definition: regdef.h:69
uint64_t ch_layout
Definition: tak.h:138
GLint GLenum type
Definition: opengl_enc.c:104
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:331
static AVPacket pkt
TAKMetaDataType
Definition: tak.h:104
Format I/O context.
Definition: avformat.h:1358
static int tak_probe(const AVProbeData *p)
Definition: takdec.c:38
uint8_t
#define av_malloc(s)
enum AVStreamParseType need_parsing
Definition: avformat.h:1099
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: utils.c:4455
int64_t data_end
Definition: takdec.c:35
Public header for CRC hash function implementation.
struct AVMD5 * md5
Definition: movenc.c:56
#define AVERROR_EOF
End of file.
Definition: error.h:55
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:192
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:310
ptrdiff_t size
Definition: opengl_enc.c:100
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:557
full parsing and repack with timestamp and position generation by parser for raw this assumes that ea...
Definition: avformat.h:804
uint64_t channel_layout
Audio only.
Definition: avcodec.h:4055
#define av_log(a,...)
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:648
static uint64_t get_bits64(GetBitContext *s, int n)
Read 0-64 bits.
Definition: get_bits.h:572
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:260
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:770
int ff_raw_read_partial_packet(AVFormatContext *s, AVPacket *pkt)
Definition: rawdec.c:35
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:186
enum AVMediaType codec_type
General type of the encoded data.
Definition: avcodec.h:3949
static int raw_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: takdec.c:181
int64_t ff_ape_parse_tag(AVFormatContext *s)
Read and parse an APE tag.
Definition: apetag.c:118
int extradata_size
Size of the extradata content in bytes.
Definition: avcodec.h:3971
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:639
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:448
int bps
Definition: tak.h:134
int64_t samples
Definition: tak.h:139
void ffio_init_checksum(AVIOContext *s, unsigned long(*update_checksum)(unsigned long c, const uint8_t *p, unsigned int len), unsigned long checksum)
Definition: aviobuf.c:627
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:260
unsigned int avio_rb24(AVIOContext *s)
Definition: aviobuf.c:794
#define FFMIN(a, b)
Definition: common.h:96
uint32_t av_crc(const AVCRC *ctx, uint32_t crc, const uint8_t *buffer, size_t length)
Calculate the CRC of a block.
Definition: crc.c:392
AVInputFormat ff_tak_demuxer
Definition: takdec.c:207
#define s(width, name)
Definition: cbs_vp9.c:257
#define AV_EF_EXPLODE
abort decoding on minor error detection
Definition: avcodec.h:2701
static volatile int checksum
Definition: adler32.c:30
#define TAK_LAST_FRAME_SIZE_BITS
Definition: tak.h:44
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:530
Stream structure.
Definition: avformat.h:881
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_reading.c:42
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:40
AVIOContext * pb
I/O context.
Definition: avformat.h:1400
static int init_get_bits8(GetBitContext *s, const uint8_t *buffer, int byte_size)
Initialize GetBitContext.
Definition: get_bits.h:677
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2]...the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so...,+,-,+,-,+,+,-,+,-,+,...hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32-hcoeff[1]-hcoeff[2]-...a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2}an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||.........intra?||||:Block01:yes no||||:Block02:.................||||:Block03::y DC::ref index:||||:Block04::cb DC::motion x:||||.........:cr DC::motion 
y:||||.................|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------------------------------|||Y subbands||Cb subbands||Cr subbands||||------||------||------|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||------||------||------||||------||------||------|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||------||------||------||||------||------||------|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||------||------||------||||------||------||------|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------------------------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction------------|\Dequantization-------------------\||Reference frames|\IDWT|--------------|Motion\|||Frame 0||Frame 1||Compensation.OBMC v-------|--------------|--------------.\------> Frame n output Frame Frame<----------------------------------/|...|-------------------Range Coder:============Binary Range Coder:-------------------The implemented range coder is an adapted version based upon"Range encoding: an algorithm for removing redundancy from a digitised message."by G.N.N.Martin.The symbols encoded by the Snow range coder are bits(0|1).The associated probabilities are not fix but change depending on the symbol mix seen so far.bit seen|new state---------+-----------------------------------------------0|256-state_transition_table[256-old_state];1|state_transition_table[old_state];state_transition_table={0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 
106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:-------------------------FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector Prediction:=========================1.the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:206
void * buf
Definition: avisynth_c.h:766
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:468
TAK (Tom's lossless Audio Kompressor) decoder/demuxer common functions.
unsigned long ffio_get_checksum(AVIOContext *s)
Definition: aviobuf.c:619
int mlast_frame
Definition: takdec.c:34
static unsigned long tak_check_crc(unsigned long checksum, const uint8_t *buf, unsigned int len)
Definition: takdec.c:45
static int tak_read_header(AVFormatContext *s)
Definition: takdec.c:51
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:456
This structure contains the data a format has to probe a file.
Definition: avformat.h:446
static unsigned int get_bits_long(GetBitContext *s, int n)
Read 0-32 bits.
Definition: get_bits.h:546
int sample_rate
Definition: tak.h:132
#define flags(name, subs,...)
Definition: cbs_av1.c:561
static int read_probe(const AVProbeData *pd)
Definition: jvdec.c:55
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:930
const AVCRC * av_crc_get_table(AVCRCId crc_id)
Get an initialized standard CRC table.
Definition: crc.c:374
int sample_rate
Audio only.
Definition: avcodec.h:4063
Main libavformat public API header.
int64_t start_time
Decoding: pts of the first frame of the stream in presentation order, in stream time base...
Definition: avformat.h:920
int error_recognition
Error recognition; higher values will detect more errors but may misdetect some more or less valid pa...
Definition: avformat.h:1625
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
Definition: avcodec.h:790
int len
void * priv_data
Format private data.
Definition: avformat.h:1386
int bits_per_coded_sample
The number of bits per sample in the codedwords.
Definition: avcodec.h:3995
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: avcodec.h:3967
int channels
Audio only.
Definition: avcodec.h:4059
int avpriv_tak_parse_streaminfo(TAKStreamInfo *s, const uint8_t *buf, int size)
Parse the Streaminfo metadata block.
Definition: tak.c:128
#define av_freep(p)
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:654
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1028
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:358
#define TAK_ENCODER_VERSION_BITS
Definition: tak.h:47
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:762
int stream_index
Definition: avcodec.h:1479
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later.That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another.Frame references ownership and permissions
#define TAK_LAST_FRAME_POS_BITS
Definition: tak.h:43
#define MKTAG(a, b, c, d)
Definition: common.h:366
This structure stores compressed data.
Definition: avcodec.h:1454
GLuint buffer
Definition: opengl_enc.c:101