FFmpeg
flac_picture.c
Go to the documentation of this file.
1 /*
2  * Raw FLAC picture parser
3  * Copyright (c) 2001 Fabrice Bellard
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/intreadwrite.h"
23 #include "libavcodec/bytestream.h"
24 #include "libavcodec/png.h"
25 #include "avformat.h"
26 #include "flac_picture.h"
27 #include "id3v2.h"
28 #include "internal.h"
29 
/* Upper bound (500 MiB) on a declared picture data length that
 * ff_flac_parse_picture() still considers when that length is zero or
 * larger than the bytes left in the block; anything above it is reported
 * as "too big". */
30 #define MAX_TRUNC_PICTURE_SIZE (500 * 1024 * 1024)
31 
/**
 * Parse a FLAC picture metadata block and expose it as a new stream on s.
 *
 * Fields are read from buf in this order: 32-bit big-endian picture type,
 * 32-bit mimetype length + mimetype bytes, 32-bit description length +
 * description bytes, 32-bit width, 32-bit height, 8 bytes that are skipped,
 * 32-bit picture data length, then the picture data itself.
 *
 * @param s                   format context; used for logging, for creating
 *                            the new stream and (truncation path only) for
 *                            reading extra bytes from s->pb
 * @param buf                 start of the picture metadata block
 * @param buf_size            number of bytes available in buf
 * @param truncate_workaround non-zero enables the recovery path for blocks
 *                            whose size field was truncated to 24 bits
 * @return 0 on success; AVERROR_INVALIDDATA or AVERROR(ENOMEM) on the
 *         failure paths visible below
 *
 * NOTE(review): this listing prefixes every line with its original source
 * line number and skips lines 36, 38, 46, 55, 57, 68, 74, 91, 100, 125, 134,
 * 140, 156, 168, 173, 175 and 176. The declarations of `data` and `g`, and
 * several conditions, are therefore not visible here. Wherever a
 * `return AVERROR_INVALIDDATA;` is directly followed by `return 0;`, the
 * guarding condition is presumably on the skipped line -- confirm against
 * the complete source before relying on the exact error behaviour.
 */
32 int ff_flac_parse_picture(AVFormatContext *s, uint8_t *buf, int buf_size, int truncate_workaround)
33 {
34  const CodecMime *mime = ff_id3v2_mime_tags;
35  enum AVCodecID id = AV_CODEC_ID_NONE;
37  uint8_t mimetype[64], *desc = NULL;
39  AVStream *st;
40  int width, height, ret = 0;
41  unsigned int type;
42  uint32_t len, left, trunclen = 0;
43 
/* Blocks shorter than 34 bytes are rejected before any field is read. */
44  if (buf_size < 34) {
45  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
47  return AVERROR_INVALIDDATA;
48  return 0;
49  }
50 
51  bytestream2_init(&g, buf, buf_size);
52 
53  /* read the picture type */
54  type = bytestream2_get_be32u(&g);
/* NOTE(review): the range check on `type` (skipped lines 55 and 57) is not
 * visible; from the remaining lines an invalid type is logged and then either
 * rejected or replaced by 0 -- confirm the exact conditions. */
56  av_log(s, AV_LOG_ERROR, "Invalid picture type: %d.\n", type);
58  return AVERROR_INVALIDDATA;
59  }
60  type = 0;
61  }
62 
63  /* picture mimetype */
64  len = bytestream2_get_be32u(&g);
/* The mimetype must be non-empty and short enough to leave room for the
 * terminating NUL written into mimetype[] below. */
65  if (len <= 0 || len >= sizeof(mimetype)) {
66  av_log(s, AV_LOG_ERROR, "Could not read mimetype from an attached "
67  "picture.\n");
69  return AVERROR_INVALIDDATA;
70  return 0;
71  }
/* Besides the mimetype, 24 more bytes must remain: the fixed-size fields
 * read further down (description length 4 + width 4 + height 4 +
 * 8 skipped + data length 4). */
72  if (len + 24 > bytestream2_get_bytes_left(&g)) {
73  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
75  return AVERROR_INVALIDDATA;
76  return 0;
77  }
78  bytestream2_get_bufferu(&g, mimetype, len);
79  mimetype[len] = 0;
80 
/* Walk ff_id3v2_mime_tags until a matching string is found or the entry
 * with id AV_CODEC_ID_NONE is reached. */
81  while (mime->id != AV_CODEC_ID_NONE) {
82  if (!strncmp(mime->str, mimetype, sizeof(mimetype))) {
83  id = mime->id;
84  break;
85  }
86  mime++;
87  }
88  if (id == AV_CODEC_ID_NONE) {
89  av_log(s, AV_LOG_ERROR, "Unknown attached picture mimetype: %s.\n",
90  mimetype);
92  return AVERROR_INVALIDDATA;
93  return 0;
94  }
95 
96  /* picture description */
97  len = bytestream2_get_be32u(&g);
/* 20 bytes must remain after the description: width 4 + height 4 +
 * 8 skipped + data length 4. */
98  if (len > bytestream2_get_bytes_left(&g) - 20) {
99  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
101  return AVERROR_INVALIDDATA;
102  return 0;
103  }
/* The description is optional; when present it is copied into a
 * NUL-terminated heap buffer. */
104  if (len > 0) {
105  if (!(desc = av_malloc(len + 1))) {
106  return AVERROR(ENOMEM);
107  }
108 
109  bytestream2_get_bufferu(&g, desc, len);
110  desc[len] = 0;
111  }
112 
113  /* picture metadata */
114  width = bytestream2_get_be32u(&g);
115  height = bytestream2_get_be32u(&g);
/* The next 8 bytes are not interpreted by this function. */
116  bytestream2_skipu(&g, 8);
117 
118  /* picture data */
119  len = bytestream2_get_be32u(&g);
120 
121  left = bytestream2_get_bytes_left(&g);
/* len is unsigned, so `len <= 0` means len == 0. This branch handles an
 * empty picture or one that claims more data than the block contains. */
122  if (len <= 0 || len > left) {
123  if (len > MAX_TRUNC_PICTURE_SIZE || len >= INT_MAX - AV_INPUT_BUFFER_PADDING_SIZE) {
124  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too big %u\n", len);
126  ret = AVERROR_INVALIDDATA;
127  goto fail;
128  }
129 
130  // Work around a bug in FLAC muxers that write a truncated metadata picture block size if
131  // the picture size does not fit in 24 bits. lavf flacenc used to have the issue and, based
132  // on existing broken files, other unknown FLAC muxers seem to truncate too.
/* NOTE(review): skipped line 134 may add a further condition here. */
133  if (truncate_workaround &&
135  len > left && (len & 0xffffff) == left) {
136  av_log(s, AV_LOG_INFO, "Correcting truncated metadata picture size from %u to %u\n", left, len);
/* Number of picture bytes that lie beyond the end of the block. */
137  trunclen = len - left;
138  } else {
139  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
141  ret = AVERROR_INVALIDDATA;
142  goto fail;
143  }
144  }
/* The buffer holds the full picture plus padding that is zeroed below. */
145  if (!(data = av_buffer_alloc(len + AV_INPUT_BUFFER_PADDING_SIZE))) {
146  RETURN_ERROR(AVERROR(ENOMEM));
147  }
148 
149  if (trunclen == 0) {
150  bytestream2_get_bufferu(&g, data->data, len);
151  } else {
152  // If truncation was detected copy all data from block and read missing bytes
153  // not included in the block size
154  bytestream2_get_bufferu(&g, data->data, left);
/* NOTE(review): the statement executed on a short read is on skipped
 * line 156 and is not visible here. */
155  if (avio_read(s->pb, data->data + len - trunclen, trunclen) < trunclen)
157  }
158  memset(data->data + len, 0, AV_INPUT_BUFFER_PADDING_SIZE);
159 
/* A PNG signature at the start of the data overrides the codec id chosen
 * from the mimetype. */
160  if (AV_RB64(data->data) == PNGSIG)
161  id = AV_CODEC_ID_PNG;
162 
163  st = avformat_new_stream(s, NULL);
164  if (!st) {
165  RETURN_ERROR(AVERROR(ENOMEM));
166  }
167 
/* Hand the picture buffer to the stream's attached_pic packet.
 * NOTE(review): skipped lines 168, 173, 175 and 176 presumably set further
 * packet/stream fields -- confirm against the complete source. */
169  st->attached_pic.buf = data;
170  st->attached_pic.data = data->data;
171  st->attached_pic.size = len;
172  st->attached_pic.stream_index = st->index;
174 
177  st->codecpar->codec_id = id;
178  st->codecpar->width = width;
179  st->codecpar->height = height;
/* The picture type is exported as its ff_id3v2_picture_types string. */
180  av_dict_set(&st->metadata, "comment", ff_id3v2_picture_types[type], 0);
/* AV_DICT_DONT_STRDUP_VAL passes ownership of desc to the dictionary, so it
 * is not freed on this success path. */
181  if (desc)
182  av_dict_set(&st->metadata, "title", desc, AV_DICT_DONT_STRDUP_VAL);
183 
184  return 0;
185 
/* Error exit: release the picture buffer and the description string. */
186 fail:
187  av_buffer_unref(&data);
188  av_freep(&desc);
189 
190  return ret;
191 }
#define NULL
Definition: coverity.c:32
#define MAX_TRUNC_PICTURE_SIZE
Definition: flac_picture.c:30
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it...
Definition: buffer.c:125
ptrdiff_t const GLvoid * data
Definition: opengl_enc.c:100
const char * desc
Definition: libsvtav1.c:79
const char * g
Definition: vf_curves.c:115
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:60
int index
stream index in AVFormatContext
Definition: avformat.h:877
int size
Definition: packet.h:364
static av_always_inline void bytestream2_init(GetByteContext *g, const uint8_t *buf, int buf_size)
Definition: bytestream.h:133
GLint GLenum type
Definition: opengl_enc.c:104
int strict_std_compliance
Allow non-standard and experimental extension.
Definition: avformat.h:1659
static av_always_inline unsigned int bytestream2_get_bufferu(GetByteContext *g, uint8_t *dst, unsigned int size)
Definition: bytestream.h:273
Format I/O context.
Definition: avformat.h:1351
char str[32]
Definition: internal.h:48
uint8_t
#define av_malloc(s)
int width
Video only.
Definition: codec_par.h:126
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: utils.c:4450
#define height
uint8_t * data
Definition: packet.h:363
static av_always_inline void bytestream2_skipu(GetByteContext *g, unsigned int size)
Definition: bytestream.h:170
enum AVCodecID id
Definition: internal.h:49
#define av_log(a,...)
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:637
#define AV_PKT_FLAG_KEY
The packet contains a keyframe.
Definition: packet.h:401
static av_always_inline int bytestream2_get_bytes_left(GetByteContext *g)
Definition: bytestream.h:154
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:46
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:194
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:56
AVBufferRef * buf
A reference to the reference-counted buffer where the packet data is stored.
Definition: packet.h:346
#define PNGSIG
Definition: png.h:47
#define fail()
Definition: checkasm.h:123
int flags
A combination of AV_PKT_FLAG values.
Definition: packet.h:369
const CodecMime ff_id3v2_mime_tags[]
Definition: id3v2.c:131
#define width
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation functio...
Definition: dict.h:76
#define s(width, name)
Definition: cbs_vp9.c:257
#define AV_EF_EXPLODE
abort decoding on minor error detection
Definition: avcodec.h:1666
AVDictionary * metadata
Definition: avformat.h:940
#define FF_ARRAY_ELEMS(a)
#define AV_DISPOSITION_ATTACHED_PIC
The stream is stored in the file as an attached picture/"cover art" (e.g.
Definition: avformat.h:844
Stream structure.
Definition: avformat.h:876
#define AV_LOG_INFO
Standard information.
Definition: log.h:205
AVBufferRef * av_buffer_alloc(int size)
Allocate an AVBuffer of the given size using av_malloc().
Definition: buffer.c:67
AVIOContext * pb
I/O context.
Definition: avformat.h:1393
uint8_t * data
The data buffer.
Definition: buffer.h:89
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2]...the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so...,+,-,+,-,+,+,-,+,-,+,...hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32-hcoeff[1]-hcoeff[2]-...a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2}an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||.........intra?||||:Block01:yes no||||:Block02:.................||||:Block03::y DC::ref index:||||:Block04::cb DC::motion x:||||.........:cr DC::motion 
y:||||.................|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------------------------------|||Y subbands||Cb subbands||Cr subbands||||------||------||------|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||------||------||------||||------||------||------|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||------||------||------||||------||------||------|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||------||------||------||||------||------||------|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------------------------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction------------|\Dequantization-------------------\||Reference frames|\IDWT|--------------|Motion\|||Frame 0||Frame 1||Compensation.OBMC v-------|--------------|--------------.\------> Frame n output Frame Frame<----------------------------------/|...|-------------------Range Coder:============Binary Range Coder:-------------------The implemented range coder is an adapted version based upon"Range encoding: an algorithm for removing redundancy from a digitised message."by G.N.N.Martin.The symbols encoded by the Snow range coder are bits(0|1).The associated probabilities are not fix but change depending on the symbol mix seen so far.bit seen|new state---------+-----------------------------------------------0|256-state_transition_table[256-old_state];1|state_transition_table[old_state];state_transition_table={0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 
106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:-------------------------FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector Prediction:=========================1.the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:206
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
#define FF_COMPLIANCE_NORMAL
Definition: avcodec.h:1592
A reference to a data buffer.
Definition: buffer.h:81
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_RB64
Definition: bytestream.h:87
Main libavformat public API header.
int error_recognition
Error recognition; higher values will detect more errors but may misdetect some more or less valid pa...
Definition: avformat.h:1618
int disposition
AV_DISPOSITION_* bit field.
Definition: avformat.h:929
void av_init_packet(AVPacket *pkt)
Initialize optional fields of a packet with default values.
Definition: avpacket.c:35
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
Definition: avcodec.h:215
int len
int ff_flac_parse_picture(AVFormatContext *s, uint8_t *buf, int buf_size, int truncate_workaround)
Definition: flac_picture.c:32
#define av_freep(p)
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1023
const char *const ff_id3v2_picture_types[21]
Definition: id3v2.c:107
int stream_index
Definition: packet.h:365
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later.That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another.Frame references ownership and permissions
enum AVCodecID id
AVPacket attached_pic
For streams with AV_DISPOSITION_ATTACHED_PIC disposition, this packet will contain the attached pictu...
Definition: avformat.h:958
#define RETURN_ERROR(code)
Definition: avidec.c:468