FFmpeg
flac_picture.c
Go to the documentation of this file.
1 /*
2  * Raw FLAC picture parser
3  * Copyright (c) 2001 Fabrice Bellard
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/intreadwrite.h"
23 #include "libavcodec/bytestream.h"
24 #include "libavcodec/png.h"
25 #include "avformat.h"
26 #include "flac_picture.h"
27 #include "id3v2.h"
28 #include "internal.h"
29 
/* 500 MiB. NOTE(review): judging by the name this caps the picture size accepted
 * when a truncated block length is being worked around; the use site is not
 * visible in this extract -- confirm against ff_flac_parse_picture(). */
30 #define MAX_TRUNC_PICTURE_SIZE (500 * 1024 * 1024)
31 
32 int ff_flac_parse_picture(AVFormatContext *s, uint8_t *buf, int buf_size, int truncate_workaround)
33 {
34  const CodecMime *mime = ff_id3v2_mime_tags;
35  enum AVCodecID id = AV_CODEC_ID_NONE;
37  uint8_t mimetype[64], *desc = NULL;
39  AVStream *st;
40  int width, height, ret = 0;
41  unsigned int type;
42  uint32_t len, left, trunclen = 0;
43 
44  if (buf_size < 34) {
45  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
46  if (s->error_recognition & AV_EF_EXPLODE)
47  return AVERROR_INVALIDDATA;
48  return 0;
49  }
50 
51  bytestream2_init(&g, buf, buf_size);
52 
53  /* read the picture type */
54  type = bytestream2_get_be32u(&g);
56  av_log(s, AV_LOG_ERROR, "Invalid picture type: %d.\n", type);
57  if (s->error_recognition & AV_EF_EXPLODE) {
58  return AVERROR_INVALIDDATA;
59  }
60  type = 0;
61  }
62 
63  /* picture mimetype */
64  len = bytestream2_get_be32u(&g);
65  if (len <= 0 || len >= sizeof(mimetype)) {
66  av_log(s, AV_LOG_ERROR, "Could not read mimetype from an attached "
67  "picture.\n");
68  if (s->error_recognition & AV_EF_EXPLODE)
69  return AVERROR_INVALIDDATA;
70  return 0;
71  }
72  if (len + 24 > bytestream2_get_bytes_left(&g)) {
73  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
74  if (s->error_recognition & AV_EF_EXPLODE)
75  return AVERROR_INVALIDDATA;
76  return 0;
77  }
78  bytestream2_get_bufferu(&g, mimetype, len);
79  mimetype[len] = 0;
80 
81  while (mime->id != AV_CODEC_ID_NONE) {
82  if (!strncmp(mime->str, mimetype, sizeof(mimetype))) {
83  id = mime->id;
84  break;
85  }
86  mime++;
87  }
88  if (id == AV_CODEC_ID_NONE) {
89  av_log(s, AV_LOG_ERROR, "Unknown attached picture mimetype: %s.\n",
90  mimetype);
91  if (s->error_recognition & AV_EF_EXPLODE)
92  return AVERROR_INVALIDDATA;
93  return 0;
94  }
95 
96  /* picture description */
97  len = bytestream2_get_be32u(&g);
98  if (len > bytestream2_get_bytes_left(&g) - 20) {
99  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
100  if (s->error_recognition & AV_EF_EXPLODE)
101  return AVERROR_INVALIDDATA;
102  return 0;
103  }
104  if (len > 0) {
105  if (!(desc = av_malloc(len + 1))) {
106  return AVERROR(ENOMEM);
107  }
108 
110  desc[len] = 0;
111  }
112 
113  /* picture metadata */
114  width = bytestream2_get_be32u(&g);
115  height = bytestream2_get_be32u(&g);
116  bytestream2_skipu(&g, 8);
117 
118  /* picture data */
119  len = bytestream2_get_be32u(&g);
120 
122  if (len <= 0 || len > left) {
124  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too big %u\n", len);
125  if (s->error_recognition & AV_EF_EXPLODE)
127  goto fail;
128  }
129 
130  // Workaround bug for flac muxers that writs truncated metadata picture block size if
131  // the picture size do not fit in 24 bits. lavf flacenc used to have the issue and based
132  // on existing broken files other unknown flac muxers seems to truncate also.
133  if (truncate_workaround &&
134  s->strict_std_compliance <= FF_COMPLIANCE_NORMAL &&
135  len > left && (len & 0xffffff) == left) {
136  av_log(s, AV_LOG_INFO, "Correcting truncated metadata picture size from %u to %u\n", left, len);
137  trunclen = len - left;
138  } else {
139  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
140  if (s->error_recognition & AV_EF_EXPLODE)
142  goto fail;
143  }
144  }
146  RETURN_ERROR(AVERROR(ENOMEM));
147  }
148 
149  if (trunclen == 0) {
150  bytestream2_get_bufferu(&g, data->data, len);
151  } else {
152  // If truncation was detected copy all data from block and read missing bytes
153  // not included in the block size
155  if (avio_read(s->pb, data->data + len - trunclen, trunclen) < trunclen)
157  }
158  memset(data->data + len, 0, AV_INPUT_BUFFER_PADDING_SIZE);
159 
160  if (AV_RB64(data->data) == PNGSIG)
161  id = AV_CODEC_ID_PNG;
162 
164  if (ret < 0)
165  RETURN_ERROR(ret);
166 
167  st = s->streams[s->nb_streams - 1];
168  st->codecpar->codec_id = id;
169  st->codecpar->width = width;
170  st->codecpar->height = height;
171  av_dict_set(&st->metadata, "comment", ff_id3v2_picture_types[type], 0);
172  if (desc)
174 
175  return 0;
176 
177 fail:
179  av_freep(&desc);
180 
181  return ret;
182 }
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
GetByteContext
Definition: bytestream.h:33
bytestream2_skipu
static av_always_inline void bytestream2_skipu(GetByteContext *g, unsigned int size)
Definition: bytestream.h:174
id3v2.h
RETURN_ERROR
#define RETURN_ERROR(code)
Definition: avidec.c:477
data
const char data[16]
Definition: mxf.c:142
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31
CodecMime
Definition: internal.h:47
fail
#define fail()
Definition: checkasm.h:134
type
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf type
Definition: writing_filters.txt:86
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation function.
Definition: dict.h:74
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:181
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
width
#define width
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
g
const char * g
Definition: vf_curves.c:117
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:126
flac_picture.h
AV_CODEC_ID_PNG
@ AV_CODEC_ID_PNG
Definition: codec_id.h:110
AVFormatContext
Format I/O context.
Definition: avformat.h:1106
internal.h
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:979
NULL
#define NULL
Definition: coverity.c:32
av_buffer_unref
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
Definition: buffer.c:125
AVStream::metadata
AVDictionary * metadata
Definition: avformat.h:890
AV_EF_EXPLODE
#define AV_EF_EXPLODE
abort decoding on minor error detection
Definition: avcodec.h:1441
ff_id3v2_picture_types
const char *const ff_id3v2_picture_types[21]
Definition: id3v2.c:107
ff_id3v2_mime_tags
const CodecMime ff_id3v2_mime_tags[]
Definition: id3v2.c:131
bytestream2_get_bytes_left
static av_always_inline int bytestream2_get_bytes_left(GetByteContext *g)
Definition: bytestream.h:158
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:46
id
enum AVCodecID id
Definition: extract_extradata_bsf.c:325
height
#define height
av_buffer_alloc
AVBufferRef * av_buffer_alloc(size_t size)
Allocate an AVBuffer of the given size using av_malloc().
Definition: buffer.c:67
FF_COMPLIANCE_NORMAL
#define FF_COMPLIANCE_NORMAL
Definition: avcodec.h:1389
PNGSIG
#define PNGSIG
Definition: png.h:49
AV_LOG_INFO
#define AV_LOG_INFO
Standard information.
Definition: log.h:192
AV_CODEC_ID_NONE
@ AV_CODEC_ID_NONE
Definition: codec_id.h:47
AVCodecParameters::height
int height
Definition: codec_par.h:127
len
int len
Definition: vorbis_enc_data.h:426
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:832
avformat.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: avcodec.h:192
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:616
CodecMime::str
char str[32]
Definition: internal.h:48
MAX_TRUNC_PICTURE_SIZE
#define MAX_TRUNC_PICTURE_SIZE
Definition: flac_picture.c:30
CodecMime::id
enum AVCodecID id
Definition: internal.h:49
desc
const char * desc
Definition: libsvtav1.c:79
ff_flac_parse_picture
int ff_flac_parse_picture(AVFormatContext *s, uint8_t *buf, int buf_size, int truncate_workaround)
Definition: flac_picture.c:32
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:84
bytestream2_get_bufferu
static av_always_inline unsigned int bytestream2_get_bufferu(GetByteContext *g, uint8_t *dst, unsigned int size)
Definition: bytestream.h:277
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:60
png.h
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
bytestream.h
bytestream2_init
static av_always_inline void bytestream2_init(GetByteContext *g, const uint8_t *buf, int buf_size)
Definition: bytestream.h:137
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
AV_RB64
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_RB64
Definition: bytestream.h:95
ff_add_attached_pic
int ff_add_attached_pic(AVFormatContext *s, AVStream *st, AVIOContext *pb, AVBufferRef **buf, int size)
Add an attached pic to an AVStream.
Definition: utils.c:420