FFmpeg
 All Data Structures Namespaces Files Functions Variables Typedefs Enumerations Enumerator Macros Groups Pages
vorbis_parser.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2012 Justin Ruggles
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 /**
22  * @file
23  * Vorbis audio parser
24  *
25  * Determines the duration for each packet.
26  */
27 
28 #include "libavutil/log.h"
29 
30 #include "get_bits.h"
31 #include "parser.h"
32 #include "xiph.h"
33 #include "vorbis_parser_internal.h"
34 
35 static const AVClass vorbis_parser_class = {
36  .class_name = "Vorbis parser",
37  .item_name = av_default_item_name,
38  .version = LIBAVUTIL_VERSION_INT,
39 };
40 
42  const uint8_t *buf, int buf_size)
43 {
44  /* Id header should be 30 bytes */
45  if (buf_size < 30) {
46  av_log(s, AV_LOG_ERROR, "Id header is too short\n");
47  return AVERROR_INVALIDDATA;
48  }
49 
50  /* make sure this is the Id header */
51  if (buf[0] != 1) {
52  av_log(s, AV_LOG_ERROR, "Wrong packet type in Id header\n");
53  return AVERROR_INVALIDDATA;
54  }
55 
56  /* check for header signature */
57  if (memcmp(&buf[1], "vorbis", 6)) {
58  av_log(s, AV_LOG_ERROR, "Invalid packet signature in Id header\n");
59  return AVERROR_INVALIDDATA;
60  }
61 
62  if (!(buf[29] & 0x1)) {
63  av_log(s, AV_LOG_ERROR, "Invalid framing bit in Id header\n");
64  return AVERROR_INVALIDDATA;
65  }
66 
67  s->blocksize[0] = 1 << (buf[28] & 0xF);
68  s->blocksize[1] = 1 << (buf[28] >> 4);
69 
70  return 0;
71 }
72 
74  const uint8_t *buf, int buf_size)
75 {
76  GetBitContext gb, gb0;
77  uint8_t *rev_buf;
78  int i, ret = 0;
79  int got_framing_bit, mode_count, got_mode_header, last_mode_count = 0;
80 
81  /* avoid overread */
82  if (buf_size < 7) {
83  av_log(s, AV_LOG_ERROR, "Setup header is too short\n");
84  return AVERROR_INVALIDDATA;
85  }
86 
87  /* make sure this is the Setup header */
88  if (buf[0] != 5) {
89  av_log(s, AV_LOG_ERROR, "Wrong packet type in Setup header\n");
90  return AVERROR_INVALIDDATA;
91  }
92 
93  /* check for header signature */
94  if (memcmp(&buf[1], "vorbis", 6)) {
95  av_log(s, AV_LOG_ERROR, "Invalid packet signature in Setup header\n");
96  return AVERROR_INVALIDDATA;
97  }
98 
99  /* reverse bytes so we can easily read backwards with get_bits() */
100  if (!(rev_buf = av_malloc(buf_size))) {
101  av_log(s, AV_LOG_ERROR, "Out of memory\n");
102  return AVERROR(ENOMEM);
103  }
104  for (i = 0; i < buf_size; i++)
105  rev_buf[i] = buf[buf_size - 1 - i];
106  init_get_bits(&gb, rev_buf, buf_size * 8);
107 
108  got_framing_bit = 0;
109  while (get_bits_left(&gb) > 97) {
110  if (get_bits1(&gb)) {
111  got_framing_bit = get_bits_count(&gb);
112  break;
113  }
114  }
115  if (!got_framing_bit) {
116  av_log(s, AV_LOG_ERROR, "Invalid Setup header\n");
117  ret = AVERROR_INVALIDDATA;
118  goto bad_header;
119  }
120 
121  /* Now we search backwards to find possible valid mode counts. This is not
122  * fool-proof because we could have false positive matches and read too
123  * far, but there isn't really any way to be sure without parsing through
124  * all the many variable-sized fields before the modes. This approach seems
125  * to work well in testing, and it is similar to how it is handled in
126  * liboggz. */
127  mode_count = 0;
128  got_mode_header = 0;
129  while (get_bits_left(&gb) >= 97) {
130  if (get_bits(&gb, 8) > 63 || get_bits(&gb, 16) || get_bits(&gb, 16))
131  break;
132  skip_bits(&gb, 1);
133  mode_count++;
134  if (mode_count > 64)
135  break;
136  gb0 = gb;
137  if (get_bits(&gb0, 6) + 1 == mode_count) {
138  got_mode_header = 1;
139  last_mode_count = mode_count;
140  }
141  }
142  if (!got_mode_header) {
143  av_log(s, AV_LOG_ERROR, "Invalid Setup header\n");
144  ret = AVERROR_INVALIDDATA;
145  goto bad_header;
146  }
147  /* All samples I've seen use <= 2 modes, so ask for a sample if we find
148  * more than that, as it is most likely a false positive. If we get any
149  * we may need to approach this the long way and parse the whole Setup
150  * header, but I hope very much that it never comes to that. */
151  if (last_mode_count > 2) {
153  "%d modes (either a false positive or a "
154  "sample from an unknown encoder)",
155  last_mode_count);
156  }
157  /* We're limiting the mode count to 63 so that we know that the previous
158  * block flag will be in the first packet byte. */
159  if (last_mode_count > 63) {
160  av_log(s, AV_LOG_ERROR, "Unsupported mode count: %d\n",
161  last_mode_count);
162  ret = AVERROR_INVALIDDATA;
163  goto bad_header;
164  }
165  s->mode_count = mode_count = last_mode_count;
166  /* Determine the number of bits required to code the mode and turn that
167  * into a bitmask to directly access the mode from the first frame byte. */
168  s->mode_mask = ((1 << (av_log2(mode_count - 1) + 1)) - 1) << 1;
169  /* The previous window flag is the next bit after the mode */
170  s->prev_mask = (s->mode_mask | 0x1) + 1;
171 
172  init_get_bits(&gb, rev_buf, buf_size * 8);
173  skip_bits_long(&gb, got_framing_bit);
174  for (i = mode_count - 1; i >= 0; i--) {
175  skip_bits_long(&gb, 40);
176  s->mode_blocksize[i] = get_bits1(&gb);
177  }
178 
179 bad_header:
180  av_free(rev_buf);
181  return ret;
182 }
183 
185  const uint8_t *extradata, int extradata_size)
186 {
187  const uint8_t *header_start[3];
188  int header_len[3];
189  int ret;
190 
192  s->extradata_parsed = 1;
193 
194  if ((ret = avpriv_split_xiph_headers(extradata,
195  extradata_size, 30,
196  header_start, header_len)) < 0) {
197  av_log(s, AV_LOG_ERROR, "Extradata corrupt.\n");
198  return ret;
199  }
200 
201  if ((ret = parse_id_header(s, header_start[0], header_len[0])) < 0)
202  return ret;
203 
204  if ((ret = parse_setup_header(s, header_start[2], header_len[2])) < 0)
205  return ret;
206 
207  s->valid_extradata = 1;
209 
210  return 0;
211 }
212 
214  int buf_size, int *flags)
215 {
216  int duration = 0;
217 
218  if (s->valid_extradata && buf_size > 0) {
219  int mode, current_blocksize;
220  int previous_blocksize = s->previous_blocksize;
221 
222  if (buf[0] & 1) {
223  /* If the user doesn't care about special packets, it's a bad one. */
224  if (!flags)
225  goto bad_packet;
226 
227  /* Set the flag for which kind of special packet it is. */
228  if (buf[0] == 1)
229  *flags |= VORBIS_FLAG_HEADER;
230  else if (buf[0] == 3)
231  *flags |= VORBIS_FLAG_COMMENT;
232  else if (buf[0] == 5)
233  *flags |= VORBIS_FLAG_SETUP;
234  else
235  goto bad_packet;
236 
237  /* Special packets have no duration. */
238  return 0;
239 
240 bad_packet:
241  av_log(s, AV_LOG_ERROR, "Invalid packet\n");
242  return AVERROR_INVALIDDATA;
243  }
244  if (s->mode_count == 1)
245  mode = 0;
246  else
247  mode = (buf[0] & s->mode_mask) >> 1;
248  if (mode >= s->mode_count) {
249  av_log(s, AV_LOG_ERROR, "Invalid mode in packet\n");
250  return AVERROR_INVALIDDATA;
251  }
252  if(s->mode_blocksize[mode]){
253  int flag = !!(buf[0] & s->prev_mask);
254  previous_blocksize = s->blocksize[flag];
255  }
256  current_blocksize = s->blocksize[s->mode_blocksize[mode]];
257  duration = (previous_blocksize + current_blocksize) >> 2;
258  s->previous_blocksize = current_blocksize;
259  }
260 
261  return duration;
262 }
263 
265  int buf_size)
266 {
267  return av_vorbis_parse_frame_flags(s, buf, buf_size, NULL);
268 }
269 
271 {
272  if (s->valid_extradata)
273  s->previous_blocksize = s->blocksize[0];
274 }
275 
277 {
278  av_freep(s);
279 }
280 
282  int extradata_size)
283 {
284  AVVorbisParseContext *s = av_mallocz(sizeof(*s));
285  int ret;
286 
287  if (!s)
288  return NULL;
289 
290  ret = vorbis_parse_init(s, extradata, extradata_size);
291  if (ret < 0) {
293  return NULL;
294  }
295 
296  return s;
297 }
298 
299 #if LIBAVCODEC_VERSION_MAJOR < 57
301 {
302  return vorbis_parse_init(s, avctx->extradata, avctx->extradata_size);
303 }
305 {
307 }
309  int buf_size)
310 {
311  return av_vorbis_parse_frame(s, buf, buf_size);
312 }
314  int buf_size, int *flags)
315 {
316  return av_vorbis_parse_frame_flags(s, buf, buf_size, flags);
317 }
318 #endif
319 
320 #if CONFIG_VORBIS_PARSER
321 
322 typedef struct VorbisParseContext {
324 } VorbisParseContext;
325 
326 static int vorbis_parse(AVCodecParserContext *s1, AVCodecContext *avctx,
327  const uint8_t **poutbuf, int *poutbuf_size,
328  const uint8_t *buf, int buf_size)
329 {
330  VorbisParseContext *s = s1->priv_data;
331  int duration;
332 
333  if (!s->vp && avctx->extradata && avctx->extradata_size) {
334  s->vp = av_vorbis_parse_init(avctx->extradata, avctx->extradata_size);
335  }
336  if (!s->vp)
337  goto end;
338 
339  if ((duration = av_vorbis_parse_frame(s->vp, buf, buf_size)) >= 0)
340  s1->duration = duration;
341 
342 end:
343  /* always return the full packet. this parser isn't doing any splitting or
344  combining, only packet analysis */
345  *poutbuf = buf;
346  *poutbuf_size = buf_size;
347  return buf_size;
348 }
349 
350 static void vorbis_parser_close(AVCodecParserContext *ctx)
351 {
352  VorbisParseContext *s = ctx->priv_data;
353  av_vorbis_parse_free(&s->vp);
354 }
355 
356 AVCodecParser ff_vorbis_parser = {
358  .priv_data_size = sizeof(VorbisParseContext),
359  .parser_parse = vorbis_parse,
360  .parser_close = vorbis_parser_close,
361 };
362 #endif /* CONFIG_VORBIS_PARSER */