FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config_components.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/mem.h"
37 #include "libavutil/opt.h"
38 #include "libavcodec/internal.h"
39 #include "avformat.h"
40 #include "avio.h"
41 #include "avio_internal.h"
42 #include "demux.h"
43 #include "id3v2.h"
44 #include "internal.h"
45 #include "metadata.h"
46 #include "pcm.h"
47 #include "riff.h"
48 #include "w64.h"
49 #include "spdif.h"
50 
51 typedef struct WAVDemuxContext {
52  const AVClass *class;
54  int w64;
59  int smv_block;
61  int smv_eof;
62  int audio_eof;
64  int max_size;
65  int spdif;
67  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
68  int rifx; // RIFX: integer byte order for parameters is big endian
70 
/* Byte offset of a WAVDemuxContext member, used by the option table below. */
71 #define OFFSET(x) offsetof(WAVDemuxContext, x)
/* Shorthand for the decoding-parameter option flag. */
72 #define DEC AV_OPT_FLAG_DECODING_PARAM
/*
 * Private demuxer options. This table is referenced by wav_demuxer_class.
 * The "ignore_length" entry is only compiled in when CONFIG_WAV_DEMUXER is
 * set; "max_size" is always present and accepts values from 0 to 1 << 22.
 */
73 static const AVOption demux_options[] = {
/* Evaluates to 1 when the WAV demuxer is enabled and 0 otherwise, which
 * matches the number of WAV-only entries placed ahead of "max_size".
 * NOTE(review): presumably used as the index where the W64 demuxer's options
 * start -- confirm against w64_demuxer_class. */
74 #define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
75 #if CONFIG_WAV_DEMUXER
76  { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
77 #endif
78  { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1 << 22, DEC },
/* Table terminator. */
79  { NULL },
80 };
81 
82 static void set_max_size(AVStream *st, WAVDemuxContext *wav)
83 {
84  if (wav->max_size <= 0) {
85  int max_size = ff_pcm_default_packet_size(st->codecpar);
86  wav->max_size = max_size < 0 ? 4096 : max_size;
87  }
88 }
89 
91 {
92  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
93  enum AVCodecID codec;
94  int len = 1<<16;
95  int ret = ffio_ensure_seekback(s->pb, len);
96 
97  if (ret >= 0) {
98  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
99  if (!buf) {
100  ret = AVERROR(ENOMEM);
101  } else {
102  int64_t pos = avio_tell(s->pb);
103  len = ret = avio_read(s->pb, buf, len);
104  if (len >= 0) {
105  ret = ff_spdif_probe(buf, len, &codec);
107  s->streams[0]->codecpar->codec_id = codec;
108  wav->spdif = 1;
109  }
110  }
111  avio_seek(s->pb, pos, SEEK_SET);
112  av_free(buf);
113  }
114  }
115 
116  if (ret < 0)
117  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
118  }
119 }
120 
121 #if CONFIG_WAV_DEMUXER
122 
123 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
124 {
125  *tag = avio_rl32(pb);
126  if (!big_endian) {
127  return avio_rl32(pb);
128  } else {
129  return avio_rb32(pb);
130  }
131 }
132 
133 /* RIFF chunks are always at even offsets relative to where they start. */
134 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset)
135 {
136  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
137 
138  return avio_seek(s, offset, SEEK_SET);
139 }
140 
141 /* return the size of the found tag */
142 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
143 {
144  unsigned int tag;
145  int64_t size;
146 
147  if (avio_tell(pb) + wav->unaligned & 1)
148  avio_skip(pb, 1);
149 
150  for (;;) {
151  if (avio_feof(pb))
152  return AVERROR_EOF;
153  size = next_tag(pb, &tag, wav->rifx);
154  if (tag == tag1)
155  break;
156  avio_skip(pb, size + (size & 1));
157  }
158  return size;
159 }
160 
161 static int wav_probe(const AVProbeData *p)
162 {
163  /* check file header */
164  if (p->buf_size <= 32)
165  return 0;
166  if (!memcmp(p->buf + 8, "WAVE", 4)) {
167  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
168  /* Since the ACT demuxer has a standard WAV header at the top of
169  * its own, the returned score is decreased to avoid a probe
170  * conflict between ACT and WAV. */
171  return AVPROBE_SCORE_MAX - 1;
172  else if ((!memcmp(p->buf, "RF64", 4) ||
173  !memcmp(p->buf, "BW64", 4)) &&
174  !memcmp(p->buf + 12, "ds64", 4))
175  return AVPROBE_SCORE_MAX;
176  }
177  return 0;
178 }
179 
180 static void handle_stream_probing(AVStream *st)
181 {
183  FFStream *const sti = ffstream(st);
185  sti->probe_packets = FFMIN(sti->probe_packets, 32);
186  }
187 }
188 
/**
 * Parse a 'fmt ' chunk into the stream's codec parameters.
 *
 * Passes the chunk to ff_get_wav_header() (using the context's rifx flag for
 * byte order), runs handle_stream_probing() on the stream and sets the
 * stream time base to 1 / sample_rate with 64-bit timestamps.
 *
 * @param s    demuxer context
 * @param size size passed on to ff_get_wav_header()
 * @param st   stream to fill in
 * @return 0 on success, or the negative value returned by ff_get_wav_header()
 */
189 static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
190 {
191  AVIOContext *pb = s->pb;
192  WAVDemuxContext *wav = s->priv_data;
193  int ret;
194 
195  /* parse fmt header */
196  ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
197  if (ret < 0)
198  return ret;
199  handle_stream_probing(st);
200 
/* NOTE(review): the embedded listing numbers jump from 200 to 202 here, so a
 * statement appears to have been lost in extraction -- check the upstream
 * file before relying on this block. */
202 
203  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
204 
205  return 0;
206 }
207 
/**
 * Parse an 'XMA2' chunk.
 *
 * Validates the chunk size and version, reads the sample rate and stream
 * duration, sets the stream time base to 1 / sample_rate, then rewinds and
 * stores the whole chunk as extradata.
 *
 * @param s    demuxer context
 * @param size chunk payload size in bytes
 * @param st   stream to fill in
 * @return 0 on success, AVERROR_INVALIDDATA for a malformed chunk, or the
 *         negative value returned by ff_get_extradata()
 */
208 static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
209 {
210  AVIOContext *pb = s->pb;
211  int version, num_streams, i, channels = 0, ret;
212 
213  if (size < 36)
214  return AVERROR_INVALIDDATA;
215 
/* NOTE(review): the embedded listing numbers jump from 215 to 219 here, so
 * statements appear to have been lost in extraction. */
219 
220  version = avio_r8(pb);
/* Only versions 3 and 4 are accepted. */
221  if (version != 3 && version != 4)
222  return AVERROR_INVALIDDATA;
223  num_streams = avio_r8(pb);
/* Expected size: 32 fixed bytes, 8 more for version 4, and 4 bytes per
 * stream entry. */
224  if (size != (32 + ((version==3)?0:8) + 4*num_streams))
225  return AVERROR_INVALIDDATA;
226  avio_skip(pb, 10);
227  st->codecpar->sample_rate = avio_rb32(pb);
228  if (version == 4)
229  avio_skip(pb, 8);
230  avio_skip(pb, 4);
231  st->duration = avio_rb32(pb);
232  avio_skip(pb, 8);
233 
/* Sum the first byte of every 4-byte stream entry. */
234  for (i = 0; i < num_streams; i++) {
235  channels += avio_r8(pb);
236  avio_skip(pb, 3);
237  }
/* NOTE(review): the embedded listing numbers jump from 237 to 241 here. In
 * the visible code `channels` is accumulated but never used; presumably the
 * missing lines stored it in ch_layout.nb_channels -- confirm upstream. */
241 
242  if (st->codecpar->ch_layout.nb_channels <= 0 || st->codecpar->sample_rate <= 0)
243  return AVERROR_INVALIDDATA;
244 
245  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
246 
/* Exactly `size` bytes have been consumed above, so this rewinds to the
 * start of the chunk payload before it is copied as extradata. */
247  avio_seek(pb, -size, SEEK_CUR);
248  if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
249  return ret;
250 
251  return 0;
252 }
253 
254 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
255  int length)
256 {
257  char temp[257];
258  int ret;
259 
260  av_assert0(length < sizeof(temp));
261  if ((ret = ffio_read_size(s->pb, temp, length)) < 0)
262  return ret;
263 
264  temp[length] = 0;
265 
266  if (strlen(temp))
267  return av_dict_set(&s->metadata, key, temp, 0);
268 
269  return 0;
270 }
271 
272 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
273 {
274  char temp[131], *coding_history;
275  int ret, x;
276  uint64_t time_reference;
277  int64_t umid_parts[8], umid_mask = 0;
278 
279  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
280  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
281  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
282  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
283  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
284  return ret;
285 
286  time_reference = avio_rl64(s->pb);
287  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
288  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
289  return ret;
290 
291  /* check if version is >= 1, in which case an UMID may be present */
292  if (avio_rl16(s->pb) >= 1) {
293  for (x = 0; x < 8; x++)
294  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
295 
296  if (umid_mask) {
297  /* the string formatting below is per SMPTE 330M-2004 Annex C */
298  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
299  umid_parts[6] == 0 && umid_parts[7] == 0) {
300  /* basic UMID */
301  snprintf(temp, sizeof(temp),
302  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
303  umid_parts[0], umid_parts[1],
304  umid_parts[2], umid_parts[3]);
305  } else {
306  /* extended UMID */
307  snprintf(temp, sizeof(temp),
308  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
309  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
310  umid_parts[0], umid_parts[1],
311  umid_parts[2], umid_parts[3],
312  umid_parts[4], umid_parts[5],
313  umid_parts[6], umid_parts[7]);
314  }
315 
316  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
317  return ret;
318  }
319 
320  avio_skip(s->pb, 190);
321  } else
322  avio_skip(s->pb, 254);
323 
324  if (size > 602) {
325  /* CodingHistory present */
326  size -= 602;
327 
328  if (!(coding_history = av_malloc(size + 1)))
329  return AVERROR(ENOMEM);
330 
331  if ((ret = ffio_read_size(s->pb, coding_history, size)) < 0) {
332  av_free(coding_history);
333  return ret;
334  }
335 
336  coding_history[size] = 0;
337  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
339  return ret;
340  }
341 
342  return 0;
343 }
344 
/*
 * Metadata key pairs handed to ff_metadata_conv_ctx() by the header readers.
 * The first key of each pair is one of the names set by wav_parse_bext_tag().
 * NOTE(review): presumably each pair maps that name to a generic metadata
 * key -- confirm the column order against metadata.h.
 */
345 static const AVMetadataConv wav_metadata_conv[] = {
346  { "description", "comment" },
347  { "originator", "encoded_by" },
348  { "origination_date", "date" },
349  { "origination_time", "creation_time" },
/* Table terminator. */
350  { 0 },
351 };
352 
353 /* wav input */
354 static int wav_read_header(AVFormatContext *s)
355 {
356  int64_t size, av_uninit(data_size);
357  int64_t sample_count = 0;
358  int rf64 = 0, bw64 = 0;
359  uint32_t tag;
360  AVIOContext *pb = s->pb;
361  AVStream *st = NULL;
362  WAVDemuxContext *wav = s->priv_data;
363  int ret, got_fmt = 0, got_xma2 = 0;
364  int64_t next_tag_ofs, data_ofs = -1;
365 
366  wav->unaligned = avio_tell(s->pb) & 1;
367 
368  wav->smv_data_ofs = -1;
369 
370  /* read chunk ID */
371  tag = avio_rl32(pb);
372  switch (tag) {
373  case MKTAG('R', 'I', 'F', 'F'):
374  break;
375  case MKTAG('R', 'I', 'F', 'X'):
376  wav->rifx = 1;
377  break;
378  case MKTAG('R', 'F', '6', '4'):
379  rf64 = 1;
380  break;
381  case MKTAG('B', 'W', '6', '4'):
382  bw64 = 1;
383  break;
384  default:
385  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
386  av_fourcc2str(tag));
387  return AVERROR_INVALIDDATA;
388  }
389 
390  /* read chunk size */
391  avio_rl32(pb);
392 
393  /* read format */
394  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
395  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
396  return AVERROR_INVALIDDATA;
397  }
398 
399  if (rf64 || bw64) {
400  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
401  return AVERROR_INVALIDDATA;
402  size = avio_rl32(pb);
403  if (size < 24)
404  return AVERROR_INVALIDDATA;
405  avio_rl64(pb); /* RIFF size */
406 
407  data_size = avio_rl64(pb);
408  sample_count = avio_rl64(pb);
409 
410  if (data_size < 0 || sample_count < 0) {
411  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
412  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
413  data_size, sample_count);
414  return AVERROR_INVALIDDATA;
415  }
416  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
417 
418  }
419 
420  /* Create the audio stream now so that its index is always zero */
421  st = avformat_new_stream(s, NULL);
422  if (!st)
423  return AVERROR(ENOMEM);
424 
425  for (;;) {
426  AVStream *vst;
427  size = next_tag(pb, &tag, wav->rifx);
428  next_tag_ofs = avio_tell(pb) + size + (size & 1);
429 
430  if (avio_feof(pb))
431  break;
432 
433  switch (tag) {
434  case MKTAG('f', 'm', 't', ' '):
435  /* only parse the first 'fmt ' tag found */
436  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
437  return ret;
438  } else if (got_fmt)
439  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
440 
441  got_fmt = 1;
442  break;
443  case MKTAG('X', 'M', 'A', '2'):
444  /* only parse the first 'XMA2' tag found */
445  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
446  return ret;
447  } else if (got_xma2)
448  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
449 
450  got_xma2 = 1;
451  break;
452  case MKTAG('d', 'a', 't', 'a'):
453  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
455  "found no 'fmt ' tag before the 'data' tag\n");
456  return AVERROR_INVALIDDATA;
457  }
458 
459  if (rf64 || bw64) {
460  wav->data_end = av_sat_add64(avio_tell(pb), data_size);
461  next_tag_ofs = wav->data_end + (data_size & 1);
462  } else if (size > 0 && size != 0xFFFFFFFF) {
463  data_size = size;
464  wav->data_end = avio_tell(pb) + size;
465  next_tag_ofs = wav->data_end + (size & 1);
466  } else {
467  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
468  "file may be invalid\n");
469  data_size = 0;
470  next_tag_ofs = wav->data_end = INT64_MAX;
471  }
472 
473  data_ofs = avio_tell(pb);
474 
475  /* don't look for footer metadata if we can't seek or if we don't
476  * know where the data tag ends
477  */
478  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
479  goto break_loop;
480  break;
481  case MKTAG('f', 'a', 'c', 't'):
482  if (!sample_count)
483  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
484  break;
485  case MKTAG('b', 'e', 'x', 't'):
486  if ((ret = wav_parse_bext_tag(s, size)) < 0)
487  return ret;
488  break;
489  case MKTAG('S','M','V','0'):
490  if (!got_fmt) {
491  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
492  return AVERROR_INVALIDDATA;
493  }
494  // SMV file, a wav file with video appended.
495  if (size != MKTAG('0','2','0','0')) {
496  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
497  goto break_loop;
498  }
499  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
500  wav->smv_given_first = 0;
501  vst = avformat_new_stream(s, NULL);
502  if (!vst)
503  return AVERROR(ENOMEM);
504  wav->vst = vst;
505  avio_r8(pb);
506  vst->id = 1;
509  vst->codecpar->width = avio_rl24(pb);
510  vst->codecpar->height = avio_rl24(pb);
511  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
512  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
513  return ret;
514  }
515  size = avio_rl24(pb);
516  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
517  avio_rl24(pb);
518  wav->smv_block_size = avio_rl24(pb);
519  if (!wav->smv_block_size)
520  return AVERROR_INVALIDDATA;
521  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
522  vst->duration = avio_rl24(pb);
523  avio_rl24(pb);
524  avio_rl24(pb);
525  wav->smv_frames_per_jpeg = avio_rl24(pb);
526  if (wav->smv_frames_per_jpeg > 65536) {
527  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
528  return AVERROR_INVALIDDATA;
529  }
531  goto break_loop;
532  case MKTAG('L', 'I', 'S', 'T'):
533  case MKTAG('l', 'i', 's', 't'):
534  if (size < 4) {
535  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
536  return AVERROR_INVALIDDATA;
537  }
538  switch (avio_rl32(pb)) {
539  case MKTAG('I', 'N', 'F', 'O'):
540  ff_read_riff_info(s, size - 4);
541  break;
542  case MKTAG('a', 'd', 't', 'l'):
543  if (s->nb_chapters > 0) {
544  while (avio_tell(pb) < next_tag_ofs &&
545  !avio_feof(pb)) {
546  char cue_label[512];
547  unsigned id, sub_size;
548 
549  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
550  break;
551 
552  sub_size = avio_rl32(pb);
553  if (sub_size < 5)
554  break;
555  id = avio_rl32(pb);
556  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
557  avio_skip(pb, avio_tell(pb) & 1);
558 
559  for (int i = 0; i < s->nb_chapters; i++) {
560  if (s->chapters[i]->id == id) {
561  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
562  break;
563  }
564  }
565  }
566  }
567  break;
568  }
569  break;
570  case MKTAG('I', 'D', '3', ' '):
571  case MKTAG('i', 'd', '3', ' '): {
572  ID3v2ExtraMeta *id3v2_extra_meta;
573  ff_id3v2_read(s, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta, 0);
574  if (id3v2_extra_meta) {
575  ff_id3v2_parse_apic(s, id3v2_extra_meta);
576  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
577  ff_id3v2_parse_priv(s, id3v2_extra_meta);
578  }
579  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
580  }
581  break;
582  case MKTAG('c', 'u', 'e', ' '):
583  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
584  AVRational tb = {1, st->codecpar->sample_rate};
585  unsigned nb_cues = avio_rl32(pb);
586 
587  if (size >= nb_cues * 24LL + 4LL) {
588  for (int i = 0; i < nb_cues; i++) {
589  unsigned offset, id = avio_rl32(pb);
590 
591  if (avio_feof(pb))
592  return AVERROR_INVALIDDATA;
593 
594  avio_skip(pb, 16);
595  offset = avio_rl32(pb);
596 
597  if (!avpriv_new_chapter(s, id, tb, offset, AV_NOPTS_VALUE, NULL))
598  return AVERROR(ENOMEM);
599  }
600  }
601  }
602  break;
603  }
604 
605  /* seek to next tag unless we know that we'll run into EOF */
606  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
607  wav_seek_tag(wav, pb, next_tag_ofs) < 0) {
608  break;
609  }
610  }
611 
612 break_loop:
613  if (!got_fmt && !got_xma2) {
614  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
615  return AVERROR_INVALIDDATA;
616  }
617 
618  if (data_ofs < 0) {
619  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
620  return AVERROR_INVALIDDATA;
621  }
622 
623  avio_seek(pb, data_ofs, SEEK_SET);
624 
625  if (data_size > (INT64_MAX>>3)) {
626  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
627  data_size = 0;
628  }
629 
630  if ( st->codecpar->bit_rate > 0 && data_size > 0
631  && st->codecpar->sample_rate > 0
632  && sample_count > 0 && st->codecpar->ch_layout.nb_channels > 1
633  && sample_count % st->codecpar->ch_layout.nb_channels == 0) {
634  if (fabs(8.0 * data_size * st->codecpar->ch_layout.nb_channels * st->codecpar->sample_rate /
635  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
636  sample_count /= st->codecpar->ch_layout.nb_channels;
637  }
638 
639  if (data_size > 0 && sample_count && st->codecpar->ch_layout.nb_channels &&
640  (data_size << 3) / sample_count / st->codecpar->ch_layout.nb_channels > st->codecpar->bits_per_coded_sample + 1) {
641  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
642  sample_count = 0;
643  }
644 
645  /* G.729 hack (for Ticket4577)
646  * FIXME: Come up with cleaner, more general solution */
647  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
648  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
649  sample_count = 0;
650  }
651 
652  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
653  if ( st->codecpar->ch_layout.nb_channels
654  && data_size
656  && wav->data_end <= avio_size(pb))
657  sample_count = (data_size << 3)
658  /
660 
661  if (sample_count)
662  st->duration = sample_count;
663 
666  st->codecpar->bits_per_coded_sample == 32 &&
667  st->codecpar->extradata_size == 2 &&
668  AV_RL16(st->codecpar->extradata) == 1) {
671  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
673  st->codecpar->bits_per_coded_sample == 24) {
675  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
677  st->codecpar->block_align = 2048;
678  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->ch_layout.nb_channels > 2 &&
679  st->codecpar->block_align < INT_MAX / st->codecpar->ch_layout.nb_channels) {
681  }
682 
683  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
685 
686  set_spdif(s, wav);
687  set_max_size(st, wav);
688 
689  return 0;
690 }
691 
692 /**
693  * Find chunk with w64 GUID by skipping over other chunks.
694  * @return the size of the found chunk
695  */
696 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
697 {
698  uint8_t guid[16];
699  int64_t size;
700 
701  while (!avio_feof(pb)) {
702  if (avio_read(pb, guid, 16) != 16)
703  break;
704  size = avio_rl64(pb);
705  if (size <= 24 || size > INT64_MAX - 8)
706  return AVERROR_INVALIDDATA;
707  if (!memcmp(guid, guid1, 16))
708  return size;
709  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
710  }
711  return AVERROR_EOF;
712 }
713 
714 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
715 {
716  int ret, size;
717  int64_t left;
718  WAVDemuxContext *wav = s->priv_data;
719  AVStream *st = s->streams[0];
720 
721  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
722  return ff_spdif_read_packet(s, pkt);
723 
724  if (wav->smv_data_ofs > 0) {
726  AVStream *vst = wav->vst;
727 smv_retry:
730 
732  /*We always return a video frame first to get the pixel format first*/
733  wav->smv_last_stream = wav->smv_given_first ?
735  audio_dts, st->time_base) > 0 : 0;
736  wav->smv_given_first = 1;
737  }
738  wav->smv_last_stream = !wav->smv_last_stream;
739  wav->smv_last_stream |= wav->audio_eof;
740  wav->smv_last_stream &= !wav->smv_eof;
741  if (wav->smv_last_stream) {
742  uint64_t old_pos = avio_tell(s->pb);
743  uint64_t new_pos = wav->smv_data_ofs +
744  wav->smv_block * (int64_t)wav->smv_block_size;
745  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
746  ret = AVERROR_EOF;
747  goto smv_out;
748  }
749  size = avio_rl24(s->pb);
750  if (size > wav->smv_block_size) {
751  ret = AVERROR_EOF;
752  goto smv_out;
753  }
754  ret = av_get_packet(s->pb, pkt, size);
755  if (ret < 0)
756  goto smv_out;
757  pkt->pos -= 3;
758  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
760  wav->smv_block++;
761 
762  pkt->stream_index = vst->index;
763 smv_out:
764  avio_seek(s->pb, old_pos, SEEK_SET);
765  if (ret == AVERROR_EOF) {
766  wav->smv_eof = 1;
767  goto smv_retry;
768  }
769  return ret;
770  }
771  }
772 
773  left = wav->data_end - avio_tell(s->pb);
774  if (wav->ignore_length)
775  left = INT_MAX;
776  if (left <= 0) {
777  if (CONFIG_W64_DEMUXER && wav->w64)
778  left = find_guid(s->pb, ff_w64_guid_data) - 24;
779  else
780  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
781  if (left < 0) {
782  wav->audio_eof = 1;
783  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
784  goto smv_retry;
785  return AVERROR_EOF;
786  }
787  if (INT64_MAX - left < avio_tell(s->pb))
788  return AVERROR_INVALIDDATA;
789  wav->data_end = avio_tell(s->pb) + left;
790  }
791 
792  size = wav->max_size;
793  if (st->codecpar->block_align > 1) {
794  if (size < st->codecpar->block_align)
795  size = st->codecpar->block_align;
796  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
797  }
798  size = FFMIN(size, left);
799  ret = av_get_packet(s->pb, pkt, size);
800  if (ret < 0)
801  return ret;
802  pkt->stream_index = 0;
803 
804  return ret;
805 }
806 
807 static int wav_read_seek(AVFormatContext *s,
808  int stream_index, int64_t timestamp, int flags)
809 {
810  WAVDemuxContext *wav = s->priv_data;
811  AVStream *ast = s->streams[0], *vst = wav->vst;
812  wav->smv_eof = 0;
813  wav->audio_eof = 0;
814 
815  if (stream_index != 0 && (!vst || stream_index != vst->index))
816  return AVERROR(EINVAL);
817  if (wav->smv_data_ofs > 0) {
818  int64_t smv_timestamp = timestamp;
819  if (stream_index == 0)
820  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
821  else
822  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
823  if (wav->smv_frames_per_jpeg > 0) {
824  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
825  }
826  }
827 
828  switch (ast->codecpar->codec_id) {
829  case AV_CODEC_ID_MP2:
830  case AV_CODEC_ID_MP3:
831  case AV_CODEC_ID_AC3:
832  case AV_CODEC_ID_DTS:
833  case AV_CODEC_ID_XMA2:
834  /* use generic seeking with dynamically generated indexes */
835  return -1;
836  default:
837  break;
838  }
839  return ff_pcm_read_seek(s, 0, timestamp, flags);
840 }
841 
/* AVClass for the WAV demuxer's private context; exposes demux_options. */
842 static const AVClass wav_demuxer_class = {
843  .class_name = "WAV demuxer",
844  .item_name = av_default_item_name,
845  .option = demux_options,
846  .version = LIBAVUTIL_VERSION_INT,
847 };
849  .p.name = "wav",
850  .p.long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
851  .p.flags = AVFMT_GENERIC_INDEX,
852  .p.codec_tag = ff_wav_codec_tags_list,
853  .p.priv_class = &wav_demuxer_class,
854  .priv_data_size = sizeof(WAVDemuxContext),
855  .read_probe = wav_probe,
856  .read_header = wav_read_header,
857  .read_packet = wav_read_packet,
858  .read_seek = wav_read_seek,
859 };
860 #endif /* CONFIG_WAV_DEMUXER */
861 
862 #if CONFIG_W64_DEMUXER
863 static int w64_probe(const AVProbeData *p)
864 {
865  if (p->buf_size <= 40)
866  return 0;
867  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
868  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
869  return AVPROBE_SCORE_MAX;
870  else
871  return 0;
872 }
873 
874 static int w64_read_header(AVFormatContext *s)
875 {
876  int64_t size, data_ofs = 0;
877  AVIOContext *pb = s->pb;
878  WAVDemuxContext *wav = s->priv_data;
879  AVStream *st;
880  uint8_t guid[16];
881  int ret = ffio_read_size(pb, guid, 16);
882 
883  if (ret < 0)
884  return ret;
885 
886  if (memcmp(guid, ff_w64_guid_riff, 16))
887  return AVERROR_INVALIDDATA;
888 
889  /* riff + wave + fmt + sizes */
890  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
891  return AVERROR_INVALIDDATA;
892 
893  ret = ffio_read_size(pb, guid, 16);
894  if (ret < 0)
895  return ret;
896  if (memcmp(guid, ff_w64_guid_wave, 16)) {
897  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
898  return AVERROR_INVALIDDATA;
899  }
900 
901  wav->w64 = 1;
902 
903  st = avformat_new_stream(s, NULL);
904  if (!st)
905  return AVERROR(ENOMEM);
906 
907  while (!avio_feof(pb)) {
908  if (avio_read(pb, guid, 16) != 16)
909  break;
910  size = avio_rl64(pb);
911  if (size <= 24 || INT64_MAX - size < avio_tell(pb)) {
912  if (data_ofs)
913  break;
914  return AVERROR_INVALIDDATA;
915  }
916 
917  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
918  /* subtract chunk header size - normal wav file doesn't count it */
919  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
920  if (ret < 0)
921  return ret;
922  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
923  if (st->codecpar->block_align &&
925  st->codecpar->bits_per_coded_sample < 128) {
926  int64_t block_align = st->codecpar->block_align;
927 
928  block_align = FFMAX(block_align,
929  ((st->codecpar->bits_per_coded_sample + 7LL) / 8) *
931  if (block_align > st->codecpar->block_align) {
932  av_log(s, AV_LOG_WARNING, "invalid block_align: %d, broken file.\n",
933  st->codecpar->block_align);
934  st->codecpar->block_align = block_align;
935  }
936  }
937  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
938  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
940 
941  samples = avio_rl64(pb);
942  if (samples > 0)
943  st->duration = samples;
944  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
945  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
946  wav->data_end = avio_tell(pb) + size - 24;
947 
948  data_ofs = avio_tell(pb);
949  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
950  break;
951 
952  avio_skip(pb, size - 24);
953  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
954  int64_t start, end, cur;
955  uint32_t count, chunk_size, i;
956  int64_t filesize = avio_size(s->pb);
957 
958  start = avio_tell(pb);
959  end = start + FFALIGN(size, INT64_C(8)) - 24;
960  count = avio_rl32(pb);
961 
962  for (i = 0; i < count; i++) {
963  char chunk_key[5], *value;
964 
965  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
966  break;
967 
968  chunk_key[4] = 0;
969  avio_read(pb, chunk_key, 4);
970  chunk_size = avio_rl32(pb);
971  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
972  return AVERROR_INVALIDDATA;
973 
974  value = av_malloc(chunk_size + 1);
975  if (!value)
976  return AVERROR(ENOMEM);
977 
978  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
979  if (ret < 0) {
980  av_free(value);
981  return ret;
982  }
983  avio_skip(pb, chunk_size - ret);
984 
985  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
986  }
987 
988  avio_skip(pb, end - avio_tell(pb));
989  } else {
990  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
991  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
992  }
993  }
994 
995  if (!data_ofs)
996  return AVERROR_EOF;
997 
998  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
1000 
1001  handle_stream_probing(st);
1003 
1004  avio_seek(pb, data_ofs, SEEK_SET);
1005 
1006  set_spdif(s, wav);
1007  set_max_size(st, wav);
1008 
1009  return 0;
1010 }
1011 
/* AVClass for the W64 demuxer's private context. */
1012 static const AVClass w64_demuxer_class = {
1013  .class_name = "W64 demuxer",
1014  .item_name = av_default_item_name,
/* NOTE(review): the embedded listing numbers jump from 1014 to 1016 here, so
 * an initializer (presumably .option) appears to have been lost in
 * extraction -- confirm upstream. */
1016  .version = LIBAVUTIL_VERSION_INT,
1017 };
1018 
/*
 * Demuxer definition for Sony Wave64. It has its own probe and header
 * callbacks and shares the packet and seek callbacks, the private context
 * type and the codec tag list with the WAV code in this file.
 */
1019 const FFInputFormat ff_w64_demuxer = {
1020  .p.name = "w64",
1021  .p.long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
1022  .p.flags = AVFMT_GENERIC_INDEX,
1023  .p.codec_tag = ff_wav_codec_tags_list,
1024  .p.priv_class = &w64_demuxer_class,
1025  .priv_data_size = sizeof(WAVDemuxContext),
1026  .flags_internal = FF_INFMT_FLAG_ID3V2_AUTO,
1027  .read_probe = w64_probe,
1028  .read_header = w64_read_header,
1029  .read_packet = wav_read_packet,
1030  .read_seek = wav_read_seek,
1031 };
1032 #endif /* CONFIG_W64_DEMUXER */
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: demux_utils.c:43
WAVDemuxContext
Definition: wavdec.c:51
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:338
flags
const SwsFlags flags[]
Definition: swscale.c:72
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:67
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:59
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:216
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:383
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:71
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:463
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:53
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:422
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:147
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const struct AVCodec *c)
Add a new stream to a media file.
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:56
audio_dts
static int64_t audio_dts
Definition: movenc.c:62
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:58
int64_t
long long int64_t
Definition: coverity.c:34
id3v2.h
FF_INFMT_FLAG_ID3V2_AUTO
#define FF_INFMT_FLAG_ID3V2_AUTO
Automatically parse ID3v2 metadata.
Definition: demux.h:45
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:64
internal.h
AVOption
AVOption.
Definition: opt.h:429
ff_id3v2_read
void ff_id3v2_read(AVFormatContext *s, const char *magic, ID3v2ExtraMeta **extra_meta, unsigned int max_search_size)
Read an ID3v2 tag, including supported extra metadata.
Definition: id3v2.c:1171
AVMetadataConv
Definition: metadata.h:34
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:613
mathematics.h
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:324
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:329
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:326
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:53
video_dts
static int64_t video_dts
Definition: movenc.c:62
WAVDemuxContext::w64
int w64
Definition: wavdec.c:54
ff_get_extradata
int ff_get_extradata(void *logctx, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: demux_utils.c:340
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:463
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:265
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: avformat.c:895
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
ff_wav_demuxer
const FFInputFormat ff_wav_demuxer
ffstream
static av_always_inline FFStream * ffstream(AVStream *st)
Definition: internal.h:362
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:151
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:494
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:479
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:73
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:461
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:804
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:717
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1224
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation functio...
Definition: dict.h:79
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:549
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:764
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:210
ID3v2ExtraMeta
Definition: id3v2.h:84
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_read_callback.c:42
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:109
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:539
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:549
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:201
AVCodecParameters::width
int width
The width of the video frame in pixels.
Definition: codec_par.h:143
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:460
AV_CHANNEL_ORDER_UNSPEC
@ AV_CHANNEL_ORDER_UNSPEC
Only the channel count is specified, without any further information about the channel order.
Definition: channel_layout.h:119
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:42
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:231
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:372
channels
channels
Definition: aptx.h:31
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:257
key
const char * key
Definition: hwcontext_opencl.c:189
if
if(ret)
Definition: filter_design.txt:179
FFStream::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:314
AVFormatContext
Format I/O context.
Definition: avformat.h:1264
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:768
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:76
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:784
NULL
#define NULL
Definition: coverity.c:32
ff_pcm_default_packet_size
int ff_pcm_default_packet_size(AVCodecParameters *par)
Definition: pcm.c:29
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:242
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1193
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:911
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:451
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
The channel layout and number of channels.
Definition: codec_par.h:207
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:461
AVCodecParameters::sample_rate
int sample_rate
The number of audio samples per second.
Definition: codec_par.h:213
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:75
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:60
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:454
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:733
AVIOContext
Bytestream IO Context.
Definition: avio.h:160
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:350
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
DEC
#define DEC
Definition: wavdec.c:72
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:261
FFStream
Definition: internal.h:128
i
#define i(width, name, range_min, range_max)
Definition: cbs_h264.c:63
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:122
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:61
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:464
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:869
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:268
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:247
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:637
FFInputFormat::p
AVInputFormat p
The public AVInputFormat.
Definition: demux.h:70
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:606
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1026
offset
it's the only field you need to keep assuming you have a context There is some magic you don't need to care about around this just let it vf offset
Definition: writing_filters.txt:86
read_header
static int read_header(FFV1Context *f, RangeCoder *c)
Definition: ffv1dec.c:501
version
version
Definition: libkvazaar.c:313
FFStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:311
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:189
filesize
static int64_t filesize(AVIOContext *pb)
Definition: ffmpeg_mux.c:51
set_max_size
static void set_max_size(AVStream *st, WAVDemuxContext *wav)
Definition: wavdec.c:82
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:68
log.h
av_malloc
#define av_malloc(s)
Definition: ops_asmgen.c:44
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: packet.h:588
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:725
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:62
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
The height of the video frame in pixels.
Definition: codec_par.h:150
AVCodecParameters::block_align
int block_align
The number of bytes per coded audio frame, required by some formats.
Definition: codec_par.h:221
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:57
value
it's the only field you need to keep assuming you have a context There is some magic you don't need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
demux.h
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:371
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
ff_get_wav_header
int ff_get_wav_header(AVFormatContext *s, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:95
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:98
av_uninit
#define av_uninit(x)
Definition: attributes.h:187
tag
uint32_t tag
Definition: movenc.c:2048
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:757
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:745
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:65
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:236
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:81
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:73
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:414
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
id
enum AVCodecID id
Definition: dts2pts.c:550
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
av_sat_add64
#define av_sat_add64
Definition: common.h:139
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:90
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:751
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:66
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:513
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:63
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Underlying C type is int.
Definition: opt.h:259
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:443
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:615
temp
else temp
Definition: vf_mcdeint.c:271
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
full parsing and repack with timestamp and position generation by parser for raw this assumes that ea...
Definition: avformat.h:594
OFFSET
#define OFFSET(x)
Definition: wavdec.c:71
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
Windows::Graphics::DirectX::Direct3D11::p
IDirect3DDxgiInterfaceAccess _COM_Outptr_ void ** p
Definition: vsrc_gfxcapture_winrt.hpp:53
AVPacket::stream_index
int stream_index
Definition: packet.h:597
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:321
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:200
read_probe
static int read_probe(const AVProbeData *p)
Definition: cdg.c:30
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:346
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the coded words.
Definition: codec_par.h:113
mem.h
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1549
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:540
FFStream::request_probe
int request_probe
stream probing state -1 -> probing finished 0 -> no probing requested rest -> perform probing with re...
Definition: internal.h:198
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:34
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:57
AVPacket
This structure stores compressed data.
Definition: packet.h:572
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Underlying C type is int.
Definition: opt.h:327
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:86
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1177
FFStream::cur_dts
int64_t cur_dts
Definition: internal.h:353
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:615
FFInputFormat
Definition: demux.h:66
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:741
int32_t
int32_t
Definition: audioconvert.c:56
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:99
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1289
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
MKTAG
#define MKTAG(a, b, c, d)
Definition: macros.h:55
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:665
pkt
static AVPacket * pkt
Definition: demux_decode.c:55
FF_SANE_NB_CHANNELS
#define FF_SANE_NB_CHANNELS
Definition: internal.h:37
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:55
ff_w64_demuxer
const FFInputFormat ff_w64_demuxer
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:105
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:347
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:237
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:349