FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config_components.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/opt.h"
37 #include "libavcodec/internal.h"
38 #include "avformat.h"
39 #include "avio.h"
40 #include "avio_internal.h"
41 #include "demux.h"
42 #include "id3v2.h"
43 #include "internal.h"
44 #include "metadata.h"
45 #include "pcm.h"
46 #include "riff.h"
47 #include "w64.h"
48 #include "spdif.h"
49 
50 typedef struct WAVDemuxContext {
51  const AVClass *class;
52  int64_t data_end;
53  int w64;
55  int64_t smv_data_ofs;
58  int smv_block;
60  int smv_eof;
61  int audio_eof;
63  int max_size;
64  int spdif;
66  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
67  int rifx; // RIFX: integer byte order for parameters is big endian
69 
70 #define OFFSET(x) offsetof(WAVDemuxContext, x)
71 #define DEC AV_OPT_FLAG_DECODING_PARAM
72 static const AVOption demux_options[] = {
73 #define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
74 #if CONFIG_WAV_DEMUXER
75  { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
76 #endif
77  { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 4096 }, 1024, 1 << 22, DEC },
78  { NULL },
79 };
80 
82 {
83  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
84  enum AVCodecID codec;
85  int len = 1<<16;
86  int ret = ffio_ensure_seekback(s->pb, len);
87 
88  if (ret >= 0) {
89  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
90  if (!buf) {
91  ret = AVERROR(ENOMEM);
92  } else {
93  int64_t pos = avio_tell(s->pb);
94  len = ret = avio_read(s->pb, buf, len);
95  if (len >= 0) {
96  ret = ff_spdif_probe(buf, len, &codec);
98  s->streams[0]->codecpar->codec_id = codec;
99  wav->spdif = 1;
100  }
101  }
102  avio_seek(s->pb, pos, SEEK_SET);
103  av_free(buf);
104  }
105  }
106 
107  if (ret < 0)
108  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
109  }
110 }
111 
112 #if CONFIG_WAV_DEMUXER
113 
114 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
115 {
116  *tag = avio_rl32(pb);
117  if (!big_endian) {
118  return avio_rl32(pb);
119  } else {
120  return avio_rb32(pb);
121  }
122 }
123 
124 /* RIFF chunks are always at even offsets relative to where they start. */
125 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
126 {
127  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
128 
129  return avio_seek(s, offset, whence);
130 }
131 
132 /* return the size of the found tag */
133 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
134 {
135  unsigned int tag;
136  int64_t size;
137 
138  for (;;) {
139  if (avio_feof(pb))
140  return AVERROR_EOF;
141  size = next_tag(pb, &tag, wav->rifx);
142  if (tag == tag1)
143  break;
144  wav_seek_tag(wav, pb, size, SEEK_CUR);
145  }
146  return size;
147 }
148 
149 static int wav_probe(const AVProbeData *p)
150 {
151  /* check file header */
152  if (p->buf_size <= 32)
153  return 0;
154  if (!memcmp(p->buf + 8, "WAVE", 4)) {
155  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
156  /* Since the ACT demuxer has a standard WAV header at the top of
157  * its own, the returned score is decreased to avoid a probe
158  * conflict between ACT and WAV. */
159  return AVPROBE_SCORE_MAX - 1;
160  else if ((!memcmp(p->buf, "RF64", 4) ||
161  !memcmp(p->buf, "BW64", 4)) &&
162  !memcmp(p->buf + 12, "ds64", 4))
163  return AVPROBE_SCORE_MAX;
164  }
165  return 0;
166 }
167 
168 static void handle_stream_probing(AVStream *st)
169 {
171  FFStream *const sti = ffstream(st);
173  sti->probe_packets = FFMIN(sti->probe_packets, 32);
174  }
175 }
176 
177 static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
178 {
179  AVIOContext *pb = s->pb;
180  WAVDemuxContext *wav = s->priv_data;
181  int ret;
182 
183  /* parse fmt header */
184  ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
185  if (ret < 0)
186  return ret;
187  handle_stream_probing(st);
188 
190 
191  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
192 
193  return 0;
194 }
195 
196 static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
197 {
198  AVIOContext *pb = s->pb;
199  int version, num_streams, i, channels = 0, ret;
200 
201  if (size < 36)
202  return AVERROR_INVALIDDATA;
203 
207 
208  version = avio_r8(pb);
209  if (version != 3 && version != 4)
210  return AVERROR_INVALIDDATA;
211  num_streams = avio_r8(pb);
212  if (size != (32 + ((version==3)?0:8) + 4*num_streams))
213  return AVERROR_INVALIDDATA;
214  avio_skip(pb, 10);
215  st->codecpar->sample_rate = avio_rb32(pb);
216  if (version == 4)
217  avio_skip(pb, 8);
218  avio_skip(pb, 4);
219  st->duration = avio_rb32(pb);
220  avio_skip(pb, 8);
221 
222  for (i = 0; i < num_streams; i++) {
223  channels += avio_r8(pb);
224  avio_skip(pb, 3);
225  }
229 
230  if (st->codecpar->ch_layout.nb_channels <= 0 || st->codecpar->sample_rate <= 0)
231  return AVERROR_INVALIDDATA;
232 
233  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
234 
235  avio_seek(pb, -size, SEEK_CUR);
236  if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
237  return ret;
238 
239  return 0;
240 }
241 
242 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
243  int length)
244 {
245  char temp[257];
246  int ret;
247 
248  av_assert0(length < sizeof(temp));
249  if ((ret = ffio_read_size(s->pb, temp, length)) < 0)
250  return ret;
251 
252  temp[length] = 0;
253 
254  if (strlen(temp))
255  return av_dict_set(&s->metadata, key, temp, 0);
256 
257  return 0;
258 }
259 
260 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
261 {
262  char temp[131], *coding_history;
263  int ret, x;
264  uint64_t time_reference;
265  int64_t umid_parts[8], umid_mask = 0;
266 
267  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
268  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
269  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
270  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
271  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
272  return ret;
273 
274  time_reference = avio_rl64(s->pb);
275  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
276  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
277  return ret;
278 
279  /* check if version is >= 1, in which case an UMID may be present */
280  if (avio_rl16(s->pb) >= 1) {
281  for (x = 0; x < 8; x++)
282  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
283 
284  if (umid_mask) {
285  /* the string formatting below is per SMPTE 330M-2004 Annex C */
286  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
287  umid_parts[6] == 0 && umid_parts[7] == 0) {
288  /* basic UMID */
289  snprintf(temp, sizeof(temp),
290  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
291  umid_parts[0], umid_parts[1],
292  umid_parts[2], umid_parts[3]);
293  } else {
294  /* extended UMID */
295  snprintf(temp, sizeof(temp),
296  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
297  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
298  umid_parts[0], umid_parts[1],
299  umid_parts[2], umid_parts[3],
300  umid_parts[4], umid_parts[5],
301  umid_parts[6], umid_parts[7]);
302  }
303 
304  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
305  return ret;
306  }
307 
308  avio_skip(s->pb, 190);
309  } else
310  avio_skip(s->pb, 254);
311 
312  if (size > 602) {
313  /* CodingHistory present */
314  size -= 602;
315 
316  if (!(coding_history = av_malloc(size + 1)))
317  return AVERROR(ENOMEM);
318 
319  if ((ret = ffio_read_size(s->pb, coding_history, size)) < 0) {
320  av_free(coding_history);
321  return ret;
322  }
323 
324  coding_history[size] = 0;
325  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
327  return ret;
328  }
329 
330  return 0;
331 }
332 
333 static const AVMetadataConv wav_metadata_conv[] = {
334  { "description", "comment" },
335  { "originator", "encoded_by" },
336  { "origination_date", "date" },
337  { "origination_time", "creation_time" },
338  { 0 },
339 };
340 
341 /* wav input */
342 static int wav_read_header(AVFormatContext *s)
343 {
344  int64_t size, av_uninit(data_size);
345  int64_t sample_count = 0;
346  int rf64 = 0, bw64 = 0;
347  uint32_t tag;
348  AVIOContext *pb = s->pb;
349  AVStream *st = NULL;
350  WAVDemuxContext *wav = s->priv_data;
351  int ret, got_fmt = 0, got_xma2 = 0;
352  int64_t next_tag_ofs, data_ofs = -1;
353 
354  wav->unaligned = avio_tell(s->pb) & 1;
355 
356  wav->smv_data_ofs = -1;
357 
358  /* read chunk ID */
359  tag = avio_rl32(pb);
360  switch (tag) {
361  case MKTAG('R', 'I', 'F', 'F'):
362  break;
363  case MKTAG('R', 'I', 'F', 'X'):
364  wav->rifx = 1;
365  break;
366  case MKTAG('R', 'F', '6', '4'):
367  rf64 = 1;
368  break;
369  case MKTAG('B', 'W', '6', '4'):
370  bw64 = 1;
371  break;
372  default:
373  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
374  av_fourcc2str(tag));
375  return AVERROR_INVALIDDATA;
376  }
377 
378  /* read chunk size */
379  avio_rl32(pb);
380 
381  /* read format */
382  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
383  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
384  return AVERROR_INVALIDDATA;
385  }
386 
387  if (rf64 || bw64) {
388  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
389  return AVERROR_INVALIDDATA;
390  size = avio_rl32(pb);
391  if (size < 24)
392  return AVERROR_INVALIDDATA;
393  avio_rl64(pb); /* RIFF size */
394 
395  data_size = avio_rl64(pb);
396  sample_count = avio_rl64(pb);
397 
398  if (data_size < 0 || sample_count < 0) {
399  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
400  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
401  data_size, sample_count);
402  return AVERROR_INVALIDDATA;
403  }
404  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
405 
406  }
407 
408  /* Create the audio stream now so that its index is always zero */
409  st = avformat_new_stream(s, NULL);
410  if (!st)
411  return AVERROR(ENOMEM);
412 
413  for (;;) {
414  AVStream *vst;
415  size = next_tag(pb, &tag, wav->rifx);
416  next_tag_ofs = avio_tell(pb) + size;
417 
418  if (avio_feof(pb))
419  break;
420 
421  switch (tag) {
422  case MKTAG('f', 'm', 't', ' '):
423  /* only parse the first 'fmt ' tag found */
424  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
425  return ret;
426  } else if (got_fmt)
427  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
428 
429  got_fmt = 1;
430  break;
431  case MKTAG('X', 'M', 'A', '2'):
432  /* only parse the first 'XMA2' tag found */
433  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
434  return ret;
435  } else if (got_xma2)
436  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
437 
438  got_xma2 = 1;
439  break;
440  case MKTAG('d', 'a', 't', 'a'):
441  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
443  "found no 'fmt ' tag before the 'data' tag\n");
444  return AVERROR_INVALIDDATA;
445  }
446 
447  if (rf64 || bw64) {
448  next_tag_ofs = wav->data_end = av_sat_add64(avio_tell(pb), data_size);
449  } else if (size != 0xFFFFFFFF) {
450  data_size = size;
451  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
452  } else {
453  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
454  "file may be invalid\n");
455  data_size = 0;
456  next_tag_ofs = wav->data_end = INT64_MAX;
457  }
458 
459  data_ofs = avio_tell(pb);
460 
461  /* don't look for footer metadata if we can't seek or if we don't
462  * know where the data tag ends
463  */
464  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
465  goto break_loop;
466  break;
467  case MKTAG('f', 'a', 'c', 't'):
468  if (!sample_count)
469  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
470  break;
471  case MKTAG('b', 'e', 'x', 't'):
472  if ((ret = wav_parse_bext_tag(s, size)) < 0)
473  return ret;
474  break;
475  case MKTAG('S','M','V','0'):
476  if (!got_fmt) {
477  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
478  return AVERROR_INVALIDDATA;
479  }
480  // SMV file, a wav file with video appended.
481  if (size != MKTAG('0','2','0','0')) {
482  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
483  goto break_loop;
484  }
485  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
486  wav->smv_given_first = 0;
487  vst = avformat_new_stream(s, NULL);
488  if (!vst)
489  return AVERROR(ENOMEM);
490  wav->vst = vst;
491  avio_r8(pb);
492  vst->id = 1;
495  vst->codecpar->width = avio_rl24(pb);
496  vst->codecpar->height = avio_rl24(pb);
497  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
498  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
499  return ret;
500  }
501  size = avio_rl24(pb);
502  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
503  avio_rl24(pb);
504  wav->smv_block_size = avio_rl24(pb);
505  if (!wav->smv_block_size)
506  return AVERROR_INVALIDDATA;
507  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
508  vst->duration = avio_rl24(pb);
509  avio_rl24(pb);
510  avio_rl24(pb);
511  wav->smv_frames_per_jpeg = avio_rl24(pb);
512  if (wav->smv_frames_per_jpeg > 65536) {
513  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
514  return AVERROR_INVALIDDATA;
515  }
517  goto break_loop;
518  case MKTAG('L', 'I', 'S', 'T'):
519  case MKTAG('l', 'i', 's', 't'):
520  if (size < 4) {
521  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
522  return AVERROR_INVALIDDATA;
523  }
524  switch (avio_rl32(pb)) {
525  case MKTAG('I', 'N', 'F', 'O'):
526  ff_read_riff_info(s, size - 4);
527  break;
528  case MKTAG('a', 'd', 't', 'l'):
529  if (s->nb_chapters > 0) {
530  while (avio_tell(pb) < next_tag_ofs &&
531  !avio_feof(pb)) {
532  char cue_label[512];
533  unsigned id, sub_size;
534 
535  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
536  break;
537 
538  sub_size = avio_rl32(pb);
539  if (sub_size < 5)
540  break;
541  id = avio_rl32(pb);
542  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
543  avio_skip(pb, avio_tell(pb) & 1);
544 
545  for (int i = 0; i < s->nb_chapters; i++) {
546  if (s->chapters[i]->id == id) {
547  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
548  break;
549  }
550  }
551  }
552  }
553  break;
554  }
555  break;
556  case MKTAG('I', 'D', '3', ' '):
557  case MKTAG('i', 'd', '3', ' '): {
558  ID3v2ExtraMeta *id3v2_extra_meta;
559  ff_id3v2_read(s, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta, 0);
560  if (id3v2_extra_meta) {
561  ff_id3v2_parse_apic(s, id3v2_extra_meta);
562  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
563  ff_id3v2_parse_priv(s, id3v2_extra_meta);
564  }
565  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
566  }
567  break;
568  case MKTAG('c', 'u', 'e', ' '):
569  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
570  AVRational tb = {1, st->codecpar->sample_rate};
571  unsigned nb_cues = avio_rl32(pb);
572 
573  if (size >= nb_cues * 24LL + 4LL) {
574  for (int i = 0; i < nb_cues; i++) {
575  unsigned offset, id = avio_rl32(pb);
576 
577  if (avio_feof(pb))
578  return AVERROR_INVALIDDATA;
579 
580  avio_skip(pb, 16);
581  offset = avio_rl32(pb);
582 
584  return AVERROR(ENOMEM);
585  }
586  }
587  }
588  break;
589  }
590 
591  /* seek to next tag unless we know that we'll run into EOF */
592  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
593  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
594  break;
595  }
596  }
597 
598 break_loop:
599  if (!got_fmt && !got_xma2) {
600  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
601  return AVERROR_INVALIDDATA;
602  }
603 
604  if (data_ofs < 0) {
605  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
606  return AVERROR_INVALIDDATA;
607  }
608 
609  avio_seek(pb, data_ofs, SEEK_SET);
610 
611  if (data_size > (INT64_MAX>>3)) {
612  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
613  data_size = 0;
614  }
615 
616  if ( st->codecpar->bit_rate > 0 && data_size > 0
617  && st->codecpar->sample_rate > 0
618  && sample_count > 0 && st->codecpar->ch_layout.nb_channels > 1
619  && sample_count % st->codecpar->ch_layout.nb_channels == 0) {
620  if (fabs(8.0 * data_size * st->codecpar->ch_layout.nb_channels * st->codecpar->sample_rate /
621  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
622  sample_count /= st->codecpar->ch_layout.nb_channels;
623  }
624 
625  if (data_size > 0 && sample_count && st->codecpar->ch_layout.nb_channels &&
626  (data_size << 3) / sample_count / st->codecpar->ch_layout.nb_channels > st->codecpar->bits_per_coded_sample + 1) {
627  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
628  sample_count = 0;
629  }
630 
631  /* G.729 hack (for Ticket4577)
632  * FIXME: Come up with cleaner, more general solution */
633  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
634  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
635  sample_count = 0;
636  }
637 
638  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
639  if ( st->codecpar->ch_layout.nb_channels
640  && data_size
642  && wav->data_end <= avio_size(pb))
643  sample_count = (data_size << 3)
644  /
646 
647  if (sample_count)
648  st->duration = sample_count;
649 
652  st->codecpar->bits_per_coded_sample == 32 &&
653  st->codecpar->extradata_size == 2 &&
654  AV_RL16(st->codecpar->extradata) == 1) {
657  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
659  st->codecpar->bits_per_coded_sample == 24) {
661  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
663  st->codecpar->block_align = 2048;
664  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->ch_layout.nb_channels > 2 &&
665  st->codecpar->block_align < INT_MAX / st->codecpar->ch_layout.nb_channels) {
667  }
668 
669  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
671 
672  set_spdif(s, wav);
673 
674  return 0;
675 }
676 
677 /**
678  * Find chunk with w64 GUID by skipping over other chunks.
679  * @return the size of the found chunk
680  */
681 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
682 {
683  uint8_t guid[16];
684  int64_t size;
685 
686  while (!avio_feof(pb)) {
687  avio_read(pb, guid, 16);
688  size = avio_rl64(pb);
689  if (size <= 24 || size > INT64_MAX - 8)
690  return AVERROR_INVALIDDATA;
691  if (!memcmp(guid, guid1, 16))
692  return size;
693  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
694  }
695  return AVERROR_EOF;
696 }
697 
698 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
699 {
700  int ret, size;
701  int64_t left;
702  WAVDemuxContext *wav = s->priv_data;
703  AVStream *st = s->streams[0];
704 
705  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
706  return ff_spdif_read_packet(s, pkt);
707 
708  if (wav->smv_data_ofs > 0) {
709  int64_t audio_dts, video_dts;
710  AVStream *vst = wav->vst;
711 smv_retry:
714 
716  /*We always return a video frame first to get the pixel format first*/
717  wav->smv_last_stream = wav->smv_given_first ?
719  audio_dts, st->time_base) > 0 : 0;
720  wav->smv_given_first = 1;
721  }
722  wav->smv_last_stream = !wav->smv_last_stream;
723  wav->smv_last_stream |= wav->audio_eof;
724  wav->smv_last_stream &= !wav->smv_eof;
725  if (wav->smv_last_stream) {
726  uint64_t old_pos = avio_tell(s->pb);
727  uint64_t new_pos = wav->smv_data_ofs +
728  wav->smv_block * (int64_t)wav->smv_block_size;
729  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
730  ret = AVERROR_EOF;
731  goto smv_out;
732  }
733  size = avio_rl24(s->pb);
734  if (size > wav->smv_block_size) {
735  ret = AVERROR_EOF;
736  goto smv_out;
737  }
738  ret = av_get_packet(s->pb, pkt, size);
739  if (ret < 0)
740  goto smv_out;
741  pkt->pos -= 3;
742  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
744  wav->smv_block++;
745 
746  pkt->stream_index = vst->index;
747 smv_out:
748  avio_seek(s->pb, old_pos, SEEK_SET);
749  if (ret == AVERROR_EOF) {
750  wav->smv_eof = 1;
751  goto smv_retry;
752  }
753  return ret;
754  }
755  }
756 
757  left = wav->data_end - avio_tell(s->pb);
758  if (wav->ignore_length)
759  left = INT_MAX;
760  if (left <= 0) {
761  if (CONFIG_W64_DEMUXER && wav->w64)
762  left = find_guid(s->pb, ff_w64_guid_data) - 24;
763  else
764  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
765  if (left < 0) {
766  wav->audio_eof = 1;
767  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
768  goto smv_retry;
769  return AVERROR_EOF;
770  }
771  if (INT64_MAX - left < avio_tell(s->pb))
772  return AVERROR_INVALIDDATA;
773  wav->data_end = avio_tell(s->pb) + left;
774  }
775 
776  size = wav->max_size;
777  if (st->codecpar->block_align > 1) {
778  if (size < st->codecpar->block_align)
779  size = st->codecpar->block_align;
780  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
781  }
782  size = FFMIN(size, left);
783  ret = av_get_packet(s->pb, pkt, size);
784  if (ret < 0)
785  return ret;
786  pkt->stream_index = 0;
787 
788  return ret;
789 }
790 
791 static int wav_read_seek(AVFormatContext *s,
792  int stream_index, int64_t timestamp, int flags)
793 {
794  WAVDemuxContext *wav = s->priv_data;
795  AVStream *ast = s->streams[0], *vst = wav->vst;
796  wav->smv_eof = 0;
797  wav->audio_eof = 0;
798 
799  if (stream_index != 0 && (!vst || stream_index != vst->index))
800  return AVERROR(EINVAL);
801  if (wav->smv_data_ofs > 0) {
802  int64_t smv_timestamp = timestamp;
803  if (stream_index == 0)
804  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
805  else
806  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
807  if (wav->smv_frames_per_jpeg > 0) {
808  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
809  }
810  }
811 
812  switch (ast->codecpar->codec_id) {
813  case AV_CODEC_ID_MP2:
814  case AV_CODEC_ID_MP3:
815  case AV_CODEC_ID_AC3:
816  case AV_CODEC_ID_DTS:
817  case AV_CODEC_ID_XMA2:
818  /* use generic seeking with dynamically generated indexes */
819  return -1;
820  default:
821  break;
822  }
823  return ff_pcm_read_seek(s, 0, timestamp, flags);
824 }
825 
826 static const AVClass wav_demuxer_class = {
827  .class_name = "WAV demuxer",
828  .item_name = av_default_item_name,
829  .option = demux_options,
830  .version = LIBAVUTIL_VERSION_INT,
831 };
833  .name = "wav",
834  .long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
835  .priv_data_size = sizeof(WAVDemuxContext),
836  .read_probe = wav_probe,
837  .read_header = wav_read_header,
838  .read_packet = wav_read_packet,
839  .read_seek = wav_read_seek,
841  .codec_tag = ff_wav_codec_tags_list,
842  .priv_class = &wav_demuxer_class,
843 };
844 #endif /* CONFIG_WAV_DEMUXER */
845 
846 #if CONFIG_W64_DEMUXER
847 static int w64_probe(const AVProbeData *p)
848 {
849  if (p->buf_size <= 40)
850  return 0;
851  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
852  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
853  return AVPROBE_SCORE_MAX;
854  else
855  return 0;
856 }
857 
858 static int w64_read_header(AVFormatContext *s)
859 {
860  int64_t size, data_ofs = 0;
861  AVIOContext *pb = s->pb;
862  WAVDemuxContext *wav = s->priv_data;
863  AVStream *st;
864  uint8_t guid[16];
865  int ret;
866 
867  avio_read(pb, guid, 16);
868  if (memcmp(guid, ff_w64_guid_riff, 16))
869  return AVERROR_INVALIDDATA;
870 
871  /* riff + wave + fmt + sizes */
872  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
873  return AVERROR_INVALIDDATA;
874 
875  avio_read(pb, guid, 16);
876  if (memcmp(guid, ff_w64_guid_wave, 16)) {
877  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
878  return AVERROR_INVALIDDATA;
879  }
880 
881  wav->w64 = 1;
882 
883  st = avformat_new_stream(s, NULL);
884  if (!st)
885  return AVERROR(ENOMEM);
886 
887  while (!avio_feof(pb)) {
888  if (avio_read(pb, guid, 16) != 16)
889  break;
890  size = avio_rl64(pb);
891  if (size <= 24 || INT64_MAX - size < avio_tell(pb)) {
892  if (data_ofs)
893  break;
894  return AVERROR_INVALIDDATA;
895  }
896 
897  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
898  /* subtract chunk header size - normal wav file doesn't count it */
899  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
900  if (ret < 0)
901  return ret;
902  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
903  if (st->codecpar->block_align &&
905  st->codecpar->bits_per_coded_sample < 128) {
906  int block_align = st->codecpar->block_align;
907 
908  block_align = FFMAX(block_align,
909  ((st->codecpar->bits_per_coded_sample + 7) / 8) *
911  if (block_align > st->codecpar->block_align) {
912  av_log(s, AV_LOG_WARNING, "invalid block_align: %d, broken file.\n",
913  st->codecpar->block_align);
914  st->codecpar->block_align = block_align;
915  }
916  }
917  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
918  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
919  int64_t samples;
920 
921  samples = avio_rl64(pb);
922  if (samples > 0)
923  st->duration = samples;
924  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
925  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
926  wav->data_end = avio_tell(pb) + size - 24;
927 
928  data_ofs = avio_tell(pb);
929  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
930  break;
931 
932  avio_skip(pb, size - 24);
933  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
934  int64_t start, end, cur;
935  uint32_t count, chunk_size, i;
936  int64_t filesize = avio_size(s->pb);
937 
938  start = avio_tell(pb);
939  end = start + FFALIGN(size, INT64_C(8)) - 24;
940  count = avio_rl32(pb);
941 
942  for (i = 0; i < count; i++) {
943  char chunk_key[5], *value;
944 
945  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
946  break;
947 
948  chunk_key[4] = 0;
949  avio_read(pb, chunk_key, 4);
950  chunk_size = avio_rl32(pb);
951  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
952  return AVERROR_INVALIDDATA;
953 
954  value = av_malloc(chunk_size + 1);
955  if (!value)
956  return AVERROR(ENOMEM);
957 
958  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
959  if (ret < 0) {
960  av_free(value);
961  return ret;
962  }
963  avio_skip(pb, chunk_size - ret);
964 
965  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
966  }
967 
968  avio_skip(pb, end - avio_tell(pb));
969  } else {
970  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
971  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
972  }
973  }
974 
975  if (!data_ofs)
976  return AVERROR_EOF;
977 
978  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
980 
981  handle_stream_probing(st);
983 
984  avio_seek(pb, data_ofs, SEEK_SET);
985 
986  set_spdif(s, wav);
987 
988  return 0;
989 }
990 
991 static const AVClass w64_demuxer_class = {
992  .class_name = "W64 demuxer",
993  .item_name = av_default_item_name,
995  .version = LIBAVUTIL_VERSION_INT,
996 };
997 
999  .name = "w64",
1000  .long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
1001  .priv_data_size = sizeof(WAVDemuxContext),
1002  .read_probe = w64_probe,
1003  .read_header = w64_read_header,
1004  .read_packet = wav_read_packet,
1005  .read_seek = wav_read_seek,
1007  .codec_tag = ff_wav_codec_tags_list,
1008  .priv_class = &w64_demuxer_class,
1009 };
1010 #endif /* CONFIG_W64_DEMUXER */
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: demux_utils.c:42
WAVDemuxContext
Definition: wavdec.c:50
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:330
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:66
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:58
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:375
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:69
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:445
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:51
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:424
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:147
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const struct AVCodec *c)
Add a new stream to a media file.
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:55
audio_dts
int64_t audio_dts
Definition: movenc.c:61
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:57
id3v2.h
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:63
internal.h
AVOption
AVOption.
Definition: opt.h:251
ff_id3v2_read
void ff_id3v2_read(AVFormatContext *s, const char *magic, ID3v2ExtraMeta **extra_meta, unsigned int max_search_size)
Read an ID3v2 tag, including supported extra metadata.
Definition: id3v2.c:1139
AVMetadataConv
Definition: metadata.h:34
ff_get_wav_header
int ff_get_wav_header(void *logctx, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:94
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:509
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:455
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:312
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:317
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:370
sample_rate
sample_rate
Definition: ffmpeg_filter.c:368
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:52
video_dts
int64_t video_dts
Definition: movenc.c:61
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:30
WAVDemuxContext::w64
int w64
Definition: wavdec.c:53
ff_get_extradata
int ff_get_extradata(void *logctx, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: demux_utils.c:355
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:464
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:264
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: avformat.c:761
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
ffstream
static av_always_inline FFStream * ffstream(AVStream *st)
Definition: internal.h:420
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:151
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:513
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:481
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:72
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:443
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:900
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:761
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1192
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation functio...
Definition: dict.h:79
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:558
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:808
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
AVInputFormat
Definition: avformat.h:549
ID3v2ExtraMeta
Definition: id3v2.h:84
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_read_callback.c:41
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:109
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:521
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:554
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:454
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:121
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:442
AV_CHANNEL_ORDER_UNSPEC
@ AV_CHANNEL_ORDER_UNSPEC
Only the channel count is specified, without any further information about the channel order.
Definition: channel_layout.h:112
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:364
channels
channels
Definition: aptx.h:31
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
ff_w64_demuxer
const AVInputFormat ff_w64_demuxer
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:242
ff_wav_demuxer
const AVInputFormat ff_wav_demuxer
key
const char * key
Definition: hwcontext_opencl.c:174
if
if(ret)
Definition: filter_design.txt:179
FFStream::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:391
AVFormatContext
Format I/O context.
Definition: avformat.h:1115
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:864
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:550
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:880
NULL
#define NULL
Definition: coverity.c:32
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:237
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1161
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:955
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:452
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:206
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:462
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:171
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:73
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:59
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:465
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:777
AVIOContext
Bytestream IO Context.
Definition: avio.h:166
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:342
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:106
DEC
#define DEC
Definition: wavdec.c:71
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:271
FFStream
Definition: internal.h:199
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:121
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:60
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:446
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:913
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:267
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:620
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:650
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1071
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:321
FFStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:388
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:188
filesize
static int64_t filesize(AVIOContext *pb)
Definition: ffmpeg_mux.c:48
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:67
log.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: packet.h:484
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:769
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:61
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:122
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:178
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:56
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
tb
#define tb
Definition: regdef.h:68
demux.h
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:363
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:103
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1737
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:853
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:841
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:64
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:278
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:71
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:56
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:413
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... ..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
av_sat_add64
#define av_sat_add64
Definition: common.h:138
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:81
id
enum AVCodecID id
Definition: dts2pts_bsf.c:364
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:847
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:65
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:495
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:62
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:225
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:640
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:659
temp
else temp
Definition: vf_mcdeint.c:263
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
full parsing and repack with timestamp and position generation by parser for raw this assumes that ea...
Definition: avformat.h:695
OFFSET
#define OFFSET(x)
Definition: wavdec.c:70
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
AVPacket::stream_index
int stream_index
Definition: packet.h:493
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:365
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
read_probe
static int read_probe(const AVProbeData *p)
Definition: cdg.c:29
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:338
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the codedwords.
Definition: codec_par.h:97
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1545
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:522
FFStream::request_probe
int request_probe
stream probing state -1 -> probing finished 0 -> no probing requested rest -> perform probing with re...
Definition: internal.h:268
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:55
AVPacket
This structure stores compressed data.
Definition: packet.h:468
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:244
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:88
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1145
FFStream::cur_dts
int64_t cur_dts
Definition: internal.h:415
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:511
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:785
int32_t
int32_t
Definition: audioconvert.c:56
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:474
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:84
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1257
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
MKTAG
#define MKTAG(a, b, c, d)
Definition: macros.h:55
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:709
FF_SANE_NB_CHANNELS
#define FF_SANE_NB_CHANNELS
Definition: internal.h:40
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:54
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:105
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:358
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:239
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:393