FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config_components.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/opt.h"
37 #include "avformat.h"
38 #include "avio.h"
39 #include "avio_internal.h"
40 #include "demux.h"
41 #include "id3v2.h"
42 #include "internal.h"
43 #include "metadata.h"
44 #include "pcm.h"
45 #include "riff.h"
46 #include "w64.h"
47 #include "spdif.h"
48 
49 typedef struct WAVDemuxContext {
50  const AVClass *class;
51  int64_t data_end;
52  int w64;
54  int64_t smv_data_ofs;
57  int smv_block;
59  int smv_eof;
60  int audio_eof;
62  int max_size;
63  int spdif;
65  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
66  int rifx; // RIFX: integer byte order for parameters is big endian
68 
69 #define OFFSET(x) offsetof(WAVDemuxContext, x)
70 #define DEC AV_OPT_FLAG_DECODING_PARAM
71 static const AVOption demux_options[] = {
72 #define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
73 #if CONFIG_WAV_DEMUXER
74  { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
75 #endif
76  { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 4096 }, 1024, 1 << 22, DEC },
77  { NULL },
78 };
79 
81 {
82  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
83  enum AVCodecID codec;
84  int len = 1<<16;
85  int ret = ffio_ensure_seekback(s->pb, len);
86 
87  if (ret >= 0) {
88  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
89  if (!buf) {
90  ret = AVERROR(ENOMEM);
91  } else {
92  int64_t pos = avio_tell(s->pb);
93  len = ret = avio_read(s->pb, buf, len);
94  if (len >= 0) {
95  ret = ff_spdif_probe(buf, len, &codec);
97  s->streams[0]->codecpar->codec_id = codec;
98  wav->spdif = 1;
99  }
100  }
101  avio_seek(s->pb, pos, SEEK_SET);
102  av_free(buf);
103  }
104  }
105 
106  if (ret < 0)
107  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
108  }
109 }
110 
111 #if CONFIG_WAV_DEMUXER
112 
113 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
114 {
115  *tag = avio_rl32(pb);
116  if (!big_endian) {
117  return avio_rl32(pb);
118  } else {
119  return avio_rb32(pb);
120  }
121 }
122 
123 /* RIFF chunks are always at even offsets relative to where they start. */
124 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
125 {
126  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
127 
128  return avio_seek(s, offset, whence);
129 }
130 
131 /* return the size of the found tag */
132 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
133 {
134  unsigned int tag;
135  int64_t size;
136 
137  for (;;) {
138  if (avio_feof(pb))
139  return AVERROR_EOF;
140  size = next_tag(pb, &tag, wav->rifx);
141  if (tag == tag1)
142  break;
143  wav_seek_tag(wav, pb, size, SEEK_CUR);
144  }
145  return size;
146 }
147 
148 static int wav_probe(const AVProbeData *p)
149 {
150  /* check file header */
151  if (p->buf_size <= 32)
152  return 0;
153  if (!memcmp(p->buf + 8, "WAVE", 4)) {
154  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
155  /* Since the ACT demuxer has a standard WAV header at the top of
156  * its own, the returned score is decreased to avoid a probe
157  * conflict between ACT and WAV. */
158  return AVPROBE_SCORE_MAX - 1;
159  else if ((!memcmp(p->buf, "RF64", 4) ||
160  !memcmp(p->buf, "BW64", 4)) &&
161  !memcmp(p->buf + 12, "ds64", 4))
162  return AVPROBE_SCORE_MAX;
163  }
164  return 0;
165 }
166 
167 static void handle_stream_probing(AVStream *st)
168 {
170  FFStream *const sti = ffstream(st);
172  sti->probe_packets = FFMIN(sti->probe_packets, 32);
173  }
174 }
175 
176 static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
177 {
178  AVIOContext *pb = s->pb;
179  WAVDemuxContext *wav = s->priv_data;
180  int ret;
181 
182  /* parse fmt header */
183  ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
184  if (ret < 0)
185  return ret;
186  handle_stream_probing(st);
187 
189 
190  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
191 
192  return 0;
193 }
194 
195 static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
196 {
197  AVIOContext *pb = s->pb;
198  int version, num_streams, i, channels = 0, ret;
199 
200  if (size < 36)
201  return AVERROR_INVALIDDATA;
202 
206 
207  version = avio_r8(pb);
208  if (version != 3 && version != 4)
209  return AVERROR_INVALIDDATA;
210  num_streams = avio_r8(pb);
211  if (size != (32 + ((version==3)?0:8) + 4*num_streams))
212  return AVERROR_INVALIDDATA;
213  avio_skip(pb, 10);
214  st->codecpar->sample_rate = avio_rb32(pb);
215  if (version == 4)
216  avio_skip(pb, 8);
217  avio_skip(pb, 4);
218  st->duration = avio_rb32(pb);
219  avio_skip(pb, 8);
220 
221  for (i = 0; i < num_streams; i++) {
222  channels += avio_r8(pb);
223  avio_skip(pb, 3);
224  }
228 
229  if (st->codecpar->ch_layout.nb_channels <= 0 || st->codecpar->sample_rate <= 0)
230  return AVERROR_INVALIDDATA;
231 
232  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
233 
234  avio_seek(pb, -size, SEEK_CUR);
235  if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
236  return ret;
237 
238  return 0;
239 }
240 
241 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
242  int length)
243 {
244  char temp[257];
245  int ret;
246 
247  av_assert0(length < sizeof(temp));
248  if ((ret = ffio_read_size(s->pb, temp, length)) < 0)
249  return ret;
250 
251  temp[length] = 0;
252 
253  if (strlen(temp))
254  return av_dict_set(&s->metadata, key, temp, 0);
255 
256  return 0;
257 }
258 
259 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
260 {
261  char temp[131], *coding_history;
262  int ret, x;
263  uint64_t time_reference;
264  int64_t umid_parts[8], umid_mask = 0;
265 
266  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
267  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
268  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
269  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
270  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
271  return ret;
272 
273  time_reference = avio_rl64(s->pb);
274  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
275  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
276  return ret;
277 
278  /* check if version is >= 1, in which case an UMID may be present */
279  if (avio_rl16(s->pb) >= 1) {
280  for (x = 0; x < 8; x++)
281  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
282 
283  if (umid_mask) {
284  /* the string formatting below is per SMPTE 330M-2004 Annex C */
285  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
286  umid_parts[6] == 0 && umid_parts[7] == 0) {
287  /* basic UMID */
288  snprintf(temp, sizeof(temp),
289  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
290  umid_parts[0], umid_parts[1],
291  umid_parts[2], umid_parts[3]);
292  } else {
293  /* extended UMID */
294  snprintf(temp, sizeof(temp),
295  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
296  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
297  umid_parts[0], umid_parts[1],
298  umid_parts[2], umid_parts[3],
299  umid_parts[4], umid_parts[5],
300  umid_parts[6], umid_parts[7]);
301  }
302 
303  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
304  return ret;
305  }
306 
307  avio_skip(s->pb, 190);
308  } else
309  avio_skip(s->pb, 254);
310 
311  if (size > 602) {
312  /* CodingHistory present */
313  size -= 602;
314 
315  if (!(coding_history = av_malloc(size + 1)))
316  return AVERROR(ENOMEM);
317 
318  if ((ret = ffio_read_size(s->pb, coding_history, size)) < 0) {
319  av_free(coding_history);
320  return ret;
321  }
322 
323  coding_history[size] = 0;
324  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
326  return ret;
327  }
328 
329  return 0;
330 }
331 
332 static const AVMetadataConv wav_metadata_conv[] = {
333  { "description", "comment" },
334  { "originator", "encoded_by" },
335  { "origination_date", "date" },
336  { "origination_time", "creation_time" },
337  { 0 },
338 };
339 
340 /* wav input */
341 static int wav_read_header(AVFormatContext *s)
342 {
343  int64_t size, av_uninit(data_size);
344  int64_t sample_count = 0;
345  int rf64 = 0, bw64 = 0;
346  uint32_t tag;
347  AVIOContext *pb = s->pb;
348  AVStream *st = NULL;
349  WAVDemuxContext *wav = s->priv_data;
350  int ret, got_fmt = 0, got_xma2 = 0;
351  int64_t next_tag_ofs, data_ofs = -1;
352 
353  wav->unaligned = avio_tell(s->pb) & 1;
354 
355  wav->smv_data_ofs = -1;
356 
357  /* read chunk ID */
358  tag = avio_rl32(pb);
359  switch (tag) {
360  case MKTAG('R', 'I', 'F', 'F'):
361  break;
362  case MKTAG('R', 'I', 'F', 'X'):
363  wav->rifx = 1;
364  break;
365  case MKTAG('R', 'F', '6', '4'):
366  rf64 = 1;
367  break;
368  case MKTAG('B', 'W', '6', '4'):
369  bw64 = 1;
370  break;
371  default:
372  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
373  av_fourcc2str(tag));
374  return AVERROR_INVALIDDATA;
375  }
376 
377  /* read chunk size */
378  avio_rl32(pb);
379 
380  /* read format */
381  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
382  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
383  return AVERROR_INVALIDDATA;
384  }
385 
386  if (rf64 || bw64) {
387  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
388  return AVERROR_INVALIDDATA;
389  size = avio_rl32(pb);
390  if (size < 24)
391  return AVERROR_INVALIDDATA;
392  avio_rl64(pb); /* RIFF size */
393 
394  data_size = avio_rl64(pb);
395  sample_count = avio_rl64(pb);
396 
397  if (data_size < 0 || sample_count < 0) {
398  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
399  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
400  data_size, sample_count);
401  return AVERROR_INVALIDDATA;
402  }
403  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
404 
405  }
406 
407  /* Create the audio stream now so that its index is always zero */
408  st = avformat_new_stream(s, NULL);
409  if (!st)
410  return AVERROR(ENOMEM);
411 
412  for (;;) {
413  AVStream *vst;
414  size = next_tag(pb, &tag, wav->rifx);
415  next_tag_ofs = avio_tell(pb) + size;
416 
417  if (avio_feof(pb))
418  break;
419 
420  switch (tag) {
421  case MKTAG('f', 'm', 't', ' '):
422  /* only parse the first 'fmt ' tag found */
423  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
424  return ret;
425  } else if (got_fmt)
426  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
427 
428  got_fmt = 1;
429  break;
430  case MKTAG('X', 'M', 'A', '2'):
431  /* only parse the first 'XMA2' tag found */
432  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
433  return ret;
434  } else if (got_xma2)
435  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
436 
437  got_xma2 = 1;
438  break;
439  case MKTAG('d', 'a', 't', 'a'):
440  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
442  "found no 'fmt ' tag before the 'data' tag\n");
443  return AVERROR_INVALIDDATA;
444  }
445 
446  if (rf64 || bw64) {
447  next_tag_ofs = wav->data_end = avio_tell(pb) + data_size;
448  } else if (size != 0xFFFFFFFF) {
449  data_size = size;
450  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
451  } else {
452  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
453  "file may be invalid\n");
454  data_size = 0;
455  next_tag_ofs = wav->data_end = INT64_MAX;
456  }
457 
458  data_ofs = avio_tell(pb);
459 
460  /* don't look for footer metadata if we can't seek or if we don't
461  * know where the data tag ends
462  */
463  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
464  goto break_loop;
465  break;
466  case MKTAG('f', 'a', 'c', 't'):
467  if (!sample_count)
468  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
469  break;
470  case MKTAG('b', 'e', 'x', 't'):
471  if ((ret = wav_parse_bext_tag(s, size)) < 0)
472  return ret;
473  break;
474  case MKTAG('S','M','V','0'):
475  if (!got_fmt) {
476  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
477  return AVERROR_INVALIDDATA;
478  }
479  // SMV file, a wav file with video appended.
480  if (size != MKTAG('0','2','0','0')) {
481  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
482  goto break_loop;
483  }
484  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
485  wav->smv_given_first = 0;
486  vst = avformat_new_stream(s, NULL);
487  if (!vst)
488  return AVERROR(ENOMEM);
489  wav->vst = vst;
490  avio_r8(pb);
491  vst->id = 1;
494  vst->codecpar->width = avio_rl24(pb);
495  vst->codecpar->height = avio_rl24(pb);
496  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
497  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
498  return ret;
499  }
500  size = avio_rl24(pb);
501  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
502  avio_rl24(pb);
503  wav->smv_block_size = avio_rl24(pb);
504  if (!wav->smv_block_size)
505  return AVERROR_INVALIDDATA;
506  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
507  vst->duration = avio_rl24(pb);
508  avio_rl24(pb);
509  avio_rl24(pb);
510  wav->smv_frames_per_jpeg = avio_rl24(pb);
511  if (wav->smv_frames_per_jpeg > 65536) {
512  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
513  return AVERROR_INVALIDDATA;
514  }
516  goto break_loop;
517  case MKTAG('L', 'I', 'S', 'T'):
518  case MKTAG('l', 'i', 's', 't'):
519  if (size < 4) {
520  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
521  return AVERROR_INVALIDDATA;
522  }
523  switch (avio_rl32(pb)) {
524  case MKTAG('I', 'N', 'F', 'O'):
525  ff_read_riff_info(s, size - 4);
526  break;
527  case MKTAG('a', 'd', 't', 'l'):
528  if (s->nb_chapters > 0) {
529  while (avio_tell(pb) < next_tag_ofs &&
530  !avio_feof(pb)) {
531  char cue_label[512];
532  unsigned id, sub_size;
533 
534  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
535  break;
536 
537  sub_size = avio_rl32(pb);
538  if (sub_size < 5)
539  break;
540  id = avio_rl32(pb);
541  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
542  avio_skip(pb, avio_tell(pb) & 1);
543 
544  for (int i = 0; i < s->nb_chapters; i++) {
545  if (s->chapters[i]->id == id) {
546  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
547  break;
548  }
549  }
550  }
551  }
552  break;
553  }
554  break;
555  case MKTAG('I', 'D', '3', ' '):
556  case MKTAG('i', 'd', '3', ' '): {
557  ID3v2ExtraMeta *id3v2_extra_meta;
558  ff_id3v2_read_dict(pb, &ffformatcontext(s)->id3v2_meta, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta);
559  if (id3v2_extra_meta) {
560  ff_id3v2_parse_apic(s, id3v2_extra_meta);
561  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
562  ff_id3v2_parse_priv(s, id3v2_extra_meta);
563  }
564  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
565  }
566  break;
567  case MKTAG('c', 'u', 'e', ' '):
568  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
569  AVRational tb = {1, st->codecpar->sample_rate};
570  unsigned nb_cues = avio_rl32(pb);
571 
572  if (size >= nb_cues * 24LL + 4LL) {
573  for (int i = 0; i < nb_cues; i++) {
574  unsigned offset, id = avio_rl32(pb);
575 
576  if (avio_feof(pb))
577  return AVERROR_INVALIDDATA;
578 
579  avio_skip(pb, 16);
580  offset = avio_rl32(pb);
581 
583  return AVERROR(ENOMEM);
584  }
585  }
586  }
587  break;
588  }
589 
590  /* seek to next tag unless we know that we'll run into EOF */
591  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
592  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
593  break;
594  }
595  }
596 
597 break_loop:
598  if (!got_fmt && !got_xma2) {
599  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
600  return AVERROR_INVALIDDATA;
601  }
602 
603  if (data_ofs < 0) {
604  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
605  return AVERROR_INVALIDDATA;
606  }
607 
608  avio_seek(pb, data_ofs, SEEK_SET);
609 
610  if (data_size > (INT64_MAX>>3)) {
611  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
612  data_size = 0;
613  }
614 
615  if ( st->codecpar->bit_rate > 0 && data_size > 0
616  && st->codecpar->sample_rate > 0
617  && sample_count > 0 && st->codecpar->ch_layout.nb_channels > 1
618  && sample_count % st->codecpar->ch_layout.nb_channels == 0) {
619  if (fabs(8.0 * data_size * st->codecpar->ch_layout.nb_channels * st->codecpar->sample_rate /
620  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
621  sample_count /= st->codecpar->ch_layout.nb_channels;
622  }
623 
624  if (data_size > 0 && sample_count && st->codecpar->ch_layout.nb_channels &&
625  (data_size << 3) / sample_count / st->codecpar->ch_layout.nb_channels > st->codecpar->bits_per_coded_sample + 1) {
626  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
627  sample_count = 0;
628  }
629 
630  /* G.729 hack (for Ticket4577)
631  * FIXME: Come up with cleaner, more general solution */
632  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
633  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
634  sample_count = 0;
635  }
636 
637  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
638  if ( st->codecpar->ch_layout.nb_channels
639  && data_size
641  && wav->data_end <= avio_size(pb))
642  sample_count = (data_size << 3)
643  /
645 
646  if (sample_count)
647  st->duration = sample_count;
648 
651  st->codecpar->bits_per_coded_sample == 32 &&
652  st->codecpar->extradata_size == 2 &&
653  AV_RL16(st->codecpar->extradata) == 1) {
656  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
658  st->codecpar->bits_per_coded_sample == 24) {
660  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
662  st->codecpar->block_align = 2048;
663  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->ch_layout.nb_channels > 2 &&
664  st->codecpar->block_align < INT_MAX / st->codecpar->ch_layout.nb_channels) {
666  }
667 
668  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
670 
671  set_spdif(s, wav);
672 
673  return 0;
674 }
675 
676 /**
677  * Find chunk with w64 GUID by skipping over other chunks.
678  * @return the size of the found chunk
679  */
680 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
681 {
682  uint8_t guid[16];
683  int64_t size;
684 
685  while (!avio_feof(pb)) {
686  avio_read(pb, guid, 16);
687  size = avio_rl64(pb);
688  if (size <= 24 || size > INT64_MAX - 8)
689  return AVERROR_INVALIDDATA;
690  if (!memcmp(guid, guid1, 16))
691  return size;
692  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
693  }
694  return AVERROR_EOF;
695 }
696 
697 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
698 {
699  int ret, size;
700  int64_t left;
701  WAVDemuxContext *wav = s->priv_data;
702  AVStream *st = s->streams[0];
703 
704  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
705  return ff_spdif_read_packet(s, pkt);
706 
707  if (wav->smv_data_ofs > 0) {
708  int64_t audio_dts, video_dts;
709  AVStream *vst = wav->vst;
710 smv_retry:
713 
715  /*We always return a video frame first to get the pixel format first*/
716  wav->smv_last_stream = wav->smv_given_first ?
718  audio_dts, st->time_base) > 0 : 0;
719  wav->smv_given_first = 1;
720  }
721  wav->smv_last_stream = !wav->smv_last_stream;
722  wav->smv_last_stream |= wav->audio_eof;
723  wav->smv_last_stream &= !wav->smv_eof;
724  if (wav->smv_last_stream) {
725  uint64_t old_pos = avio_tell(s->pb);
726  uint64_t new_pos = wav->smv_data_ofs +
727  wav->smv_block * (int64_t)wav->smv_block_size;
728  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
729  ret = AVERROR_EOF;
730  goto smv_out;
731  }
732  size = avio_rl24(s->pb);
733  ret = av_get_packet(s->pb, pkt, size);
734  if (ret < 0)
735  goto smv_out;
736  pkt->pos -= 3;
737  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
739  wav->smv_block++;
740 
741  pkt->stream_index = vst->index;
742 smv_out:
743  avio_seek(s->pb, old_pos, SEEK_SET);
744  if (ret == AVERROR_EOF) {
745  wav->smv_eof = 1;
746  goto smv_retry;
747  }
748  return ret;
749  }
750  }
751 
752  left = wav->data_end - avio_tell(s->pb);
753  if (wav->ignore_length)
754  left = INT_MAX;
755  if (left <= 0) {
756  if (CONFIG_W64_DEMUXER && wav->w64)
757  left = find_guid(s->pb, ff_w64_guid_data) - 24;
758  else
759  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
760  if (left < 0) {
761  wav->audio_eof = 1;
762  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
763  goto smv_retry;
764  return AVERROR_EOF;
765  }
766  wav->data_end = avio_tell(s->pb) + left;
767  }
768 
769  size = wav->max_size;
770  if (st->codecpar->block_align > 1) {
771  if (size < st->codecpar->block_align)
772  size = st->codecpar->block_align;
773  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
774  }
775  size = FFMIN(size, left);
776  ret = av_get_packet(s->pb, pkt, size);
777  if (ret < 0)
778  return ret;
779  pkt->stream_index = 0;
780 
781  return ret;
782 }
783 
784 static int wav_read_seek(AVFormatContext *s,
785  int stream_index, int64_t timestamp, int flags)
786 {
787  WAVDemuxContext *wav = s->priv_data;
788  AVStream *ast = s->streams[0], *vst = wav->vst;
789  wav->smv_eof = 0;
790  wav->audio_eof = 0;
791 
792  if (stream_index != 0 && (!vst || stream_index != vst->index))
793  return AVERROR(EINVAL);
794  if (wav->smv_data_ofs > 0) {
795  int64_t smv_timestamp = timestamp;
796  if (stream_index == 0)
797  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
798  else
799  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
800  if (wav->smv_frames_per_jpeg > 0) {
801  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
802  }
803  }
804 
805  switch (ast->codecpar->codec_id) {
806  case AV_CODEC_ID_MP2:
807  case AV_CODEC_ID_MP3:
808  case AV_CODEC_ID_AC3:
809  case AV_CODEC_ID_DTS:
810  case AV_CODEC_ID_XMA2:
811  /* use generic seeking with dynamically generated indexes */
812  return -1;
813  default:
814  break;
815  }
816  return ff_pcm_read_seek(s, 0, timestamp, flags);
817 }
818 
819 static const AVClass wav_demuxer_class = {
820  .class_name = "WAV demuxer",
821  .item_name = av_default_item_name,
822  .option = demux_options,
823  .version = LIBAVUTIL_VERSION_INT,
824 };
826  .name = "wav",
827  .long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
828  .priv_data_size = sizeof(WAVDemuxContext),
829  .read_probe = wav_probe,
830  .read_header = wav_read_header,
831  .read_packet = wav_read_packet,
832  .read_seek = wav_read_seek,
834  .codec_tag = ff_wav_codec_tags_list,
835  .priv_class = &wav_demuxer_class,
836 };
837 #endif /* CONFIG_WAV_DEMUXER */
838 
839 #if CONFIG_W64_DEMUXER
840 static int w64_probe(const AVProbeData *p)
841 {
842  if (p->buf_size <= 40)
843  return 0;
844  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
845  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
846  return AVPROBE_SCORE_MAX;
847  else
848  return 0;
849 }
850 
851 static int w64_read_header(AVFormatContext *s)
852 {
853  int64_t size, data_ofs = 0;
854  AVIOContext *pb = s->pb;
855  WAVDemuxContext *wav = s->priv_data;
856  AVStream *st;
857  uint8_t guid[16];
858  int ret;
859 
860  avio_read(pb, guid, 16);
861  if (memcmp(guid, ff_w64_guid_riff, 16))
862  return AVERROR_INVALIDDATA;
863 
864  /* riff + wave + fmt + sizes */
865  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
866  return AVERROR_INVALIDDATA;
867 
868  avio_read(pb, guid, 16);
869  if (memcmp(guid, ff_w64_guid_wave, 16)) {
870  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
871  return AVERROR_INVALIDDATA;
872  }
873 
874  wav->w64 = 1;
875 
876  st = avformat_new_stream(s, NULL);
877  if (!st)
878  return AVERROR(ENOMEM);
879 
880  while (!avio_feof(pb)) {
881  if (avio_read(pb, guid, 16) != 16)
882  break;
883  size = avio_rl64(pb);
884  if (size <= 24 || INT64_MAX - size < avio_tell(pb))
885  return AVERROR_INVALIDDATA;
886 
887  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
888  /* subtract chunk header size - normal wav file doesn't count it */
889  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
890  if (ret < 0)
891  return ret;
892  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
893 
894  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
895  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
896  int64_t samples;
897 
898  samples = avio_rl64(pb);
899  if (samples > 0)
900  st->duration = samples;
901  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
902  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
903  wav->data_end = avio_tell(pb) + size - 24;
904 
905  data_ofs = avio_tell(pb);
906  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
907  break;
908 
909  avio_skip(pb, size - 24);
910  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
911  int64_t start, end, cur;
912  uint32_t count, chunk_size, i;
913  int64_t filesize = avio_size(s->pb);
914 
915  start = avio_tell(pb);
916  end = start + FFALIGN(size, INT64_C(8)) - 24;
917  count = avio_rl32(pb);
918 
919  for (i = 0; i < count; i++) {
920  char chunk_key[5], *value;
921 
922  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
923  break;
924 
925  chunk_key[4] = 0;
926  avio_read(pb, chunk_key, 4);
927  chunk_size = avio_rl32(pb);
928  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
929  return AVERROR_INVALIDDATA;
930 
931  value = av_malloc(chunk_size + 1);
932  if (!value)
933  return AVERROR(ENOMEM);
934 
935  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
936  if (ret < 0) {
937  av_free(value);
938  return ret;
939  }
940  avio_skip(pb, chunk_size - ret);
941 
942  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
943  }
944 
945  avio_skip(pb, end - avio_tell(pb));
946  } else {
947  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
948  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
949  }
950  }
951 
952  if (!data_ofs)
953  return AVERROR_EOF;
954 
955  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
957 
958  handle_stream_probing(st);
960 
961  avio_seek(pb, data_ofs, SEEK_SET);
962 
963  set_spdif(s, wav);
964 
965  return 0;
966 }
967 
968 static const AVClass w64_demuxer_class = {
969  .class_name = "W64 demuxer",
970  .item_name = av_default_item_name,
972  .version = LIBAVUTIL_VERSION_INT,
973 };
974 
976  .name = "w64",
977  .long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
978  .priv_data_size = sizeof(WAVDemuxContext),
979  .read_probe = w64_probe,
980  .read_header = w64_read_header,
981  .read_packet = wav_read_packet,
982  .read_seek = wav_read_seek,
984  .codec_tag = ff_wav_codec_tags_list,
985  .priv_class = &w64_demuxer_class,
986 };
987 #endif /* CONFIG_W64_DEMUXER */
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: demux_utils.c:42
WAVDemuxContext
Definition: wavdec.c:49
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:318
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:65
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:57
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:363
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:75
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:430
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: options.c:237
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:57
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:426
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:147
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
ffformatcontext
static av_always_inline FFFormatContext * ffformatcontext(AVFormatContext *s)
Definition: internal.h:192
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:54
audio_dts
int64_t audio_dts
Definition: movenc.c:61
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:56
id3v2.h
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:62
AVOption
AVOption.
Definition: opt.h:251
AVMetadataConv
Definition: metadata.h:34
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:392
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:456
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:295
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:300
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:352
sample_rate
sample_rate
Definition: ffmpeg_filter.c:153
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:51
video_dts
int64_t video_dts
Definition: movenc.c:61
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:30
WAVDemuxContext::w64
int w64
Definition: wavdec.c:52
ff_get_extradata
int ff_get_extradata(void *logctx, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: demux_utils.c:355
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:465
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:264
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: avformat.c:697
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
ffstream
static av_always_inline FFStream * ffstream(AVStream *st)
Definition: internal.h:407
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:151
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:505
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:482
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:71
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:428
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:998
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:743
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1189
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation functio...
Definition: dict.h:72
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:586
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:790
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
AVInputFormat
Definition: avformat.h:656
ID3v2ExtraMeta
Definition: id3v2.h:84
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:108
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:256
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:506
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:661
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:455
AV_CHANNEL_ORDER_UNSPEC
@ AV_CHANNEL_ORDER_UNSPEC
Only the channel count is specified, without any further information about the channel order.
Definition: channel_layout.h:106
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:127
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:427
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:352
channels
channels
Definition: aptx.h:32
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
ff_w64_demuxer
const AVInputFormat ff_w64_demuxer
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:235
ff_wav_demuxer
const AVInputFormat ff_wav_demuxer
key
const char * key
Definition: hwcontext_opencl.c:174
if
if(ret)
Definition: filter_design.txt:179
FFStream::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:380
AVFormatContext
Format I/O context.
Definition: avformat.h:1213
internal.h
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1108
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:532
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:978
NULL
#define NULL
Definition: coverity.c:32
read_probe
static int read_probe(const AVProbeData *pd)
Definition: jvdec.c:55
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:237
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1158
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:937
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:453
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:212
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:463
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:177
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:630
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:47
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:79
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:58
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:495
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:759
AVIOContext
Bytestream IO Context.
Definition: avio.h:162
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:330
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:117
DEC
#define DEC
Definition: wavdec.c:70
id
enum AVCodecID id
Definition: extract_extradata_bsf.c:324
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:263
FFStream
Definition: internal.h:197
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:116
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:59
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:431
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:895
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:263
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:609
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:632
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1055
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:313
FFStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:377
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:173
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:66
log.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: packet.h:367
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:751
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:60
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:128
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:184
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:55
ff_id3v2_read_dict
void ff_id3v2_read_dict(AVIOContext *pb, AVDictionary **metadata, const char *magic, ID3v2ExtraMeta **extra_meta)
Read an ID3v2 tag into specified dictionary and retrieve supported extra metadata.
Definition: id3v2.c:1130
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
tb
#define tb
Definition: regdef.h:68
demux.h
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:351
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
ff_get_wav_header
int ff_get_wav_header(AVFormatContext *s, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:94
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:102
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1646
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:962
ret
ret
Definition: filter_design.txt:187
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_reading.c:42
AVStream
Stream structure.
Definition: avformat.h:948
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:63
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:260
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:71
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:56
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:412
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... ..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:80
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:956
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:64
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:480
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:61
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:225
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:641
temp
else temp
Definition: vf_mcdeint.c:248
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
full parsing and repack with timestamp and position generation by parser for raw this assumes that ea...
Definition: avformat.h:802
OFFSET
#define OFFSET(x)
Definition: wavdec.c:69
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
AVPacket::stream_index
int stream_index
Definition: packet.h:376
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:347
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:326
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the codedwords.
Definition: codec_par.h:103
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1535
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:507
FFStream::request_probe
int request_probe
stream probing state -1 -> probing finished 0 -> no probing requested rest -> perform probing with re...
Definition: internal.h:266
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:61
AVPacket
This structure stores compressed data.
Definition: packet.h:351
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:244
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1142
FFStream::cur_dts
int64_t cur_dts
Definition: internal.h:404
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:394
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:767
int32_t
int32_t
Definition: audioconvert.c:56
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:561
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:90
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1254
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
MKTAG
#define MKTAG(a, b, c, d)
Definition: macros.h:55
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:691
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:53
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:104
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:354
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:238
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:375