FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/opt.h"
37 #include "avformat.h"
38 #include "avio.h"
39 #include "avio_internal.h"
40 #include "id3v2.h"
41 #include "internal.h"
42 #include "metadata.h"
43 #include "pcm.h"
44 #include "riff.h"
45 #include "w64.h"
46 #include "spdif.h"
47 
48 typedef struct WAVDemuxContext {
49  const AVClass *class;
50  int64_t data_end;
51  int w64;
53  int64_t smv_data_ofs;
56  int smv_block;
58  int smv_eof;
59  int audio_eof;
61  int max_size;
62  int spdif;
64  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
65  int rifx; // RIFX: integer byte order for parameters is big endian
67 
68 #define OFFSET(x) offsetof(WAVDemuxContext, x)
69 #define DEC AV_OPT_FLAG_DECODING_PARAM
70 static const AVOption demux_options[] = {
71 #define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
72 #if CONFIG_WAV_DEMUXER
73  { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
74 #endif
75  { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 4096 }, 1024, 1 << 22, DEC },
76  { NULL },
77 };
78 
/*
 * Check whether the audio payload of stream 0 is an S/PDIF (IEC 61937) stream.
 *
 * Only acts when S/PDIF demuxer support is configured and stream 0 has
 * codec_tag 1. Up to 64 KiB are read ahead and handed to ff_spdif_probe();
 * the read position is restored afterwards. A negative result from any
 * step is reported as a warning, never as an error.
 *
 * NOTE(review): the listing's own numbering skips line 79, so the function
 * header is not visible here. The callers pass (s, wav) and ignore the
 * result - confirm the exact signature against the upstream file.
 */
80 {
81  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
82  enum AVCodecID codec;
83  int len = 1<<16;
/* make sure the bytes read below can be rewound */
84  int ret = ffio_ensure_seekback(s->pb, len);
85 
86  if (ret >= 0) {
87  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
88  if (!buf) {
89  ret = AVERROR(ENOMEM);
90  } else {
91  int64_t pos = avio_tell(s->pb);
92  len = ret = avio_read(s->pb, buf, len);
93  if (len >= 0) {
94  ret = ff_spdif_probe(buf, len, &codec);
/* NOTE(review): listing line 95 is missing; the closing brace on line 98
 * implies a condition on the probe result guards the two assignments
 * below - confirm against the upstream file. */
96  s->streams[0]->codecpar->codec_id = codec;
97  wav->spdif = 1;
98  }
99  }
/* rewind to where the probe started and release the scratch buffer */
100  avio_seek(s->pb, pos, SEEK_SET);
101  av_free(buf);
102  }
103  }
104 
105  if (ret < 0)
106  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
107  }
108 }
109 
110 #if CONFIG_WAV_DEMUXER
111 
112 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
113 {
114  *tag = avio_rl32(pb);
115  if (!big_endian) {
116  return avio_rl32(pb);
117  } else {
118  return avio_rb32(pb);
119  }
120 }
121 
122 /* RIFF chunks are always at even offsets relative to where they start. */
123 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
124 {
125  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
126 
127  return avio_seek(s, offset, whence);
128 }
129 
130 /* return the size of the found tag */
131 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
132 {
133  unsigned int tag;
134  int64_t size;
135 
136  for (;;) {
137  if (avio_feof(pb))
138  return AVERROR_EOF;
139  size = next_tag(pb, &tag, wav->rifx);
140  if (tag == tag1)
141  break;
142  wav_seek_tag(wav, pb, size, SEEK_CUR);
143  }
144  return size;
145 }
146 
147 static int wav_probe(const AVProbeData *p)
148 {
149  /* check file header */
150  if (p->buf_size <= 32)
151  return 0;
152  if (!memcmp(p->buf + 8, "WAVE", 4)) {
153  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
154  /* Since the ACT demuxer has a standard WAV header at the top of
155  * its own, the returned score is decreased to avoid a probe
156  * conflict between ACT and WAV. */
157  return AVPROBE_SCORE_MAX - 1;
158  else if ((!memcmp(p->buf, "RF64", 4) ||
159  !memcmp(p->buf, "BW64", 4)) &&
160  !memcmp(p->buf + 12, "ds64", 4))
161  return AVPROBE_SCORE_MAX;
162  }
163  return 0;
164 }
165 
/*
 * Adjust the probing parameters of a stream; the visible part caps the
 * number of packets used for probing at 32.
 *
 * NOTE(review): the listing's own numbering skips lines 168 and 170. The
 * extra closing brace on line 172 implies the body is wrapped in a
 * condition that is not visible here - confirm against the upstream file.
 */
166 static void handle_stream_probing(AVStream *st)
167 {
169  FFStream *const sti = ffstream(st);
171  sti->probe_packets = FFMIN(sti->probe_packets, 32);
172  }
173 }
174 
/*
 * Parse a 'fmt ' chunk of the given size into st->codecpar and set the
 * stream time base to 1 / sample_rate.
 *
 * Returns 0 on success or the negative error from ff_get_wav_header().
 */
175 static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
176 {
177  AVIOContext *pb = s->pb;
178  WAVDemuxContext *wav = s->priv_data;
179  int ret;
180 
181  /* parse fmt header */
182  ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
183  if (ret < 0)
184  return ret;
185  handle_stream_probing(st);
186 
/* NOTE(review): listing line 187 is missing here - confirm against the
 * upstream file. */
188 
189  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
190 
191  return 0;
192 }
193 
/*
 * Parse an 'XMA2' chunk.
 *
 * The chunk must be at least 36 bytes, carry version 3 or 4, and have a size
 * of exactly 32 (+ 8 for version 4) + 4 bytes per stream. Sample rate and
 * duration are read as big-endian values, the channel count is the sum of
 * the per-stream channel bytes, and the whole chunk is finally stored as
 * extradata.
 *
 * Returns 0 on success, AVERROR_INVALIDDATA on a malformed chunk, or the
 * error from ff_get_extradata().
 */
194 static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
195 {
196  AVIOContext *pb = s->pb;
197  int version, num_streams, i, channels = 0, ret;
198 
199  if (size < 36)
200  return AVERROR_INVALIDDATA;
201 
/* NOTE(review): listing lines 201-204 are missing here - confirm against
 * the upstream file what is set up before the version byte is read. */
205 
206  version = avio_r8(pb);
207  if (version != 3 && version != 4)
208  return AVERROR_INVALIDDATA;
209  num_streams = avio_r8(pb);
210  if (size != (32 + ((version==3)?0:8) + 4*num_streams))
211  return AVERROR_INVALIDDATA;
212  avio_skip(pb, 10);
213  st->codecpar->sample_rate = avio_rb32(pb);
214  if (version == 4)
215  avio_skip(pb, 8);
216  avio_skip(pb, 4);
217  st->duration = avio_rb32(pb);
218  avio_skip(pb, 8);
219 
/* one 4-byte record per stream: channel count byte + 3 skipped bytes */
220  for (i = 0; i < num_streams; i++) {
221  channels += avio_r8(pb);
222  avio_skip(pb, 3);
223  }
224  st->codecpar->channels = channels;
225 
226  if (st->codecpar->channels <= 0 || st->codecpar->sample_rate <= 0)
227  return AVERROR_INVALIDDATA;
228 
229  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
230 
/* rewind to the start of the chunk payload and keep all of it as extradata */
231  avio_seek(pb, -size, SEEK_CUR);
232  if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
233  return ret;
234 
235  return 0;
236 }
237 
238 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
239  int length)
240 {
241  char temp[257];
242  int ret;
243 
244  av_assert0(length < sizeof(temp));
245  if ((ret = ffio_read_size(s->pb, temp, length)) < 0)
246  return ret;
247 
248  temp[length] = 0;
249 
250  if (strlen(temp))
251  return av_dict_set(&s->metadata, key, temp, 0);
252 
253  return 0;
254 }
255 
/*
 * Parse a 'bext' chunk of the given size and export its fields as metadata.
 *
 * The fixed part read here is 602 bytes: 256 + 32 + 32 + 10 + 8 bytes of
 * strings, an 8-byte time reference, a 2-byte version, and 254 further bytes
 * (a 64-byte UMID plus 190 skipped bytes when version >= 1, otherwise all
 * skipped). Anything beyond 602 bytes is read as the coding history string.
 *
 * Returns 0 on success or a negative error code.
 */
256 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
257 {
258  char temp[131], *coding_history;
259  int ret, x;
260  uint64_t time_reference;
261  int64_t umid_parts[8], umid_mask = 0;
262 
263  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
264  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
265  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
266  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
267  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
268  return ret;
269 
270  time_reference = avio_rl64(s->pb);
271  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
272  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
273  return ret;
274 
275  /* check if version is >= 1, in which case an UMID may be present */
276  if (avio_rl16(s->pb) >= 1) {
/* umid_mask stays 0 only if all 64 UMID bytes are zero */
277  for (x = 0; x < 8; x++)
278  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
279 
280  if (umid_mask) {
281  /* the string formatting below is per SMPTE 330M-2004 Annex C */
282  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
283  umid_parts[6] == 0 && umid_parts[7] == 0) {
284  /* basic UMID */
285  snprintf(temp, sizeof(temp),
286  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
287  umid_parts[0], umid_parts[1],
288  umid_parts[2], umid_parts[3]);
289  } else {
290  /* extended UMID */
291  snprintf(temp, sizeof(temp),
292  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
293  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
294  umid_parts[0], umid_parts[1],
295  umid_parts[2], umid_parts[3],
296  umid_parts[4], umid_parts[5],
297  umid_parts[6], umid_parts[7]);
298  }
299 
300  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
301  return ret;
302  }
303 
304  avio_skip(s->pb, 190);
305  } else
306  avio_skip(s->pb, 254);
307 
308  if (size > 602) {
309  /* CodingHistory present */
310  size -= 602;
311 
312  if (!(coding_history = av_malloc(size + 1)))
313  return AVERROR(ENOMEM);
314 
315  if ((ret = ffio_read_size(s->pb, coding_history, size)) < 0) {
316  av_free(coding_history);
317  return ret;
318  }
319 
320  coding_history[size] = 0;
321  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
/* NOTE(review): listing line 322 is missing; it must carry the remaining
 * av_dict_set() argument(s) and the end of the condition. Who owns
 * coding_history after this call depends on the flags given there -
 * confirm against the upstream file. */
323  return ret;
324  }
325 
326  return 0;
327 }
328 
329 static const AVMetadataConv wav_metadata_conv[] = {
330  { "description", "comment" },
331  { "originator", "encoded_by" },
332  { "origination_date", "date" },
333  { "origination_time", "creation_time" },
334  { 0 },
335 };
336 
337 /* wav input */
/*
 * Read the header of a RIFF / RIFX / RF64 / BW64 WAVE file.
 *
 * Validates the container magic and the "WAVE" form type, reads the ds64
 * chunk for RF64/BW64, creates the audio stream (always index 0) and then
 * walks the chunk list, handling 'fmt ', 'XMA2', 'data', 'fact', 'bext',
 * 'SMV0', 'LIST', 'ID3 ' and 'cue ' chunks. Afterwards the read position is
 * placed at the start of the audio data and the stream duration is derived
 * from the sample count where possible.
 *
 * Returns 0 on success or a negative AVERROR code.
 *
 * NOTE(review): the listing's own numbering has gaps inside this function
 * (lines 438, 489-490, 512, 579, 637, 646, 651-652, 656, 658, 666); each
 * gap is marked below and must be checked against the upstream file.
 */
338 static int wav_read_header(AVFormatContext *s)
339 {
340  int64_t size, av_uninit(data_size);
341  int64_t sample_count = 0;
342  int rf64 = 0, bw64 = 0;
343  uint32_t tag;
344  AVIOContext *pb = s->pb;
345  AVStream *st = NULL;
346  WAVDemuxContext *wav = s->priv_data;
347  int ret, got_fmt = 0, got_xma2 = 0;
348  int64_t next_tag_ofs, data_ofs = -1;
349 
/* remember whether the header itself starts on an odd offset */
350  wav->unaligned = avio_tell(s->pb) & 1;
351 
352  wav->smv_data_ofs = -1;
353 
354  /* read chunk ID */
355  tag = avio_rl32(pb);
356  switch (tag) {
357  case MKTAG('R', 'I', 'F', 'F'):
358  break;
359  case MKTAG('R', 'I', 'F', 'X'):
360  wav->rifx = 1;
361  break;
362  case MKTAG('R', 'F', '6', '4'):
363  rf64 = 1;
364  break;
365  case MKTAG('B', 'W', '6', '4'):
366  bw64 = 1;
367  break;
368  default:
369  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
370  av_fourcc2str(tag));
371  return AVERROR_INVALIDDATA;
372  }
373 
374  /* read chunk size */
375  avio_rl32(pb);
376 
377  /* read format */
378  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
379  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
380  return AVERROR_INVALIDDATA;
381  }
382 
/* RF64/BW64: 64-bit sizes come from a mandatory ds64 chunk of >= 24 bytes */
383  if (rf64 || bw64) {
384  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
385  return AVERROR_INVALIDDATA;
386  size = avio_rl32(pb);
387  if (size < 24)
388  return AVERROR_INVALIDDATA;
389  avio_rl64(pb); /* RIFF size */
390 
391  data_size = avio_rl64(pb);
392  sample_count = avio_rl64(pb);
393 
394  if (data_size < 0 || sample_count < 0) {
395  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
396  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
397  data_size, sample_count);
398  return AVERROR_INVALIDDATA;
399  }
400  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
401 
402  }
403 
404  /* Create the audio stream now so that its index is always zero */
405  st = avformat_new_stream(s, NULL);
406  if (!st)
407  return AVERROR(ENOMEM);
408 
/* chunk loop: next_tag_ofs is where the chunk after the current one starts */
409  for (;;) {
410  AVStream *vst;
411  size = next_tag(pb, &tag, wav->rifx);
412  next_tag_ofs = avio_tell(pb) + size;
413 
414  if (avio_feof(pb))
415  break;
416 
417  switch (tag) {
418  case MKTAG('f', 'm', 't', ' '):
419  /* only parse the first 'fmt ' tag found */
420  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
421  return ret;
422  } else if (got_fmt)
423  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
424 
425  got_fmt = 1;
426  break;
427  case MKTAG('X', 'M', 'A', '2'):
428  /* only parse the first 'XMA2' tag found */
429  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
430  return ret;
431  } else if (got_xma2)
432  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
433 
434  got_xma2 = 1;
435  break;
436  case MKTAG('d', 'a', 't', 'a'):
437  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
/* NOTE(review): listing line 438 is missing; the string below is the tail
 * of a call whose opening is not visible here. */
439  "found no 'fmt ' tag before the 'data' tag\n");
440  return AVERROR_INVALIDDATA;
441  }
442 
/* RF64/BW64 use the ds64 size; a 32-bit size of 0 or 0xFFFFFFFF means the
 * end of the data is unknown (data_end = INT64_MAX) */
443  if (rf64 || bw64) {
444  next_tag_ofs = wav->data_end = avio_tell(pb) + data_size;
445  } else if (size != 0xFFFFFFFF) {
446  data_size = size;
447  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
448  } else {
449  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
450  "file may be invalid\n");
451  data_size = 0;
452  next_tag_ofs = wav->data_end = INT64_MAX;
453  }
454 
455  data_ofs = avio_tell(pb);
456 
457  /* don't look for footer metadata if we can't seek or if we don't
458  * know where the data tag ends
459  */
460  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
461  goto break_loop;
462  break;
463  case MKTAG('f', 'a', 'c', 't'):
/* only used when no sample count is known yet (e.g. from ds64) */
464  if (!sample_count)
465  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
466  break;
467  case MKTAG('b', 'e', 'x', 't'):
468  if ((ret = wav_parse_bext_tag(s, size)) < 0)
469  return ret;
470  break;
471  case MKTAG('S','M','V','0'):
472  if (!got_fmt) {
473  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
474  return AVERROR_INVALIDDATA;
475  }
476  // SMV file, a wav file with video appended.
/* the field read as the chunk size holds the version string "0200" here */
477  if (size != MKTAG('0','2','0','0')) {
478  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
479  goto break_loop;
480  }
481  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
482  wav->smv_given_first = 0;
483  vst = avformat_new_stream(s, NULL);
484  if (!vst)
485  return AVERROR(ENOMEM);
486  wav->vst = vst;
487  avio_r8(pb);
488  vst->id = 1;
/* NOTE(review): listing lines 489-490 are missing here. */
491  vst->codecpar->width = avio_rl24(pb);
492  vst->codecpar->height = avio_rl24(pb);
493  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
494  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
495  return ret;
496  }
497  size = avio_rl24(pb);
498  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
499  avio_rl24(pb);
500  wav->smv_block_size = avio_rl24(pb);
501  if (!wav->smv_block_size)
502  return AVERROR_INVALIDDATA;
503  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
504  vst->duration = avio_rl24(pb);
505  avio_rl24(pb);
506  avio_rl24(pb);
507  wav->smv_frames_per_jpeg = avio_rl24(pb);
508  if (wav->smv_frames_per_jpeg > 65536) {
509  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
510  return AVERROR_INVALIDDATA;
511  }
/* NOTE(review): listing line 512 is missing here; the 4 bytes of extradata
 * allocated above are not written in the visible code. */
513  goto break_loop;
514  case MKTAG('L', 'I', 'S', 'T'):
515  case MKTAG('l', 'i', 's', 't'):
516  if (size < 4) {
517  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
518  return AVERROR_INVALIDDATA;
519  }
520  switch (avio_rl32(pb)) {
521  case MKTAG('I', 'N', 'F', 'O'):
522  ff_read_riff_info(s, size - 4);
523  break;
524  case MKTAG('a', 'd', 't', 'l'):
/* 'labl' sub-chunks give titles to chapters that already exist,
 * matched by id */
525  if (s->nb_chapters > 0) {
526  while (avio_tell(pb) < next_tag_ofs &&
527  !avio_feof(pb)) {
528  char cue_label[512];
529  unsigned id, sub_size;
530 
531  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
532  break;
533 
534  sub_size = avio_rl32(pb);
535  if (sub_size < 5)
536  break;
537  id = avio_rl32(pb);
538  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
539  avio_skip(pb, avio_tell(pb) & 1);
540 
541  for (int i = 0; i < s->nb_chapters; i++) {
542  if (s->chapters[i]->id == id) {
543  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
544  break;
545  }
546  }
547  }
548  }
549  break;
550  }
551  break;
552  case MKTAG('I', 'D', '3', ' '):
553  case MKTAG('i', 'd', '3', ' '): {
554  ID3v2ExtraMeta *id3v2_extra_meta;
555  ff_id3v2_read_dict(pb, &ffformatcontext(s)->id3v2_meta, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta);
556  if (id3v2_extra_meta) {
557  ff_id3v2_parse_apic(s, id3v2_extra_meta);
558  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
559  ff_id3v2_parse_priv(s, id3v2_extra_meta);
560  }
561  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
562  }
563  break;
564  case MKTAG('c', 'u', 'e', ' '):
/* needs a parsed 'fmt ' with a valid sample rate for the time base;
 * each cue record is 24 bytes after a 4-byte count */
565  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
566  AVRational tb = {1, st->codecpar->sample_rate};
567  unsigned nb_cues = avio_rl32(pb);
568 
569  if (size >= nb_cues * 24LL + 4LL) {
570  for (int i = 0; i < nb_cues; i++) {
571  unsigned offset, id = avio_rl32(pb);
572 
573  if (avio_feof(pb))
574  return AVERROR_INVALIDDATA;
575 
576  avio_skip(pb, 16);
577  offset = avio_rl32(pb);
578 
/* NOTE(review): listing line 579 is missing; it must hold the condition
 * for the ENOMEM return below (id, offset and tb are otherwise unused). */
580  return AVERROR(ENOMEM);
581  }
582  }
583  }
584  break;
585  }
586 
587  /* seek to next tag unless we know that we'll run into EOF */
588  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
589  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
590  break;
591  }
592  }
593 
594 break_loop:
595  if (!got_fmt && !got_xma2) {
596  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
597  return AVERROR_INVALIDDATA;
598  }
599 
600  if (data_ofs < 0) {
601  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
602  return AVERROR_INVALIDDATA;
603  }
604 
/* position the reader at the first byte of audio data */
605  avio_seek(pb, data_ofs, SEEK_SET);
606 
/* data_size is shifted left by 3 below; drop values that would overflow */
607  if (data_size > (INT64_MAX>>3)) {
608  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
609  data_size = 0;
610  }
611 
/* if the bit rate only fits when sample_count is divided by the channel
 * count (within 30%), treat sample_count as counting every channel */
612  if ( st->codecpar->bit_rate > 0 && data_size > 0
613  && st->codecpar->sample_rate > 0
614  && sample_count > 0 && st->codecpar->channels > 1
615  && sample_count % st->codecpar->channels == 0) {
616  if (fabs(8.0 * data_size * st->codecpar->channels * st->codecpar->sample_rate /
617  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
618  sample_count /= st->codecpar->channels;
619  }
620 
/* discard a sample_count that implies more bits per sample than coded */
621  if ( data_size > 0 && sample_count && st->codecpar->channels
622  && (data_size << 3) / sample_count / st->codecpar->channels > st->codecpar->bits_per_coded_sample + 1) {
623  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
624  sample_count = 0;
625  }
626 
627  /* G.729 hack (for Ticket4577)
628  * FIXME: Come up with cleaner, more general solution */
629  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
630  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
631  sample_count = 0;
632  }
633 
/* derive the sample count from the data size when none is known or the
 * codec has an exact bits-per-sample value */
634  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
635  if ( st->codecpar->channels
636  && data_size
/* NOTE(review): listing line 637 is missing from this condition. The
 * division below uses av_get_bits_per_sample() as a divisor, so a non-zero
 * check is presumably what belongs here - confirm. */
638  && wav->data_end <= avio_size(pb))
639  sample_count = (data_size << 3)
640  /
641  (st->codecpar->channels * (uint64_t)av_get_bits_per_sample(st->codecpar->codec_id));
642 
643  if (sample_count)
644  st->duration = sample_count;
645 
/* NOTE(review): listing lines 646, 651-652, 656 and 658 are missing from
 * the codec fix-up chain below: the opening `if`, the bodies of the first
 * two branches and part of the third condition are not visible. */
647  st->codecpar->block_align == st->codecpar->channels * 4 &&
648  st->codecpar->bits_per_coded_sample == 32 &&
649  st->codecpar->extradata_size == 2 &&
650  AV_RL16(st->codecpar->extradata) == 1) {
653  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
654  st->codecpar->block_align == st->codecpar->channels * 4 &&
655  st->codecpar->bits_per_coded_sample == 24) {
657  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
659  st->codecpar->block_align = 2048;
660  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->channels > 2 &&
661  st->codecpar->block_align < INT_MAX / st->codecpar->channels) {
/* the guard above keeps this multiplication from overflowing int */
662  st->codecpar->block_align *= st->codecpar->channels;
663  }
664 
665  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
/* NOTE(review): listing line 666 is missing here. */
667 
668  set_spdif(s, wav);
669 
670  return 0;
671 }
672 
673 /**
674  * Find chunk with w64 GUID by skipping over other chunks.
675  * @return the size of the found chunk
676  */
677 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
678 {
679  uint8_t guid[16];
680  int64_t size;
681 
682  while (!avio_feof(pb)) {
683  avio_read(pb, guid, 16);
684  size = avio_rl64(pb);
685  if (size <= 24 || size > INT64_MAX - 8)
686  return AVERROR_INVALIDDATA;
687  if (!memcmp(guid, guid1, 16))
688  return size;
689  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
690  }
691  return AVERROR_EOF;
692 }
693 
/*
 * Read the next packet.
 *
 * When the stream was detected as S/PDIF the work is delegated to
 * ff_spdif_read_packet(). For SMV files audio and video packets are
 * interleaved: smv_last_stream selects video (non-zero) or audio (zero) for
 * this call. Audio packets are at most max_size bytes, rounded to a multiple
 * of block_align, and never extend past the end of the current data chunk;
 * when that chunk is exhausted the next 'data' chunk (or w64 data GUID) is
 * searched for.
 *
 * Returns the result of av_get_packet() on success, AVERROR_EOF at the end
 * of the data, or another negative error code.
 *
 * NOTE(review): the listing's own numbering skips lines 708-709, 711, 714
 * and 735 inside the SMV branch; each gap is marked below.
 */
694 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
695 {
696  int ret, size;
697  int64_t left;
698  WAVDemuxContext *wav = s->priv_data;
699  AVStream *st = s->streams[0];
700 
701  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
702  return ff_spdif_read_packet(s, pkt);
703 
704  if (wav->smv_data_ofs > 0) {
705  int64_t audio_dts, video_dts;
706  AVStream *vst = wav->vst;
707 smv_retry:
/* NOTE(review): listing lines 708-709 and 711 are missing; audio_dts and
 * video_dts are never assigned in the visible code, and the closing brace
 * on line 717 belongs to a block opened on a missing line. */
710 
712  /*We always return a video frame first to get the pixel format first*/
713  wav->smv_last_stream = wav->smv_given_first ?
/* NOTE(review): listing line 714 is missing; it holds the start of the
 * call whose remaining arguments follow. */
715  audio_dts, st->time_base) > 0 : 0;
716  wav->smv_given_first = 1;
717  }
/* invert the choice, then force video once audio is exhausted and force
 * audio once video is exhausted */
718  wav->smv_last_stream = !wav->smv_last_stream;
719  wav->smv_last_stream |= wav->audio_eof;
720  wav->smv_last_stream &= !wav->smv_eof;
721  if (wav->smv_last_stream) {
/* video blocks are read out of line; the audio position is restored at
 * smv_out */
722  uint64_t old_pos = avio_tell(s->pb);
723  uint64_t new_pos = wav->smv_data_ofs +
724  wav->smv_block * (int64_t)wav->smv_block_size;
725  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
726  ret = AVERROR_EOF;
727  goto smv_out;
728  }
/* each block starts with a 24-bit length of the payload that follows */
729  size = avio_rl24(s->pb);
730  ret = av_get_packet(s->pb, pkt, size);
731  if (ret < 0)
732  goto smv_out;
/* let pkt->pos point at the 3-byte length prefix */
733  pkt->pos -= 3;
734  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
/* NOTE(review): listing line 735 is missing here. */
736  wav->smv_block++;
737 
738  pkt->stream_index = vst->index;
739 smv_out:
740  avio_seek(s->pb, old_pos, SEEK_SET);
741  if (ret == AVERROR_EOF) {
742  wav->smv_eof = 1;
743  goto smv_retry;
744  }
745  return ret;
746  }
747  }
748 
/* bytes remaining in the current data chunk */
749  left = wav->data_end - avio_tell(s->pb);
750  if (wav->ignore_length)
751  left = INT_MAX;
752  if (left <= 0) {
/* current chunk exhausted: look for a following data chunk */
753  if (CONFIG_W64_DEMUXER && wav->w64)
754  left = find_guid(s->pb, ff_w64_guid_data) - 24;
755  else
756  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
757  if (left < 0) {
758  wav->audio_eof = 1;
759  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
760  goto smv_retry;
761  return AVERROR_EOF;
762  }
763  wav->data_end = avio_tell(s->pb) + left;
764  }
765 
/* round the packet size down to a whole number of blocks, but never
 * below one block */
766  size = wav->max_size;
767  if (st->codecpar->block_align > 1) {
768  if (size < st->codecpar->block_align)
769  size = st->codecpar->block_align;
770  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
771  }
772  size = FFMIN(size, left);
773  ret = av_get_packet(s->pb, pkt, size);
774  if (ret < 0)
775  return ret;
776  pkt->stream_index = 0;
777 
778  return ret;
779 }
780 
781 static int wav_read_seek(AVFormatContext *s,
782  int stream_index, int64_t timestamp, int flags)
783 {
784  WAVDemuxContext *wav = s->priv_data;
785  AVStream *ast = s->streams[0], *vst = wav->vst;
786  wav->smv_eof = 0;
787  wav->audio_eof = 0;
788 
789  if (stream_index != 0 && (!vst || stream_index != vst->index))
790  return AVERROR(EINVAL);
791  if (wav->smv_data_ofs > 0) {
792  int64_t smv_timestamp = timestamp;
793  if (stream_index == 0)
794  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
795  else
796  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
797  if (wav->smv_frames_per_jpeg > 0) {
798  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
799  }
800  }
801 
802  switch (ast->codecpar->codec_id) {
803  case AV_CODEC_ID_MP2:
804  case AV_CODEC_ID_MP3:
805  case AV_CODEC_ID_AC3:
806  case AV_CODEC_ID_DTS:
807  case AV_CODEC_ID_XMA2:
808  /* use generic seeking with dynamically generated indexes */
809  return -1;
810  default:
811  break;
812  }
813  return ff_pcm_read_seek(s, 0, timestamp, flags);
814 }
815 
816 static const AVClass wav_demuxer_class = {
817  .class_name = "WAV demuxer",
818  .item_name = av_default_item_name,
819  .option = demux_options,
820  .version = LIBAVUTIL_VERSION_INT,
821 };
/*
 * Demuxer registration entry for "wav": wires the probe, header, packet and
 * seek callbacks defined above to the format name.
 *
 * NOTE(review): the listing's own numbering skips line 822 (the declarator
 * that opens this initializer) and line 830 (one initializer entry) -
 * confirm both against the upstream file.
 */
823  .name = "wav",
824  .long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
825  .priv_data_size = sizeof(WAVDemuxContext),
826  .read_probe = wav_probe,
827  .read_header = wav_read_header,
828  .read_packet = wav_read_packet,
829  .read_seek = wav_read_seek,
831  .codec_tag = ff_wav_codec_tags_list,
832  .priv_class = &wav_demuxer_class,
833 };
834 #endif /* CONFIG_WAV_DEMUXER */
835 
836 #if CONFIG_W64_DEMUXER
837 static int w64_probe(const AVProbeData *p)
838 {
839  if (p->buf_size <= 40)
840  return 0;
841  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
842  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
843  return AVPROBE_SCORE_MAX;
844  else
845  return 0;
846 }
847 
/*
 * Read the header of a Sony Wave64 file.
 *
 * Checks the RIFF and WAVE GUIDs, creates the audio stream and walks the
 * chunk list, handling the fmt, fact, data and summarylist GUIDs and
 * skipping anything else. Chunk sizes include the 24-byte chunk header
 * (16-byte GUID + 8-byte size) and chunks are padded to 8 bytes. On success
 * the read position is placed at the start of the audio data.
 *
 * Returns 0 on success, AVERROR_EOF if no data chunk was found, or another
 * negative error code.
 *
 * NOTE(review): the listing's own numbering skips lines 953 and 956 near
 * the end of the function; both gaps are marked below.
 */
848 static int w64_read_header(AVFormatContext *s)
849 {
850  int64_t size, data_ofs = 0;
851  AVIOContext *pb = s->pb;
852  WAVDemuxContext *wav = s->priv_data;
853  AVStream *st;
854  uint8_t guid[16];
855  int ret;
856 
857  avio_read(pb, guid, 16);
858  if (memcmp(guid, ff_w64_guid_riff, 16))
859  return AVERROR_INVALIDDATA;
860 
861  /* riff + wave + fmt + sizes */
862  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
863  return AVERROR_INVALIDDATA;
864 
865  avio_read(pb, guid, 16);
866  if (memcmp(guid, ff_w64_guid_wave, 16)) {
867  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
868  return AVERROR_INVALIDDATA;
869  }
870 
871  wav->w64 = 1;
872 
873  st = avformat_new_stream(s, NULL);
874  if (!st)
875  return AVERROR(ENOMEM);
876 
877  while (!avio_feof(pb)) {
878  if (avio_read(pb, guid, 16) != 16)
879  break;
880  size = avio_rl64(pb);
/* reject sizes not larger than the header and sizes that would overflow
 * when added to the current position */
881  if (size <= 24 || INT64_MAX - size < avio_tell(pb))
882  return AVERROR_INVALIDDATA;
883 
884  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
885  /* subtract chunk header size - normal wav file doesn't count it */
886  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
887  if (ret < 0)
888  return ret;
/* skip the padding up to the next 8-byte boundary */
889  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
890 
891  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
892  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
893  int64_t samples;
894 
895  samples = avio_rl64(pb);
896  if (samples > 0)
897  st->duration = samples;
/* 32 = 24-byte chunk header + the 8 bytes just read */
898  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
899  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
900  wav->data_end = avio_tell(pb) + size - 24;
901 
902  data_ofs = avio_tell(pb);
/* without seeking we cannot come back, so stop at the data */
903  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
904  break;
905 
906  avio_skip(pb, size - 24);
907  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
908  int64_t start, end, cur;
909  uint32_t count, chunk_size, i;
910  int64_t filesize = avio_size(s->pb);
911 
912  start = avio_tell(pb);
913  end = start + FFALIGN(size, INT64_C(8)) - 24;
914  count = avio_rl32(pb);
915 
/* each entry: 4-byte key, 32-bit length, then a UTF-16LE value */
916  for (i = 0; i < count; i++) {
917  char chunk_key[5], *value;
918 
919  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
920  break;
921 
922  chunk_key[4] = 0;
923  avio_read(pb, chunk_key, 4);
924  chunk_size = avio_rl32(pb);
/* UINT32_MAX would wrap the chunk_size + 1 allocation below */
925  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
926  return AVERROR_INVALIDDATA;
927 
928  value = av_malloc(chunk_size + 1);
929  if (!value)
930  return AVERROR(ENOMEM);
931 
932  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
933  if (ret < 0) {
934  av_free(value);
935  return ret;
936  }
937  avio_skip(pb, chunk_size - ret);
938 
/* AV_DICT_DONT_STRDUP_VAL: the dictionary takes ownership of value */
939  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
940  }
941 
942  avio_skip(pb, end - avio_tell(pb));
943  } else {
944  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
945  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
946  }
947  }
948 
/* data_ofs is still 0 when no data chunk was seen */
949  if (!data_ofs)
950  return AVERROR_EOF;
951 
952  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
/* NOTE(review): listing line 953 is missing here. */
954 
955  handle_stream_probing(st);
/* NOTE(review): listing line 956 is missing here. */
957 
958  avio_seek(pb, data_ofs, SEEK_SET);
959 
960  set_spdif(s, wav);
961 
962  return 0;
963 }
964 
/*
 * AVClass of the W64 demuxer.
 *
 * NOTE(review): the listing's own numbering skips line 968, so no .option
 * entry is visible here although wav_demuxer_class has one - confirm
 * against the upstream file.
 */
965 static const AVClass w64_demuxer_class = {
966  .class_name = "W64 demuxer",
967  .item_name = av_default_item_name,
969  .version = LIBAVUTIL_VERSION_INT,
970 };
971 
/*
 * Demuxer registration entry for "w64": uses the W64 probe and header
 * readers and shares the packet and seek callbacks with the WAV demuxer.
 *
 * NOTE(review): the listing's own numbering skips line 972 (the declarator
 * that opens this initializer) and line 980 (one initializer entry) -
 * confirm both against the upstream file.
 */
973  .name = "w64",
974  .long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
975  .priv_data_size = sizeof(WAVDemuxContext),
976  .read_probe = w64_probe,
977  .read_header = w64_read_header,
978  .read_packet = wav_read_packet,
979  .read_seek = wav_read_seek,
981  .codec_tag = ff_wav_codec_tags_list,
982  .priv_class = &w64_demuxer_class,
983 };
984 #endif /* CONFIG_W64_DEMUXER */
WAVDemuxContext
Definition: wavdec.c:48
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:314
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:64
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:56
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:359
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:74
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:426
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: utils.c:724
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:56
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:426
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:146
ff_get_extradata
int ff_get_extradata(AVFormatContext *s, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: utils.c:469
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
ffformatcontext
static av_always_inline FFFormatContext * ffformatcontext(AVFormatContext *s)
Definition: internal.h:186
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:53
audio_dts
int64_t audio_dts
Definition: movenc.c:61
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:55
id3v2.h
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:61
AVOption
AVOption.
Definition: opt.h:247
AVMetadataConv
Definition: metadata.h:34
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:391
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:449
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:338
sample_rate
sample_rate
Definition: ffmpeg_filter.c:156
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:50
video_dts
int64_t video_dts
Definition: movenc.c:61
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31
WAVDemuxContext::w64
int w64
Definition: wavdec.c:51
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:458
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:264
AVCodecParameters::channels
int channels
Audio only.
Definition: codec_par.h:166
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
ffstream
static av_always_inline FFStream * ffstream(AVStream *st)
Definition: internal.h:429
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:149
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:486
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:468
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:70
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:424
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:900
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:726
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1188
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation function.
Definition: dict.h:72
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:591
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:773
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
AVInputFormat
Definition: avformat.h:638
ID3v2ExtraMeta
Definition: id3v2.h:84
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:108
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:502
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:643
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:448
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:126
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:423
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:348
channels
channels
Definition: aptx.h:33
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
ff_w64_demuxer
const AVInputFormat ff_w64_demuxer
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:141
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:227
ff_wav_demuxer
const AVInputFormat ff_wav_demuxer
key
const char * key
Definition: hwcontext_opencl.c:168
if
if(ret)
Definition: filter_design.txt:179
FFStream::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:402
AVFormatContext
Format I/O context.
Definition: avformat.h:1109
internal.h
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1004
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:527
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:880
NULL
#define NULL
Definition: coverity.c:32
read_probe
static int read_probe(const AVProbeData *pd)
Definition: jvdec.c:55
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:235
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1157
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:920
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:446
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:456
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:170
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:47
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:78
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:57
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:502
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:742
AVIOContext
Bytestream IO Context.
Definition: avio.h:161
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:326
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:117
DEC
#define DEC
Definition: wavdec.c:69
id
enum AVCodecID id
Definition: extract_extradata_bsf.c:325
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:262
FFStream
Definition: internal.h:191
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:116
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:58
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:427
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:878
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:263
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:605
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:616
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1016
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:307
FFStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:399
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:173
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:65
log.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:271
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will be presented to the user.
Definition: packet.h:366
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:734
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:59
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:127
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:177
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:54
ff_id3v2_read_dict
void ff_id3v2_read_dict(AVIOContext *pb, AVDictionary **metadata, const char *magic, ID3v2ExtraMeta **extra_meta)
Read an ID3v2 tag into specified dictionary and retrieve supported extra metadata.
Definition: id3v2.c:1129
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
tb
#define tb
Definition: regdef.h:68
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:347
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
ff_get_wav_header
int ff_get_wav_header(AVFormatContext *s, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:90
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: utils.c:835
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:196
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1595
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:864
ret
ret
Definition: filter_design.txt:187
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_reading.c:42
AVStream
Stream structure.
Definition: avformat.h:857
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:62
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:246
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:71
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:56
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:412
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:79
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:858
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:63
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:476
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:60
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:40
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:224
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:625
temp
else temp
Definition: vf_mcdeint.c:248
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
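full parsing and repack with timestamp and position generation by parser for raw; this assumes that each packet in the file contains no demuxer level headers and just codec level data, otherwise position generation would fail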
Definition: avformat.h:784
OFFSET
#define OFFSET(x)
Definition: wavdec.c:68
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: utils.c:1146
AVPacket::stream_index
int stream_index
Definition: packet.h:375
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:333
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:322
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the coded words.
Definition: codec_par.h:102
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1535
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:503
FFStream::request_probe
int request_probe
stream probing state: -1 -> probing finished, 0 -> no probing requested, rest -> perform probing with request_probe being the minimum score to accept.
Definition: internal.h:288
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:34
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:60
AVPacket
This structure stores compressed data.
Definition: packet.h:350
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:241
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1141
FFStream::cur_dts
int64_t cur_dts
Definition: internal.h:426
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:393
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:750
int32_t
int32_t
Definition: audioconvert.c:56
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:561
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:89
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1253
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
MKTAG
#define MKTAG(a, b, c, d)
Definition: macros.h:55
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:674
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:52
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:104
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:348
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:451
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:360