FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/opt.h"
37 #include "avformat.h"
38 #include "avio.h"
39 #include "avio_internal.h"
40 #include "id3v2.h"
41 #include "internal.h"
42 #include "metadata.h"
43 #include "pcm.h"
44 #include "riff.h"
45 #include "w64.h"
46 #include "spdif.h"
47 
48 typedef struct WAVDemuxContext {
49  const AVClass *class;
50  int64_t data_end;
51  int w64;
53  int64_t smv_data_ofs;
56  int smv_block;
58  int smv_eof;
59  int audio_eof;
61  int max_size;
62  int spdif;
64  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
65  int rifx; // RIFX: integer byte order for parameters is big endian
67 
/* Byte offset of field x inside the demuxer's private context. */
#define OFFSET(x) offsetof(WAVDemuxContext, x)
/* Short alias for the flag given to every option in the table below. */
#define DEC AV_OPT_FLAG_DECODING_PARAM
/*
 * Private options of the demuxers in this file.
 *
 * The "ignore_length" entry is compiled in only when CONFIG_WAV_DEMUXER is
 * set; "max_size" is always present. The table ends with a NULL entry.
 */
static const AVOption demux_options[] = {
/* Evaluates to 1 when the WAV-only entry below is compiled in, 0 otherwise.
 * NOTE(review): presumably used as an index to skip that entry for the W64
 * demuxer - confirm against the W64 AVClass definition. */
#define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
#if CONFIG_WAV_DEMUXER
    /* boolean, default 0 */
    { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
#endif
    /* integer, default 4096, allowed range 1024 .. 1 << 22 */
    { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 4096 }, 1024, 1 << 22, DEC },
    { NULL },
};
78 
80 {
81  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
82  enum AVCodecID codec;
83  int len = 1<<16;
84  int ret = ffio_ensure_seekback(s->pb, len);
85 
86  if (ret >= 0) {
87  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
88  if (!buf) {
89  ret = AVERROR(ENOMEM);
90  } else {
91  int64_t pos = avio_tell(s->pb);
92  len = ret = avio_read(s->pb, buf, len);
93  if (len >= 0) {
94  ret = ff_spdif_probe(buf, len, &codec);
96  s->streams[0]->codecpar->codec_id = codec;
97  wav->spdif = 1;
98  }
99  }
100  avio_seek(s->pb, pos, SEEK_SET);
101  av_free(buf);
102  }
103  }
104 
105  if (ret < 0)
106  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
107  }
108 }
109 
110 #if CONFIG_WAV_DEMUXER
111 
112 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
113 {
114  *tag = avio_rl32(pb);
115  if (!big_endian) {
116  return avio_rl32(pb);
117  } else {
118  return avio_rb32(pb);
119  }
120 }
121 
122 /* RIFF chunks are always at even offsets relative to where they start. */
123 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
124 {
125  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
126 
127  return avio_seek(s, offset, whence);
128 }
129 
130 /* return the size of the found tag */
131 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
132 {
133  unsigned int tag;
134  int64_t size;
135 
136  for (;;) {
137  if (avio_feof(pb))
138  return AVERROR_EOF;
139  size = next_tag(pb, &tag, wav->rifx);
140  if (tag == tag1)
141  break;
142  wav_seek_tag(wav, pb, size, SEEK_CUR);
143  }
144  return size;
145 }
146 
147 static int wav_probe(const AVProbeData *p)
148 {
149  /* check file header */
150  if (p->buf_size <= 32)
151  return 0;
152  if (!memcmp(p->buf + 8, "WAVE", 4)) {
153  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
154  /* Since the ACT demuxer has a standard WAV header at the top of
155  * its own, the returned score is decreased to avoid a probe
156  * conflict between ACT and WAV. */
157  return AVPROBE_SCORE_MAX - 1;
158  else if ((!memcmp(p->buf, "RF64", 4) ||
159  !memcmp(p->buf, "BW64", 4)) &&
160  !memcmp(p->buf + 12, "ds64", 4))
161  return AVPROBE_SCORE_MAX;
162  }
163  return 0;
164 }
165 
166 static void handle_stream_probing(AVStream *st)
167 {
171  }
172 }
173 
/**
 * Parse a 'fmt ' chunk into the stream's codec parameters.
 *
 * @param s    demuxer context; the chunk payload is read from s->pb
 * @param size chunk size as read from the chunk header
 * @param st   stream whose codecpar and time base are filled in
 * @return 0 on success, otherwise the negative value returned by
 *         ff_get_wav_header()
 */
static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
{
    AVIOContext *pb = s->pb;
    WAVDemuxContext *wav = s->priv_data;
    int ret;

    /* parse fmt header; wav->rifx selects the byte order */
    ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
    if (ret < 0)
        return ret;
    handle_stream_probing(st);


    /* timestamps are counted in units of 1 / sample_rate */
    avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);

    return 0;
}
192 
/**
 * Parse an 'XMA2' chunk: validate its layout, extract sample rate,
 * duration and channel count, then store the whole chunk as extradata.
 *
 * @param s    demuxer context; the chunk payload is read from s->pb
 * @param size chunk size as read from the chunk header
 * @param st   stream to fill in
 * @return 0 on success, AVERROR_INVALIDDATA on a malformed chunk, or the
 *         negative value returned by ff_get_extradata()
 */
static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
{
    AVIOContext *pb = s->pb;
    int version, num_streams, i, channels = 0, ret;

    /* smallest accepted chunk: 32 fixed bytes plus one 4-byte stream entry */
    if (size < 36)
        return AVERROR_INVALIDDATA;

    version = avio_r8(pb);
    if (version != 3 && version != 4)
        return AVERROR_INVALIDDATA;
    num_streams = avio_r8(pb);
    /* 32 fixed bytes, 8 more for version 4, then 4 bytes per stream */
    if (size != (32 + ((version==3)?0:8) + 4*num_streams))
        return AVERROR_INVALIDDATA;
    avio_skip(pb, 10);
    st->codecpar->sample_rate = avio_rb32(pb);
    if (version == 4)
        avio_skip(pb, 8);
    avio_skip(pb, 4);
    st->duration = avio_rb32(pb);
    avio_skip(pb, 8);

    /* each stream entry: one byte channel count, three bytes skipped */
    for (i = 0; i < num_streams; i++) {
        channels += avio_r8(pb);
        avio_skip(pb, 3);
    }
    st->codecpar->channels = channels;

    if (st->codecpar->channels <= 0 || st->codecpar->sample_rate <= 0)
        return AVERROR_INVALIDDATA;

    avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);

    /* exactly size bytes were consumed above: rewind to the start of the
     * chunk payload and keep all of it as extradata */
    avio_seek(pb, -size, SEEK_CUR);
    if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
        return ret;

    return 0;
}
236 
237 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
238  int length)
239 {
240  char temp[257];
241  int ret;
242 
243  av_assert0(length < sizeof(temp));
244  if ((ret = avio_read(s->pb, temp, length)) != length)
245  return ret < 0 ? ret : AVERROR_INVALIDDATA;
246 
247  temp[length] = 0;
248 
249  if (strlen(temp))
250  return av_dict_set(&s->metadata, key, temp, 0);
251 
252  return 0;
253 }
254 
255 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
256 {
257  char temp[131], *coding_history;
258  int ret, x;
259  uint64_t time_reference;
260  int64_t umid_parts[8], umid_mask = 0;
261 
262  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
263  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
264  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
265  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
266  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
267  return ret;
268 
269  time_reference = avio_rl64(s->pb);
270  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
271  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
272  return ret;
273 
274  /* check if version is >= 1, in which case an UMID may be present */
275  if (avio_rl16(s->pb) >= 1) {
276  for (x = 0; x < 8; x++)
277  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
278 
279  if (umid_mask) {
280  /* the string formatting below is per SMPTE 330M-2004 Annex C */
281  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
282  umid_parts[6] == 0 && umid_parts[7] == 0) {
283  /* basic UMID */
284  snprintf(temp, sizeof(temp),
285  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
286  umid_parts[0], umid_parts[1],
287  umid_parts[2], umid_parts[3]);
288  } else {
289  /* extended UMID */
290  snprintf(temp, sizeof(temp),
291  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
292  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
293  umid_parts[0], umid_parts[1],
294  umid_parts[2], umid_parts[3],
295  umid_parts[4], umid_parts[5],
296  umid_parts[6], umid_parts[7]);
297  }
298 
299  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
300  return ret;
301  }
302 
303  avio_skip(s->pb, 190);
304  } else
305  avio_skip(s->pb, 254);
306 
307  if (size > 602) {
308  /* CodingHistory present */
309  size -= 602;
310 
311  if (!(coding_history = av_malloc(size + 1)))
312  return AVERROR(ENOMEM);
313 
314  if ((ret = avio_read(s->pb, coding_history, size)) != size) {
315  av_free(coding_history);
316  return ret < 0 ? ret : AVERROR_INVALIDDATA;
317  }
318 
319  coding_history[size] = 0;
320  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
322  return ret;
323  }
324 
325  return 0;
326 }
327 
/*
 * Metadata key conversion table handed to ff_metadata_conv_ctx() by the
 * header readers in this file. The left-hand keys are the names under which
 * the 'bext' parser stores its fields.
 * NOTE(review): presumably the right-hand column is the key each one is
 * renamed to - confirm against the AVMetadataConv definition.
 */
static const AVMetadataConv wav_metadata_conv[] = {
    { "description", "comment" },
    { "originator", "encoded_by" },
    { "origination_date", "date" },
    { "origination_time", "creation_time" },
    { 0 }, /* all-zero entry closes the table */
};
335 
336 /* wav input */
337 static int wav_read_header(AVFormatContext *s)
338 {
339  int64_t size, av_uninit(data_size);
340  int64_t sample_count = 0;
341  int rf64 = 0, bw64 = 0;
342  uint32_t tag;
343  AVIOContext *pb = s->pb;
344  AVStream *st = NULL;
345  WAVDemuxContext *wav = s->priv_data;
346  int ret, got_fmt = 0, got_xma2 = 0;
347  int64_t next_tag_ofs, data_ofs = -1;
348 
349  wav->unaligned = avio_tell(s->pb) & 1;
350 
351  wav->smv_data_ofs = -1;
352 
353  /* read chunk ID */
354  tag = avio_rl32(pb);
355  switch (tag) {
356  case MKTAG('R', 'I', 'F', 'F'):
357  break;
358  case MKTAG('R', 'I', 'F', 'X'):
359  wav->rifx = 1;
360  break;
361  case MKTAG('R', 'F', '6', '4'):
362  rf64 = 1;
363  break;
364  case MKTAG('B', 'W', '6', '4'):
365  bw64 = 1;
366  break;
367  default:
368  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
369  av_fourcc2str(tag));
370  return AVERROR_INVALIDDATA;
371  }
372 
373  /* read chunk size */
374  avio_rl32(pb);
375 
376  /* read format */
377  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
378  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
379  return AVERROR_INVALIDDATA;
380  }
381 
382  if (rf64 || bw64) {
383  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
384  return AVERROR_INVALIDDATA;
385  size = avio_rl32(pb);
386  if (size < 24)
387  return AVERROR_INVALIDDATA;
388  avio_rl64(pb); /* RIFF size */
389 
390  data_size = avio_rl64(pb);
391  sample_count = avio_rl64(pb);
392 
393  if (data_size < 0 || sample_count < 0) {
394  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
395  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
396  data_size, sample_count);
397  return AVERROR_INVALIDDATA;
398  }
399  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
400 
401  }
402 
403  /* Create the audio stream now so that its index is always zero */
404  st = avformat_new_stream(s, NULL);
405  if (!st)
406  return AVERROR(ENOMEM);
407 
408  for (;;) {
409  AVStream *vst;
410  size = next_tag(pb, &tag, wav->rifx);
411  next_tag_ofs = avio_tell(pb) + size;
412 
413  if (avio_feof(pb))
414  break;
415 
416  switch (tag) {
417  case MKTAG('f', 'm', 't', ' '):
418  /* only parse the first 'fmt ' tag found */
419  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
420  return ret;
421  } else if (got_fmt)
422  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
423 
424  got_fmt = 1;
425  break;
426  case MKTAG('X', 'M', 'A', '2'):
427  /* only parse the first 'XMA2' tag found */
428  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
429  return ret;
430  } else if (got_xma2)
431  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
432 
433  got_xma2 = 1;
434  break;
435  case MKTAG('d', 'a', 't', 'a'):
436  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
438  "found no 'fmt ' tag before the 'data' tag\n");
439  return AVERROR_INVALIDDATA;
440  }
441 
442  if (rf64 || bw64) {
443  next_tag_ofs = wav->data_end = avio_tell(pb) + data_size;
444  } else if (size != 0xFFFFFFFF) {
445  data_size = size;
446  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
447  } else {
448  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
449  "file may be invalid\n");
450  data_size = 0;
451  next_tag_ofs = wav->data_end = INT64_MAX;
452  }
453 
454  data_ofs = avio_tell(pb);
455 
456  /* don't look for footer metadata if we can't seek or if we don't
457  * know where the data tag ends
458  */
459  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
460  goto break_loop;
461  break;
462  case MKTAG('f', 'a', 'c', 't'):
463  if (!sample_count)
464  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
465  break;
466  case MKTAG('b', 'e', 'x', 't'):
467  if ((ret = wav_parse_bext_tag(s, size)) < 0)
468  return ret;
469  break;
470  case MKTAG('S','M','V','0'):
471  if (!got_fmt) {
472  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
473  return AVERROR_INVALIDDATA;
474  }
475  // SMV file, a wav file with video appended.
476  if (size != MKTAG('0','2','0','0')) {
477  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
478  goto break_loop;
479  }
480  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
481  wav->smv_given_first = 0;
482  vst = avformat_new_stream(s, NULL);
483  if (!vst)
484  return AVERROR(ENOMEM);
485  wav->vst = vst;
486  avio_r8(pb);
487  vst->id = 1;
490  vst->codecpar->width = avio_rl24(pb);
491  vst->codecpar->height = avio_rl24(pb);
492  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
493  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
494  return ret;
495  }
496  size = avio_rl24(pb);
497  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
498  avio_rl24(pb);
499  wav->smv_block_size = avio_rl24(pb);
500  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
501  vst->duration = avio_rl24(pb);
502  avio_rl24(pb);
503  avio_rl24(pb);
504  wav->smv_frames_per_jpeg = avio_rl24(pb);
505  if (wav->smv_frames_per_jpeg > 65536) {
506  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
507  return AVERROR_INVALIDDATA;
508  }
510  goto break_loop;
511  case MKTAG('L', 'I', 'S', 'T'):
512  case MKTAG('l', 'i', 's', 't'):
513  if (size < 4) {
514  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
515  return AVERROR_INVALIDDATA;
516  }
517  switch (avio_rl32(pb)) {
518  case MKTAG('I', 'N', 'F', 'O'):
519  ff_read_riff_info(s, size - 4);
520  break;
521  case MKTAG('a', 'd', 't', 'l'):
522  if (s->nb_chapters > 0) {
523  while (avio_tell(pb) < next_tag_ofs &&
524  !avio_feof(pb)) {
525  char cue_label[512];
526  unsigned id, sub_size;
527 
528  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
529  break;
530 
531  sub_size = avio_rl32(pb);
532  if (sub_size < 5)
533  break;
534  id = avio_rl32(pb);
535  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
536  avio_skip(pb, avio_tell(pb) & 1);
537 
538  for (int i = 0; i < s->nb_chapters; i++) {
539  if (s->chapters[i]->id == id) {
540  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
541  break;
542  }
543  }
544  }
545  }
546  break;
547  }
548  break;
549  case MKTAG('I', 'D', '3', ' '):
550  case MKTAG('i', 'd', '3', ' '): {
551  ID3v2ExtraMeta *id3v2_extra_meta;
552  ff_id3v2_read_dict(pb, &s->internal->id3v2_meta, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta);
553  if (id3v2_extra_meta) {
554  ff_id3v2_parse_apic(s, id3v2_extra_meta);
555  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
556  ff_id3v2_parse_priv(s, id3v2_extra_meta);
557  }
558  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
559  }
560  break;
561  case MKTAG('c', 'u', 'e', ' '):
562  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
563  AVRational tb = {1, st->codecpar->sample_rate};
564  unsigned nb_cues = avio_rl32(pb);
565 
566  if (size >= nb_cues * 24LL + 4LL) {
567  for (int i = 0; i < nb_cues; i++) {
568  unsigned offset, id = avio_rl32(pb);
569 
570  if (avio_feof(pb))
571  return AVERROR_INVALIDDATA;
572 
573  avio_skip(pb, 16);
574  offset = avio_rl32(pb);
575 
577  return AVERROR(ENOMEM);
578  }
579  }
580  }
581  break;
582  }
583 
584  /* seek to next tag unless we know that we'll run into EOF */
585  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
586  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
587  break;
588  }
589  }
590 
591 break_loop:
592  if (!got_fmt && !got_xma2) {
593  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
594  return AVERROR_INVALIDDATA;
595  }
596 
597  if (data_ofs < 0) {
598  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
599  return AVERROR_INVALIDDATA;
600  }
601 
602  avio_seek(pb, data_ofs, SEEK_SET);
603 
604  if (data_size > (INT64_MAX>>3)) {
605  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
606  data_size = 0;
607  }
608 
609  if ( st->codecpar->bit_rate > 0 && data_size > 0
610  && st->codecpar->sample_rate > 0
611  && sample_count > 0 && st->codecpar->channels > 1
612  && sample_count % st->codecpar->channels == 0) {
613  if (fabs(8.0 * data_size * st->codecpar->channels * st->codecpar->sample_rate /
614  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
615  sample_count /= st->codecpar->channels;
616  }
617 
618  if ( data_size > 0 && sample_count && st->codecpar->channels
619  && (data_size << 3) / sample_count / st->codecpar->channels > st->codecpar->bits_per_coded_sample + 1) {
620  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
621  sample_count = 0;
622  }
623 
624  /* G.729 hack (for Ticket4577)
625  * FIXME: Come up with cleaner, more general solution */
626  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
627  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
628  sample_count = 0;
629  }
630 
631  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
632  if ( st->codecpar->channels
633  && data_size
635  && wav->data_end <= avio_size(pb))
636  sample_count = (data_size << 3)
637  /
638  (st->codecpar->channels * (uint64_t)av_get_bits_per_sample(st->codecpar->codec_id));
639 
640  if (sample_count)
641  st->duration = sample_count;
642 
644  st->codecpar->block_align == st->codecpar->channels * 4 &&
645  st->codecpar->bits_per_coded_sample == 32 &&
646  st->codecpar->extradata_size == 2 &&
647  AV_RL16(st->codecpar->extradata) == 1) {
650  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
651  st->codecpar->block_align == st->codecpar->channels * 4 &&
652  st->codecpar->bits_per_coded_sample == 24) {
654  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
656  st->codecpar->block_align = 2048;
657  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->channels > 2 &&
658  st->codecpar->block_align < INT_MAX / st->codecpar->channels) {
659  st->codecpar->block_align *= st->codecpar->channels;
660  }
661 
662  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
664 
665  set_spdif(s, wav);
666 
667  return 0;
668 }
669 
670 /**
671  * Find chunk with w64 GUID by skipping over other chunks.
672  * @return the size of the found chunk
673  */
674 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
675 {
676  uint8_t guid[16];
677  int64_t size;
678 
679  while (!avio_feof(pb)) {
680  avio_read(pb, guid, 16);
681  size = avio_rl64(pb);
682  if (size <= 24 || size > INT64_MAX - 8)
683  return AVERROR_INVALIDDATA;
684  if (!memcmp(guid, guid1, 16))
685  return size;
686  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
687  }
688  return AVERROR_EOF;
689 }
690 
691 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
692 {
693  int ret, size;
694  int64_t left;
695  WAVDemuxContext *wav = s->priv_data;
696  AVStream *st = s->streams[0];
697 
698  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
699  return ff_spdif_read_packet(s, pkt);
700 
701  if (wav->smv_data_ofs > 0) {
702  int64_t audio_dts, video_dts;
703  AVStream *vst = wav->vst;
704 smv_retry:
707 
709  /*We always return a video frame first to get the pixel format first*/
710  wav->smv_last_stream = wav->smv_given_first ?
712  audio_dts, st->time_base) > 0 : 0;
713  wav->smv_given_first = 1;
714  }
715  wav->smv_last_stream = !wav->smv_last_stream;
716  wav->smv_last_stream |= wav->audio_eof;
717  wav->smv_last_stream &= !wav->smv_eof;
718  if (wav->smv_last_stream) {
719  uint64_t old_pos = avio_tell(s->pb);
720  uint64_t new_pos = wav->smv_data_ofs +
721  wav->smv_block * wav->smv_block_size;
722  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
723  ret = AVERROR_EOF;
724  goto smv_out;
725  }
726  size = avio_rl24(s->pb);
727  ret = av_get_packet(s->pb, pkt, size);
728  if (ret < 0)
729  goto smv_out;
730  pkt->pos -= 3;
731  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
733  wav->smv_block++;
734 
735  pkt->stream_index = vst->index;
736 smv_out:
737  avio_seek(s->pb, old_pos, SEEK_SET);
738  if (ret == AVERROR_EOF) {
739  wav->smv_eof = 1;
740  goto smv_retry;
741  }
742  return ret;
743  }
744  }
745 
746  left = wav->data_end - avio_tell(s->pb);
747  if (wav->ignore_length)
748  left = INT_MAX;
749  if (left <= 0) {
750  if (CONFIG_W64_DEMUXER && wav->w64)
751  left = find_guid(s->pb, ff_w64_guid_data) - 24;
752  else
753  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
754  if (left < 0) {
755  wav->audio_eof = 1;
756  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
757  goto smv_retry;
758  return AVERROR_EOF;
759  }
760  wav->data_end = avio_tell(s->pb) + left;
761  }
762 
763  size = wav->max_size;
764  if (st->codecpar->block_align > 1) {
765  if (size < st->codecpar->block_align)
766  size = st->codecpar->block_align;
767  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
768  }
769  size = FFMIN(size, left);
770  ret = av_get_packet(s->pb, pkt, size);
771  if (ret < 0)
772  return ret;
773  pkt->stream_index = 0;
774 
775  return ret;
776 }
777 
778 static int wav_read_seek(AVFormatContext *s,
779  int stream_index, int64_t timestamp, int flags)
780 {
781  WAVDemuxContext *wav = s->priv_data;
782  AVStream *ast = s->streams[0], *vst = wav->vst;
783  wav->smv_eof = 0;
784  wav->audio_eof = 0;
785 
786  if (stream_index != 0 && (!vst || stream_index != vst->index))
787  return AVERROR(EINVAL);
788  if (wav->smv_data_ofs > 0) {
789  int64_t smv_timestamp = timestamp;
790  if (stream_index == 0)
791  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
792  else
793  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
794  if (wav->smv_frames_per_jpeg > 0) {
795  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
796  }
797  }
798 
799  switch (ast->codecpar->codec_id) {
800  case AV_CODEC_ID_MP2:
801  case AV_CODEC_ID_MP3:
802  case AV_CODEC_ID_AC3:
803  case AV_CODEC_ID_DTS:
804  case AV_CODEC_ID_XMA2:
805  /* use generic seeking with dynamically generated indexes */
806  return -1;
807  default:
808  break;
809  }
810  return ff_pcm_read_seek(s, 0, timestamp, flags);
811 }
812 
813 static const AVClass wav_demuxer_class = {
814  .class_name = "WAV demuxer",
815  .item_name = av_default_item_name,
816  .option = demux_options,
817  .version = LIBAVUTIL_VERSION_INT,
818 };
820  .name = "wav",
821  .long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
822  .priv_data_size = sizeof(WAVDemuxContext),
823  .read_probe = wav_probe,
824  .read_header = wav_read_header,
825  .read_packet = wav_read_packet,
826  .read_seek = wav_read_seek,
828  .codec_tag = ff_wav_codec_tags_list,
829  .priv_class = &wav_demuxer_class,
830 };
831 #endif /* CONFIG_WAV_DEMUXER */
832 
833 #if CONFIG_W64_DEMUXER
834 static int w64_probe(const AVProbeData *p)
835 {
836  if (p->buf_size <= 40)
837  return 0;
838  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
839  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
840  return AVPROBE_SCORE_MAX;
841  else
842  return 0;
843 }
844 
/**
 * Read the header of a Sony Wave64 file.
 *
 * Checks the leading RIFF and WAVE GUIDs, creates the audio stream, then
 * walks the chunk list handling the fmt, fact, data and summarylist chunks
 * and skipping everything else. On success the input is left positioned at
 * the start of the audio data.
 *
 * @param s demuxer context
 * @return 0 on success; AVERROR_INVALIDDATA on a malformed header or chunk
 *         size, AVERROR(ENOMEM) on allocation failure, AVERROR_EOF when no
 *         data chunk was found, or a negative value passed up from
 *         ff_get_wav_header() / avio_get_str16le()
 */
static int w64_read_header(AVFormatContext *s)
{
    int64_t size, data_ofs = 0;
    AVIOContext *pb = s->pb;
    WAVDemuxContext *wav = s->priv_data;
    AVStream *st;
    uint8_t guid[16];
    int ret;

    avio_read(pb, guid, 16);
    if (memcmp(guid, ff_w64_guid_riff, 16))
        return AVERROR_INVALIDDATA;

    /* riff + wave + fmt + sizes */
    if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
        return AVERROR_INVALIDDATA;

    avio_read(pb, guid, 16);
    if (memcmp(guid, ff_w64_guid_wave, 16)) {
        av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
        return AVERROR_INVALIDDATA;
    }

    /* lets the shared packet reader take its W64 code path */
    wav->w64 = 1;

    st = avformat_new_stream(s, NULL);
    if (!st)
        return AVERROR(ENOMEM);

    /* chunk list: 16-byte GUID, 64-bit size, payload */
    while (!avio_feof(pb)) {
        if (avio_read(pb, guid, 16) != 16)
            break;
        size = avio_rl64(pb);
        /* size includes the 24 header bytes just read; also reject sizes
         * that would overflow when added to the current position */
        if (size <= 24 || INT64_MAX - size < avio_tell(pb))
            return AVERROR_INVALIDDATA;

        if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
            /* subtract chunk header size - normal wav file doesn't count it */
            ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
            if (ret < 0)
                return ret;
            /* skip the padding up to the next multiple of 8 */
            avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);

            avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
        } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
            int64_t samples;

            /* 64-bit value, used as the stream duration when positive */
            samples = avio_rl64(pb);
            if (samples > 0)
                st->duration = samples;
            /* 32 = 24 header bytes + the 8 bytes read above */
            avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
        } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
            wav->data_end = avio_tell(pb) + size - 24;

            data_ofs = avio_tell(pb);
            /* without seeking we could not come back here, so stop at the
             * data; otherwise keep scanning the chunks that follow */
            if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
                break;

            avio_skip(pb, size - 24);
        } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
            int64_t start, end, cur;
            uint32_t count, chunk_size, i;
            int64_t filesize = avio_size(s->pb);

            start = avio_tell(pb);
            end = start + FFALIGN(size, INT64_C(8)) - 24;
            count = avio_rl32(pb);

            /* each entry: 4-byte key, 32-bit size, UTF-16LE value */
            for (i = 0; i < count; i++) {
                char chunk_key[5], *value;

                if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
                    break;

                chunk_key[4] = 0;
                avio_read(pb, chunk_key, 4);
                chunk_size = avio_rl32(pb);
                /* UINT32_MAX would wrap the chunk_size + 1 allocation below */
                if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
                    return AVERROR_INVALIDDATA;

                value = av_malloc(chunk_size + 1);
                if (!value)
                    return AVERROR(ENOMEM);

                ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
                if (ret < 0) {
                    av_free(value);
                    return ret;
                }
                /* skip whatever part of the entry was not consumed */
                avio_skip(pb, chunk_size - ret);

                /* NOTE(review): the flag name suggests the dictionary takes
                 * ownership of value - confirm in the av_dict_set() docs */
                av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
            }

            /* move to the end of the chunk however far the loop got */
            avio_skip(pb, end - avio_tell(pb));
        } else {
            av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
            avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
        }
    }

    /* data_ofs is still 0 when no data chunk was seen */
    if (!data_ofs)
        return AVERROR_EOF;

    ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);

    handle_stream_probing(st);

    /* return to the start of the audio data for packet reading */
    avio_seek(pb, data_ofs, SEEK_SET);

    set_spdif(s, wav);

    return 0;
}
961 
/* AVClass of the W64 demuxer; referenced as .priv_class by the "w64"
 * demuxer definition. */
static const AVClass w64_demuxer_class = {
    .class_name = "W64 demuxer",
    .item_name = av_default_item_name,
    .version = LIBAVUTIL_VERSION_INT,
};
968 
970  .name = "w64",
971  .long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
972  .priv_data_size = sizeof(WAVDemuxContext),
973  .read_probe = w64_probe,
974  .read_header = w64_read_header,
975  .read_packet = wav_read_packet,
976  .read_seek = wav_read_seek,
978  .codec_tag = ff_wav_codec_tags_list,
979  .priv_class = &w64_demuxer_class,
980 };
981 #endif /* CONFIG_W64_DEMUXER */
WAVDemuxContext
Definition: wavdec.c:48
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:313
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:64
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:56
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:358
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:74
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:425
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: utils.c:4374
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:56
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:426
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:146
ff_get_extradata
int ff_get_extradata(AVFormatContext *s, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: utils.c:3282
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:55
MKTAG
#define MKTAG(a, b, c, d)
Definition: common.h:478
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:53
audio_dts
int64_t audio_dts
Definition: movenc.c:61
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:55
id3v2.h
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:61
AVStream::internal
AVStreamInternal * internal
An opaque field for libavformat internal usage.
Definition: avformat.h:1009
AVOption
AVOption.
Definition: opt.h:247
AVStreamInternal::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:383
AVMetadataConv
Definition: metadata.h:34
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:391
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:449
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:332
sample_rate
sample_rate
Definition: ffmpeg_filter.c:156
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:50
video_dts
int64_t video_dts
Definition: movenc.c:61
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31
WAVDemuxContext::w64
int w64
Definition: wavdec.c:51
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:458
return
These buffered frames must be flushed immediately if a new input produces new output. If the input frame is not enough to produce output, the filter must not call request_frame to get more. It must just process the frame or queue it. The task of requesting more frames is left to the filter's request_frame method or the application. If a filter has several inputs, the filter must be ready for frames arriving randomly on any input. Therefore, any filter with several inputs will most likely require some kind of queuing mechanism. It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced. request_frame: For filters that do not use the activate() callback, this method is called when a frame is wanted on an output. For a source, it should directly call filter_frame on the corresponding output. For a filter, if there are queued frames already ready, one of these frames should be pushed. If not, the filter should request a frame on one of its inputs, repeatedly until at least one frame has been pushed. Return values: if request_frame could produce a frame, or at least make progress towards producing a frame, it should return 0.
Definition: filter_design.txt:264
AVCodecParameters::channels
int channels
Audio only.
Definition: codec_par.h:166
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:149
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:538
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:468
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:70
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:423
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:890
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:717
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1188
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation function.
Definition: dict.h:72
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:585
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:764
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
AVInputFormat
Definition: avformat.h:626
ID3v2ExtraMeta
Definition: id3v2.h:84
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:108
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:501
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:631
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:448
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:126
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:422
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:347
channels
channels
Definition: aptx.h:33
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
ff_w64_demuxer
const AVInputFormat ff_w64_demuxer
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:141
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:227
ff_wav_demuxer
const AVInputFormat ff_wav_demuxer
key
const char * key
Definition: hwcontext_opencl.c:168
if
if(ret)
Definition: filter_design.txt:179
AVFormatContext
Format I/O context.
Definition: avformat.h:1107
internal.h
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:994
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:527
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:870
NULL
#define NULL
Definition: coverity.c:32
read_probe
static int read_probe(const AVProbeData *pd)
Definition: jvdec.c:55
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
AVStreamInternal::cur_dts
int64_t cur_dts
Definition: internal.h:410
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:235
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1157
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:885
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:446
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:456
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:170
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:47
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:78
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:57
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample. Only return non-zero if the bits per sample is exactly correct, not an approximation.
Definition: utils.c:496
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:733
AVIOContext
Bytestream IO Context.
Definition: avio.h:161
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:325
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:116
DEC
#define DEC
Definition: wavdec.c:69
id
enum AVCodecID id
Definition: extract_extradata_bsf.c:325
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:260
AVStreamInternal::request_probe
int request_probe
Stream probing state: -1 -> probing finished; 0 -> no probing requested; rest -> perform probing with request_probe being the minimum score to accept.
Definition: internal.h:272
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:116
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:58
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *s, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: utils.c:4799
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:426
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:843
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:263
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:604
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:607
FFMIN
#define FFMIN(a, b)
Definition: common.h:105
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:981
offset
it's the only field you need to keep, assuming you have a context. There is some magic you don't need to care about around this; just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:307
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:173
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:65
i
int i
Definition: input.c:406
log.h
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will be presented to the user.
Definition: packet.h:366
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:725
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:59
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:127
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:177
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:54
ff_id3v2_read_dict
void ff_id3v2_read_dict(AVIOContext *pb, AVDictionary **metadata, const char *magic, ID3v2ExtraMeta **extra_meta)
Read an ID3v2 tag into specified dictionary and retrieve supported extra metadata.
Definition: id3v2.c:1129
value
it's the only field you need to keep, assuming you have a context. There is some magic you don't need to care about around this; just let it vf default value
Definition: writing_filters.txt:86
tb
#define tb
Definition: regdef.h:68
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:346
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
ff_get_wav_header
int ff_get_wav_header(AVFormatContext *s, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:90
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: utils.c:4487
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:281
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1594
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:854
ret
ret
Definition: filter_design.txt:187
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_reading.c:42
AVStream
Stream structure.
Definition: avformat.h:847
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:62
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:243
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:71
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:56
AVStreamInternal::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:386
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:412
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:79
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:848
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:63
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:475
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:60
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:40
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:224
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:616
temp
else temp
Definition: vf_mcdeint.c:259
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
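Full parsing and repack, with timestamp and position generation by the parser for raw streams; this assumes that each packet in the file contains no demuxer-level headers and just codec-level data, otherwise position generation would fail.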
Definition: avformat.h:772
OFFSET
#define OFFSET(x)
Definition: wavdec.c:68
samples
In this document, the word “frame” indicates either a video frame or a group of audio samples.
Definition: filter_design.txt:8
AVPacket::stream_index
int stream_index
Definition: packet.h:375
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:327
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:321
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the coded words.
Definition: codec_par.h:102
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1533
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:502
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:34
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:48
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:60
AVPacket
This structure stores compressed data.
Definition: packet.h:350
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:241
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1141
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:393
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:741
int32_t
int32_t
Definition: audioconvert.c:56
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:561
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:89
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1253
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:52
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:104
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:348
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:3264
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:354