FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * This file is part of FFmpeg.
10  *
11  * FFmpeg is free software; you can redistribute it and/or
12  * modify it under the terms of the GNU Lesser General Public
13  * License as published by the Free Software Foundation; either
14  * version 2.1 of the License, or (at your option) any later version.
15  *
16  * FFmpeg is distributed in the hope that it will be useful,
17  * but WITHOUT ANY WARRANTY; without even the implied warranty of
18  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19  * Lesser General Public License for more details.
20  *
21  * You should have received a copy of the GNU Lesser General Public
22  * License along with FFmpeg; if not, write to the Free Software
23  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
24  */
25 
26 #include <stdint.h>
27 
28 #include "libavutil/avassert.h"
29 #include "libavutil/dict.h"
30 #include "libavutil/intreadwrite.h"
31 #include "libavutil/log.h"
32 #include "libavutil/mathematics.h"
33 #include "libavutil/opt.h"
34 #include "avformat.h"
35 #include "avio.h"
36 #include "avio_internal.h"
37 #include "id3v2.h"
38 #include "internal.h"
39 #include "metadata.h"
40 #include "pcm.h"
41 #include "riff.h"
42 #include "w64.h"
43 #include "spdif.h"
44 
45 typedef struct WAVDemuxContext {
46  const AVClass *class;
47  int64_t data_end;
48  int w64;
49  int64_t smv_data_ofs;
52  int smv_block;
54  int smv_eof;
55  int audio_eof;
57  int spdif;
60  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
61  int rifx; // RIFX: integer byte order for parameters is big endian
63 
65 {
66  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
67  enum AVCodecID codec;
68  int len = 1<<16;
69  int ret = ffio_ensure_seekback(s->pb, len);
70 
71  if (ret >= 0) {
73  if (!buf) {
74  ret = AVERROR(ENOMEM);
75  } else {
76  int64_t pos = avio_tell(s->pb);
77  len = ret = avio_read(s->pb, buf, len);
78  if (len >= 0) {
79  ret = ff_spdif_probe(buf, len, &codec);
81  s->streams[0]->codecpar->codec_id = codec;
82  wav->spdif = 1;
83  }
84  }
85  avio_seek(s->pb, pos, SEEK_SET);
86  av_free(buf);
87  }
88  }
89 
90  if (ret < 0)
91  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
92  }
93 }
94 
95 #if CONFIG_WAV_DEMUXER
96 
97 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
98 {
99  *tag = avio_rl32(pb);
100  if (!big_endian) {
101  return avio_rl32(pb);
102  } else {
103  return avio_rb32(pb);
104  }
105 }
106 
107 /* RIFF chunks are always at even offsets relative to where they start. */
108 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
109 {
110  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
111 
112  return avio_seek(s, offset, whence);
113 }
114 
115 /* return the size of the found tag */
116 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
117 {
118  unsigned int tag;
119  int64_t size;
120 
121  for (;;) {
122  if (avio_feof(pb))
123  return AVERROR_EOF;
124  size = next_tag(pb, &tag, wav->rifx);
125  if (tag == tag1)
126  break;
127  wav_seek_tag(wav, pb, size, SEEK_CUR);
128  }
129  return size;
130 }
131 
132 static int wav_probe(const AVProbeData *p)
133 {
134  /* check file header */
135  if (p->buf_size <= 32)
136  return 0;
137  if (!memcmp(p->buf + 8, "WAVE", 4)) {
138  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
139  /* Since the ACT demuxer has a standard WAV header at the top of
140  * its own, the returned score is decreased to avoid a probe
141  * conflict between ACT and WAV. */
142  return AVPROBE_SCORE_MAX - 1;
143  else if (!memcmp(p->buf, "RF64", 4) &&
144  !memcmp(p->buf + 12, "ds64", 4))
145  return AVPROBE_SCORE_MAX;
146  }
147  return 0;
148 }
149 
/* Cap st->probe_packets at 32 (it is never raised, only lowered).
 * NOTE(review): the embedded line numbers jump from 151 to 154, so the
 * statement that opens the inner brace closed on line 155 is missing from
 * this listing; the condition under which the cap applies cannot be told
 * from here. */
150 static void handle_stream_probing(AVStream *st)
151 {
154  st->probe_packets = FFMIN(st->probe_packets, 32);
155  }
156 }
157 
158 static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream **st)
159 {
160  AVIOContext *pb = s->pb;
161  WAVDemuxContext *wav = s->priv_data;
162  int ret;
163 
164  /* parse fmt header */
165  *st = avformat_new_stream(s, NULL);
166  if (!*st)
167  return AVERROR(ENOMEM);
168 
169  ret = ff_get_wav_header(s, pb, (*st)->codecpar, size, wav->rifx);
170  if (ret < 0)
171  return ret;
172  handle_stream_probing(*st);
173 
174  (*st)->need_parsing = AVSTREAM_PARSE_FULL_RAW;
175 
176  avpriv_set_pts_info(*st, 64, 1, (*st)->codecpar->sample_rate);
177 
178  return 0;
179 }
180 
181 static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream **st)
182 {
183  AVIOContext *pb = s->pb;
184  int version, num_streams, i, channels = 0, ret;
185 
186  if (size < 36)
187  return AVERROR_INVALIDDATA;
188 
189  *st = avformat_new_stream(s, NULL);
190  if (!*st)
191  return AVERROR(ENOMEM);
192 
193  (*st)->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
194  (*st)->codecpar->codec_id = AV_CODEC_ID_XMA2;
195  (*st)->need_parsing = AVSTREAM_PARSE_FULL_RAW;
196 
197  version = avio_r8(pb);
198  if (version != 3 && version != 4)
199  return AVERROR_INVALIDDATA;
200  num_streams = avio_r8(pb);
201  if (size != (32 + ((version==3)?0:8) + 4*num_streams))
202  return AVERROR_INVALIDDATA;
203  avio_skip(pb, 10);
204  (*st)->codecpar->sample_rate = avio_rb32(pb);
205  if (version == 4)
206  avio_skip(pb, 8);
207  avio_skip(pb, 4);
208  (*st)->duration = avio_rb32(pb);
209  avio_skip(pb, 8);
210 
211  for (i = 0; i < num_streams; i++) {
212  channels += avio_r8(pb);
213  avio_skip(pb, 3);
214  }
215  (*st)->codecpar->channels = channels;
216 
217  if ((*st)->codecpar->channels <= 0 || (*st)->codecpar->sample_rate <= 0)
218  return AVERROR_INVALIDDATA;
219 
220  avpriv_set_pts_info(*st, 64, 1, (*st)->codecpar->sample_rate);
221 
222  avio_seek(pb, -size, SEEK_CUR);
223  if ((ret = ff_get_extradata(s, (*st)->codecpar, pb, size)) < 0)
224  return ret;
225 
226  return 0;
227 }
228 
229 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
230  int length)
231 {
232  char temp[257];
233  int ret;
234 
235  av_assert0(length < sizeof(temp));
236  if ((ret = avio_read(s->pb, temp, length)) != length)
237  return ret < 0 ? ret : AVERROR_INVALIDDATA;
238 
239  temp[length] = 0;
240 
241  if (strlen(temp))
242  return av_dict_set(&s->metadata, key, temp, 0);
243 
244  return 0;
245 }
246 
/**
 * Parse a 'bext' chunk from s->pb into s->metadata.
 *
 * Stores the five fixed-length text fields, "time_reference", an optional
 * "umid" (when the version field is >= 1 and the UMID is non-zero) and, when
 * size exceeds 602, the trailing bytes as "coding_history".
 *
 * @param size size of the chunk payload
 * @return 0 on success, a negative AVERROR code otherwise
 *
 * NOTE(review): embedded line 313 (the continuation of the final
 * av_dict_set() call) is missing from this listing.
 */
247 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
248 {
249  char temp[131], *coding_history;
250  int ret, x;
251  uint64_t time_reference;
252  int64_t umid_parts[8], umid_mask = 0;
253 
/* fixed-length text fields: 256 + 32 + 32 + 10 + 8 bytes */
254  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
255  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
256  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
257  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
258  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
259  return ret;
260 
/* 64-bit little-endian value, stored as a decimal string */
261  time_reference = avio_rl64(s->pb);
262  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
263  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
264  return ret;
265 
266  /* check if version is >= 1, in which case an UMID may be present */
267  if (avio_rl16(s->pb) >= 1) {
/* read 8 x 64 bits; umid_mask stays 0 only if every part is 0 */
268  for (x = 0; x < 8; x++)
269  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
270 
271  if (umid_mask) {
272  /* the string formatting below is per SMPTE 330M-2004 Annex C */
273  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
274  umid_parts[6] == 0 && umid_parts[7] == 0) {
275  /* basic UMID */
276  snprintf(temp, sizeof(temp),
277  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
278  umid_parts[0], umid_parts[1],
279  umid_parts[2], umid_parts[3]);
280  } else {
281  /* extended UMID */
282  snprintf(temp, sizeof(temp),
283  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
284  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
285  umid_parts[0], umid_parts[1],
286  umid_parts[2], umid_parts[3],
287  umid_parts[4], umid_parts[5],
288  umid_parts[6], umid_parts[7]);
289  }
290 
291  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
292  return ret;
293  }
294 
/* 64 bytes were consumed above; skipping 190 more matches the 254 bytes
 * skipped in the else branch, so both paths end 602 bytes into the chunk */
295  avio_skip(s->pb, 190);
296  } else
297  avio_skip(s->pb, 254);
298 
299  if (size > 602) {
300  /* CodingHistory present */
301  size -= 602;
302 
/* one extra byte for the terminating 0 written below */
303  if (!(coding_history = av_malloc(size + 1)))
304  return AVERROR(ENOMEM);
305 
306  if ((ret = avio_read(s->pb, coding_history, size)) != size) {
307  av_free(coding_history);
308  return ret < 0 ? ret : AVERROR_INVALIDDATA;
309  }
310 
311  coding_history[size] = 0;
312  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
314  return ret;
315  }
316 
317  return 0;
318 }
319 
/* Metadata key conversion table passed to ff_metadata_conv_ctx() by both
 * header readers in this file. The first string of each pair is a key
 * written by wav_parse_bext_tag(); presumably the second is the generic key
 * it is renamed to (confirm against metadata.h). The { 0 } entry ends the
 * table. */
320 static const AVMetadataConv wav_metadata_conv[] = {
321  { "description", "comment" },
322  { "originator", "encoded_by" },
323  { "origination_date", "date" },
324  { "origination_time", "creation_time" },
325  { 0 },
326 };
327 
328 /* wav input */
/**
 * Read the RIFF / RIFX / RF64 WAVE header and walk the chunk list.
 *
 * Chunks handled in the loop: 'fmt ' and 'XMA2' create the audio stream
 * (only the first of either is parsed), 'data' records where the payload
 * starts and ends, 'fact' supplies sample_count when none is known yet,
 * 'bext', 'LIST'/'INFO' and 'ID3 '/'id3 ' feed metadata, and 'SMV0' sets up
 * an additional video stream. After the loop the reader seeks back to the
 * data offset, sanity-checks sample_count against data_size and sets
 * st->duration.
 *
 * @return 0 on success, a negative AVERROR code otherwise
 *
 * NOTE(review): the embedded line numbers have gaps (421, 471-472, 494, 571,
 * 580, 585-586, 590, 592, 600), so several statements of this function are
 * missing from this listing.
 */
329 static int wav_read_header(AVFormatContext *s)
330 {
331  int64_t size, av_uninit(data_size);
332  int64_t sample_count = 0;
333  int rf64 = 0;
334  uint32_t tag;
335  AVIOContext *pb = s->pb;
336  AVStream *st = NULL;
337  WAVDemuxContext *wav = s->priv_data;
338  int ret, got_fmt = 0, got_xma2 = 0;
339  int64_t next_tag_ofs, data_ofs = -1;
340 
/* remember whether the header starts at an odd offset; wav_seek_tag() uses
 * this when rounding seek targets */
341  wav->unaligned = avio_tell(s->pb) & 1;
342 
/* -1 means no SMV data was found */
343  wav->smv_data_ofs = -1;
344 
345  /* read chunk ID */
346  tag = avio_rl32(pb);
347  switch (tag) {
348  case MKTAG('R', 'I', 'F', 'F'):
349  break;
350  case MKTAG('R', 'I', 'F', 'X'):
351  wav->rifx = 1;
352  break;
353  case MKTAG('R', 'F', '6', '4'):
354  rf64 = 1;
355  break;
356  default:
357  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
358  av_fourcc2str(tag));
359  return AVERROR_INVALIDDATA;
360  }
361 
362  /* read chunk size */
363  avio_rl32(pb);
364 
365  /* read format */
366  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
367  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
368  return AVERROR_INVALIDDATA;
369  }
370 
/* RF64: a 'ds64' chunk of at least 24 bytes must follow; it carries the
 * 64-bit data_size and sample_count */
371  if (rf64) {
372  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
373  return AVERROR_INVALIDDATA;
374  size = avio_rl32(pb);
375  if (size < 24)
376  return AVERROR_INVALIDDATA;
377  avio_rl64(pb); /* RIFF size */
378 
379  data_size = avio_rl64(pb);
380  sample_count = avio_rl64(pb);
381 
382  if (data_size < 0 || sample_count < 0) {
383  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
384  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
385  data_size, sample_count);
386  return AVERROR_INVALIDDATA;
387  }
388  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
389 
390  }
391 
/* chunk loop: read a header, dispatch on the tag, then seek to the next
 * chunk */
392  for (;;) {
393  AVStream *vst;
394  size = next_tag(pb, &tag, wav->rifx);
395  next_tag_ofs = avio_tell(pb) + size;
396 
397  if (avio_feof(pb))
398  break;
399 
400  switch (tag) {
401  case MKTAG('f', 'm', 't', ' '):
402  /* only parse the first 'fmt ' tag found */
403  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, &st)) < 0) {
404  return ret;
405  } else if (got_fmt)
406  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
407 
408  got_fmt = 1;
409  break;
410  case MKTAG('X', 'M', 'A', '2'):
411  /* only parse the first 'XMA2' tag found */
412  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, &st)) < 0) {
413  return ret;
414  } else if (got_xma2)
415  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
416 
417  got_xma2 = 1;
418  break;
419  case MKTAG('d', 'a', 't', 'a'):
/* on non-seekable input the format chunk must precede 'data' */
420  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
422  "found no 'fmt ' tag before the 'data' tag\n");
423  return AVERROR_INVALIDDATA;
424  }
425 
/* data_end: RF64 uses the ds64 size; a chunk size of 0 or 0xFFFFFFFF
 * leaves the end at INT64_MAX */
426  if (rf64) {
427  next_tag_ofs = wav->data_end = avio_tell(pb) + data_size;
428  } else if (size != 0xFFFFFFFF) {
429  data_size = size;
430  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
431  } else {
432  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
433  "file may be invalid\n");
434  data_size = 0;
435  next_tag_ofs = wav->data_end = INT64_MAX;
436  }
437 
438  data_ofs = avio_tell(pb);
439 
440  /* don't look for footer metadata if we can't seek or if we don't
441  * know where the data tag ends
442  */
443  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!rf64 && !size))
444  goto break_loop;
445  break;
446  case MKTAG('f', 'a', 'c', 't'):
/* keep a sample_count already obtained (e.g. from ds64) */
447  if (!sample_count)
448  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
449  break;
450  case MKTAG('b', 'e', 'x', 't'):
451  if ((ret = wav_parse_bext_tag(s, size)) < 0)
452  return ret;
453  break;
454  case MKTAG('S','M','V','0'):
455  if (!got_fmt) {
456  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
457  return AVERROR_INVALIDDATA;
458  }
459  // SMV file, a wav file with video appended.
/* the size field of this chunk holds the four characters "0200" */
460  if (size != MKTAG('0','2','0','0')) {
461  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
462  goto break_loop;
463  }
464  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
465  wav->smv_given_first = 0;
466  vst = avformat_new_stream(s, NULL);
467  if (!vst)
468  return AVERROR(ENOMEM);
469  avio_r8(pb);
470  vst->id = 1;
473  vst->codecpar->width = avio_rl24(pb);
474  vst->codecpar->height = avio_rl24(pb);
475  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
476  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
477  return ret;
478  }
479  size = avio_rl24(pb);
480  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
481  avio_rl24(pb);
482  wav->smv_block_size = avio_rl24(pb);
483  if (!wav->smv_block_size)
484  return AVERROR_INVALIDDATA;
485  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
486  vst->duration = avio_rl24(pb);
487  avio_rl24(pb);
488  avio_rl24(pb);
489  wav->smv_frames_per_jpeg = avio_rl24(pb);
490  if (wav->smv_frames_per_jpeg > 65536) {
491  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
492  return AVERROR_INVALIDDATA;
493  }
495  wav->smv_cur_pt = 0;
496  goto break_loop;
497  case MKTAG('L', 'I', 'S', 'T'):
498  if (size < 4) {
499  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
500  return AVERROR_INVALIDDATA;
501  }
/* only the INFO list type is read; other list types fall through to the
 * seek below */
502  switch (avio_rl32(pb)) {
503  case MKTAG('I', 'N', 'F', 'O'):
504  ff_read_riff_info(s, size - 4);
505  }
506  break;
507  case MKTAG('I', 'D', '3', ' '):
508  case MKTAG('i', 'd', '3', ' '): {
509  ID3v2ExtraMeta *id3v2_extra_meta = NULL;
510  ff_id3v2_read_dict(pb, &s->internal->id3v2_meta, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta);
511  if (id3v2_extra_meta) {
512  ff_id3v2_parse_apic(s, id3v2_extra_meta);
513  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
514  ff_id3v2_parse_priv(s, id3v2_extra_meta);
515  }
516  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
517  }
518  break;
519  }
520 
521  /* seek to next tag unless we know that we'll run into EOF */
522  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
523  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
524  break;
525  }
526  }
527 
528 break_loop:
529  if (!got_fmt && !got_xma2) {
530  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
531  return AVERROR_INVALIDDATA;
532  }
533 
534  if (data_ofs < 0) {
535  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
536  return AVERROR_INVALIDDATA;
537  }
538 
/* position the reader at the first payload byte */
539  avio_seek(pb, data_ofs, SEEK_SET);
540 
/* data_size is shifted left by 3 below; larger values are dropped here */
541  if (data_size > (INT64_MAX>>3)) {
542  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
543  data_size = 0;
544  }
545 
/* if dividing sample_count by the channel count brings the implied bit rate
 * within 30% of the declared one, sample_count is divided by channels */
546  if ( st->codecpar->bit_rate > 0 && data_size > 0
547  && st->codecpar->sample_rate > 0
548  && sample_count > 0 && st->codecpar->channels > 1
549  && sample_count % st->codecpar->channels == 0) {
550  if (fabs(8.0 * data_size * st->codecpar->channels * st->codecpar->sample_rate /
551  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
552  sample_count /= st->codecpar->channels;
553  }
554 
/* discard sample_count when it implies more bits per sample and channel
 * than bits_per_coded_sample + 1 */
555  if ( data_size > 0 && sample_count && st->codecpar->channels
556  && (data_size << 3) / sample_count / st->codecpar->channels > st->codecpar->bits_per_coded_sample + 1) {
557  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
558  sample_count = 0;
559  }
560 
561  /* G.729 hack (for Ticket4577)
562  * FIXME: Come up with cleaner, more general solution */
563  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
564  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
565  sample_count = 0;
566  }
567 
/* derive sample_count from the payload size when none is known or the codec
 * has an exact bits-per-sample value */
568  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
569  if ( st->codecpar->channels
570  && data_size
572  && wav->data_end <= avio_size(pb))
573  sample_count = (data_size << 3)
574  /
575  (st->codecpar->channels * (uint64_t)av_get_bits_per_sample(st->codecpar->codec_id));
576 
577  if (sample_count)
578  st->duration = sample_count;
579 
/* NOTE(review): the opening of this if/else chain and several of its branch
 * bodies are missing from this listing */
581  st->codecpar->block_align == st->codecpar->channels * 4 &&
582  st->codecpar->bits_per_coded_sample == 32 &&
583  st->codecpar->extradata_size == 2 &&
584  AV_RL16(st->codecpar->extradata) == 1) {
587  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
588  st->codecpar->block_align == st->codecpar->channels * 4 &&
589  st->codecpar->bits_per_coded_sample == 24) {
591  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
593  st->codecpar->block_align = 2048;
594  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->channels > 2 &&
595  st->codecpar->block_align < INT_MAX / st->codecpar->channels) {
596  st->codecpar->block_align *= st->codecpar->channels;
597  }
598 
599  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
601 
602  set_spdif(s, wav);
603 
604  return 0;
605 }
606 
607 /**
608  * Find chunk with w64 GUID by skipping over other chunks.
609  * @return the size of the found chunk
610  */
611 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
612 {
613  uint8_t guid[16];
614  int64_t size;
615 
616  while (!avio_feof(pb)) {
617  avio_read(pb, guid, 16);
618  size = avio_rl64(pb);
619  if (size <= 24 || size > INT64_MAX - 8)
620  return AVERROR_INVALIDDATA;
621  if (!memcmp(guid, guid1, 16))
622  return size;
623  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
624  }
625  return AVERROR_EOF;
626 }
627 
628 #define MAX_SIZE 4096
629 
/**
 * Read the next packet.
 *
 * When wav->spdif is 1 the call is handed to ff_spdif_read_packet(). When
 * SMV data is present (wav->smv_data_ofs > 0) the function chooses between
 * a video packet for stream 1, read from
 * smv_data_ofs + smv_block * smv_block_size, and an audio packet for
 * stream 0. Audio packets hold up to MAX_SIZE bytes (or one block_align if
 * that is larger), rounded down to a multiple of block_align and clamped to
 * the bytes left before wav->data_end. When the current data chunk is used
 * up, the next one is searched with find_guid() (w64) or find_tag().
 *
 * @return the av_get_packet() result on success, a negative AVERROR code
 *         otherwise
 *
 * NOTE(review): embedded line 646 is missing from this listing; it
 * presumably opens the block closed on line 652.
 */
630 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
631 {
632  int ret, size;
633  int64_t left;
634  AVStream *st;
635  WAVDemuxContext *wav = s->priv_data;
636 
637  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
638  return ff_spdif_read_packet(s, pkt);
639 
640  if (wav->smv_data_ofs > 0) {
641  int64_t audio_dts, video_dts;
642 smv_retry:
643  audio_dts = (int32_t)s->streams[0]->cur_dts;
644  video_dts = (int32_t)s->streams[1]->cur_dts;
645 
647  /*We always return a video frame first to get the pixel format first*/
648  wav->smv_last_stream = wav->smv_given_first ?
649  av_compare_ts(video_dts, s->streams[1]->time_base,
650  audio_dts, s->streams[0]->time_base) > 0 : 0;
651  wav->smv_given_first = 1;
652  }
/* invert the selection, then force video once audio is exhausted and never
 * pick video once the SMV data is exhausted */
653  wav->smv_last_stream = !wav->smv_last_stream;
654  wav->smv_last_stream |= wav->audio_eof;
655  wav->smv_last_stream &= !wav->smv_eof;
656  if (wav->smv_last_stream) {
/* video: remember the audio read position, read one block, then seek back */
657  uint64_t old_pos = avio_tell(s->pb);
658  uint64_t new_pos = wav->smv_data_ofs +
659  wav->smv_block * (int64_t)wav->smv_block_size;
660  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
661  ret = AVERROR_EOF;
662  goto smv_out;
663  }
/* each block starts with a 24-bit little-endian packet size */
664  size = avio_rl24(s->pb);
665  ret = av_get_packet(s->pb, pkt, size);
666  if (ret < 0)
667  goto smv_out;
/* include the 3-byte size field in the reported position */
668  pkt->pos -= 3;
669  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg + wav->smv_cur_pt;
670  wav->smv_cur_pt++;
671  if (wav->smv_frames_per_jpeg > 0)
672  wav->smv_cur_pt %= wav->smv_frames_per_jpeg;
/* advance to the next block once smv_cur_pt has wrapped to 0 */
673  if (!wav->smv_cur_pt)
674  wav->smv_block++;
675 
676  pkt->stream_index = 1;
677 smv_out:
678  avio_seek(s->pb, old_pos, SEEK_SET);
679  if (ret == AVERROR_EOF) {
680  wav->smv_eof = 1;
681  goto smv_retry;
682  }
683  return ret;
684  }
685  }
686 
687  st = s->streams[0];
688 
689  left = wav->data_end - avio_tell(s->pb);
690  if (wav->ignore_length)
691  left = INT_MAX;
692  if (left <= 0) {
/* current data chunk is used up: look for another one */
693  if (CONFIG_W64_DEMUXER && wav->w64)
694  left = find_guid(s->pb, ff_w64_guid_data) - 24;
695  else
696  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
697  if (left < 0) {
698  wav->audio_eof = 1;
699  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
700  goto smv_retry;
701  return AVERROR_EOF;
702  }
703  wav->data_end = avio_tell(s->pb) + left;
704  }
705 
706  size = MAX_SIZE;
707  if (st->codecpar->block_align > 1) {
708  if (size < st->codecpar->block_align)
709  size = st->codecpar->block_align;
710  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
711  }
712  size = FFMIN(size, left);
713  ret = av_get_packet(s->pb, pkt, size);
714  if (ret < 0)
715  return ret;
716  pkt->stream_index = 0;
717 
718  return ret;
719 }
720 
721 static int wav_read_seek(AVFormatContext *s,
722  int stream_index, int64_t timestamp, int flags)
723 {
724  WAVDemuxContext *wav = s->priv_data;
725  AVStream *st;
726  wav->smv_eof = 0;
727  wav->audio_eof = 0;
728  if (wav->smv_data_ofs > 0) {
729  int64_t smv_timestamp = timestamp;
730  if (stream_index == 0)
731  smv_timestamp = av_rescale_q(timestamp, s->streams[0]->time_base, s->streams[1]->time_base);
732  else
733  timestamp = av_rescale_q(smv_timestamp, s->streams[1]->time_base, s->streams[0]->time_base);
734  if (wav->smv_frames_per_jpeg > 0) {
735  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
736  wav->smv_cur_pt = smv_timestamp % wav->smv_frames_per_jpeg;
737  }
738  }
739 
740  st = s->streams[0];
741  switch (st->codecpar->codec_id) {
742  case AV_CODEC_ID_MP2:
743  case AV_CODEC_ID_MP3:
744  case AV_CODEC_ID_AC3:
745  case AV_CODEC_ID_DTS:
746  case AV_CODEC_ID_XMA2:
747  /* use generic seeking with dynamically generated indexes */
748  return -1;
749  default:
750  break;
751  }
752  return ff_pcm_read_seek(s, stream_index, timestamp, flags);
753 }
754 
/* OFFSET(x): byte offset of field x inside WAVDemuxContext, used to bind an
 * option to its storage. DEC: shorthand for the decoding-parameter flag. */
755 #define OFFSET(x) offsetof(WAVDemuxContext, x)
756 #define DEC AV_OPT_FLAG_DECODING_PARAM
/* Private options of the WAV demuxer. "ignore_length" is a boolean
 * (default 0, range 0..1) stored in WAVDemuxContext.ignore_length; when it
 * is set, wav_read_packet() replaces the remaining-byte count with INT_MAX.
 * The { NULL } entry ends the table. */
757 static const AVOption demux_options[] = {
758  { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
759  { NULL },
760 };
761 
/* AVClass for the WAV demuxer; it exposes demux_options and is referenced
 * through .priv_class in the WAV demuxer definition below. */
762 static const AVClass wav_demuxer_class = {
763  .class_name = "WAV demuxer",
764  .item_name = av_default_item_name,
765  .option = demux_options,
766  .version = LIBAVUTIL_VERSION_INT,
767 };
769  .name = "wav",
770  .long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
771  .priv_data_size = sizeof(WAVDemuxContext),
772  .read_probe = wav_probe,
773  .read_header = wav_read_header,
774  .read_packet = wav_read_packet,
775  .read_seek = wav_read_seek,
777  .codec_tag = (const AVCodecTag * const []) { ff_codec_wav_tags, 0 },
778  .priv_class = &wav_demuxer_class,
779 };
780 #endif /* CONFIG_WAV_DEMUXER */
781 
782 #if CONFIG_W64_DEMUXER
783 static int w64_probe(const AVProbeData *p)
784 {
785  if (p->buf_size <= 40)
786  return 0;
787  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
788  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
789  return AVPROBE_SCORE_MAX;
790  else
791  return 0;
792 }
793 
/**
 * Read a Sony Wave64 header.
 *
 * Verifies the RIFF and WAVE GUIDs, creates the audio stream, then walks the
 * chunk list: the fmt chunk fills the codec parameters, the fact chunk may
 * set st->duration, the data chunk records the payload offset and end, and
 * the summarylist chunk is converted into metadata entries. Finally the
 * reader seeks to the start of the data payload.
 *
 * @return 0 on success, AVERROR_EOF if no data chunk was found, another
 *         negative AVERROR code on failure
 *
 * NOTE(review): embedded lines 899 and 902 are missing from this listing.
 */
794 static int w64_read_header(AVFormatContext *s)
795 {
796  int64_t size, data_ofs = 0;
797  AVIOContext *pb = s->pb;
798  WAVDemuxContext *wav = s->priv_data;
799  AVStream *st;
800  uint8_t guid[16];
801  int ret;
802 
803  avio_read(pb, guid, 16);
804  if (memcmp(guid, ff_w64_guid_riff, 16))
805  return AVERROR_INVALIDDATA;
806 
807  /* riff + wave + fmt + sizes */
808  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
809  return AVERROR_INVALIDDATA;
810 
811  avio_read(pb, guid, 16);
812  if (memcmp(guid, ff_w64_guid_wave, 16)) {
813  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
814  return AVERROR_INVALIDDATA;
815  }
816 
/* makes wav_read_packet() look for further data chunks with find_guid() */
817  wav->w64 = 1;
818 
819  st = avformat_new_stream(s, NULL);
820  if (!st)
821  return AVERROR(ENOMEM);
822 
/* chunk loop: 16-byte GUID plus 64-bit size; the size includes these 24
 * header bytes */
823  while (!avio_feof(pb)) {
824  if (avio_read(pb, guid, 16) != 16)
825  break;
826  size = avio_rl64(pb);
827  if (size <= 24 || INT64_MAX - size < avio_tell(pb))
828  return AVERROR_INVALIDDATA;
829 
830  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
831  /* subtract chunk header size - normal wav file doesn't count it */
832  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
833  if (ret < 0)
834  return ret;
/* skip the padding up to the next multiple of 8 */
835  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
836 
837  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
838  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
839  int64_t samples;
840 
841  samples = avio_rl64(pb);
842  if (samples > 0)
843  st->duration = samples;
/* 32 = 24 header bytes + the 8 bytes just read */
844  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
845  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
846  wav->data_end = avio_tell(pb) + size - 24;
847 
848  data_ofs = avio_tell(pb);
/* on non-seekable input, stop at the payload */
849  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
850  break;
851 
852  avio_skip(pb, size - 24);
853  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
854  int64_t start, end, cur;
855  uint32_t count, chunk_size, i;
856  int64_t filesize = avio_size(s->pb);
857 
858  start = avio_tell(pb);
859  end = start + FFALIGN(size, INT64_C(8)) - 24;
860  count = avio_rl32(pb);
861 
/* each entry: 4-character key, 32-bit size, UTF-16LE value */
862  for (i = 0; i < count; i++) {
863  char chunk_key[5], *value;
864 
865  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
866  break;
867 
868  chunk_key[4] = 0;
869  avio_read(pb, chunk_key, 4);
870  chunk_size = avio_rl32(pb);
/* UINT32_MAX would make chunk_size + 1 wrap to 0 below */
871  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
872  return AVERROR_INVALIDDATA;
873 
874  value = av_mallocz(chunk_size + 1);
875  if (!value)
876  return AVERROR(ENOMEM);
877 
878  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
879  if (ret < 0) {
880  av_free(value);
881  return ret;
882  }
/* skip whatever part of the entry the string read did not consume */
883  avio_skip(pb, chunk_size - ret);
884 
/* AV_DICT_DONT_STRDUP_VAL: the dictionary takes ownership of value */
885  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
886  }
887 
888  avio_skip(pb, end - avio_tell(pb));
889  } else {
890  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
891  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
892  }
893  }
894 
/* data_ofs is still 0 when no data chunk was seen */
895  if (!data_ofs)
896  return AVERROR_EOF;
897 
898  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
900 
901  handle_stream_probing(st);
903 
904  avio_seek(pb, data_ofs, SEEK_SET);
905 
906  set_spdif(s, wav);
907 
908  return 0;
909 }
910 
912  .name = "w64",
913  .long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
914  .priv_data_size = sizeof(WAVDemuxContext),
915  .read_probe = w64_probe,
916  .read_header = w64_read_header,
917  .read_packet = wav_read_packet,
918  .read_seek = wav_read_seek,
920  .codec_tag = (const AVCodecTag * const []) { ff_codec_wav_tags, 0 },
921 };
922 #endif /* CONFIG_W64_DEMUXER */
WAVDemuxContext
Definition: wavdec.c:45
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:301
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:60
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:52
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:346
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:74
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:413
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
Definition: utils.c:4526
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:56
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:426
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:147
ff_get_extradata
int ff_get_extradata(AVFormatContext *s, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and f...
Definition: utils.c:3346
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:55
MKTAG
#define MKTAG(a, b, c, d)
Definition: common.h:406
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:49
audio_dts
int64_t audio_dts
Definition: movenc.c:60
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:51
WAVDemuxContext::smv_cur_pt
int smv_cur_pt
Definition: wavdec.c:58
id3v2.h
end
static av_cold int end(AVCodecContext *avctx)
Definition: avrndec.c:92
AVOption
AVOption.
Definition: opt.h:246
AVMetadataConv
Definition: metadata.h:34
ff_codec_wav_tags
const AVCodecTag ff_codec_wav_tags[]
Definition: riff.c:506
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:444
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1180
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:334
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:47
video_dts
int64_t video_dts
Definition: movenc.c:60
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31
WAVDemuxContext::w64
int w64
Definition: wavdec.c:48
ff_wav_demuxer
AVInputFormat ff_wav_demuxer
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:453
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:264
AVCodecParameters::channels
int channels
Audio only.
Definition: codec_par.h:166
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:153
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:557
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:463
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:411
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:914
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:731
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation function.
Definition: dict.h:74
ff_w64_demuxer
AVInputFormat ff_w64_demuxer
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:778
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
AVInputFormat
Definition: avformat.h:636
AVCodecTag
Definition: internal.h:42
ID3v2ExtraMeta
Definition: id3v2.h:84
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:105
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:490
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:641
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:443
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:126
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:410
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:197
AVStream::need_parsing
enum AVStreamParseType need_parsing
Definition: avformat.h:1083
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:336
channels
channels
Definition: aptx.h:33
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:90
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:228
MAX_SIZE
#define MAX_SIZE
Definition: vf_unsharp.c:305
key
const char * key
Definition: hwcontext_opencl.c:168
int32_t
int32_t
Definition: audio_convert.c:194
if
if(ret)
Definition: filter_design.txt:179
AVFormatContext
Format I/O context.
Definition: avformat.h:1335
internal.h
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1012
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:527
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:67
NULL
#define NULL
Definition: coverity.c:32
read_probe
static int read_probe(const AVProbeData *pd)
Definition: jvdec.c:55
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:235
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1140
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:899
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:441
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:451
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:170
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:46
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:78
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:1574
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:53
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:747
AVIOContext
Bytestream IO Context.
Definition: avio.h:161
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:313
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:188
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:260
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:116
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:54
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *s, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: utils.c:4948
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:414
AVStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: avformat.h:1075
size
int size
Definition: twinvq_data.h:11134
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:258
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:591
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:616
FFMIN
#define FFMIN(a, b)
Definition: common.h:96
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:982
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:292
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:173
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:61
log.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will be presented to the user.
Definition: packet.h:348
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:739
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:55
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:127
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:177
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:50
ff_id3v2_read_dict
void ff_id3v2_read_dict(AVIOContext *pb, AVDictionary **metadata, const char *magic, ID3v2ExtraMeta **extra_meta)
Read an ID3v2 tag into specified dictionary and retrieve supported extra metadata.
Definition: id3v2.c:1112
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
uint8_t
uint8_t
Definition: audio_convert.c:194
av_mallocz
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if available on the CPU) and zero all the bytes of the block.
Definition: mem.c:237
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:335
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:452
ff_get_wav_header
int ff_get_wav_header(AVFormatContext *s, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:91
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:1490
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:307
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1532
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:872
ret
ret
Definition: filter_design.txt:187
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_reading.c:42
AVStream
Stream structure.
Definition: avformat.h:865
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:57
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:241
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:72
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:56
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:412
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: avcodec.h:215
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:64
OFFSET
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default minimum maximum flags name is the option keep it simple and lowercase description are in without and describe what they for example set the foo of the bar offset is the offset of the field in your see the OFFSET() macro
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:59
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:463
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:56
pkt
static AVPacket pkt
Definition: demuxing_decoding.c:54
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:40
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:625
temp
else temp
Definition: vf_mcdeint.c:256
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
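full parsing and repack with timestamp and position generation by parser for raw; this assumes that each packet in the file contains no demuxer level headers and just codec level data, otherwise position generation would fail.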
Definition: avformat.h:790
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
AVStream::request_probe
int request_probe
stream probing state: -1 -> probing finished; 0 -> no probing requested; rest -> perform probing with request_probe being the minimum score to accept.
Definition: avformat.h:1122
AVPacket::stream_index
int stream_index
Definition: packet.h:357
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:329
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:309
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the coded words.
Definition: codec_par.h:102
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1642
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:491
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:34
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:48
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:60
AVPacket
This structure stores compressed data.
Definition: packet.h:332
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:240
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1124
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:375
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:755
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:565
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:89
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1271
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
snprintf
#define snprintf
Definition: snprintf.h:34
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:101
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:348
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:3328
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:356
DEC
#define DEC
Definition: librsvgdec.c:105