FFmpeg
wavdec.c
Go to the documentation of this file.
1 /*
2  * WAV demuxer
3  * Copyright (c) 2001, 2002 Fabrice Bellard
4  *
5  * Sony Wave64 demuxer
6  * RF64 demuxer
7  * Copyright (c) 2009 Daniel Verkamp
8  *
9  * BW64 demuxer
10  *
11  * This file is part of FFmpeg.
12  *
13  * FFmpeg is free software; you can redistribute it and/or
14  * modify it under the terms of the GNU Lesser General Public
15  * License as published by the Free Software Foundation; either
16  * version 2.1 of the License, or (at your option) any later version.
17  *
18  * FFmpeg is distributed in the hope that it will be useful,
19  * but WITHOUT ANY WARRANTY; without even the implied warranty of
20  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
21  * Lesser General Public License for more details.
22  *
23  * You should have received a copy of the GNU Lesser General Public
24  * License along with FFmpeg; if not, write to the Free Software
25  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
26  */
27 
28 #include <stdint.h>
29 
30 #include "config_components.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/dict.h"
33 #include "libavutil/intreadwrite.h"
34 #include "libavutil/log.h"
35 #include "libavutil/mathematics.h"
36 #include "libavutil/mem.h"
37 #include "libavutil/opt.h"
38 #include "libavcodec/internal.h"
39 #include "avformat.h"
40 #include "avio.h"
41 #include "avio_internal.h"
42 #include "demux.h"
43 #include "id3v2.h"
44 #include "internal.h"
45 #include "metadata.h"
46 #include "pcm.h"
47 #include "riff.h"
48 #include "w64.h"
49 #include "spdif.h"
50 
51 typedef struct WAVDemuxContext {
52  const AVClass *class;
53  int64_t data_end;
54  int w64;
56  int64_t smv_data_ofs;
59  int smv_block;
61  int smv_eof;
62  int audio_eof;
64  int max_size;
65  int spdif;
67  int unaligned; // e.g. if an odd number of bytes ID3 tag was prepended
68  int rifx; // RIFX: integer byte order for parameters is big endian
70 
/* Byte offset of field x inside WAVDemuxContext, as stored in the option table. */
#define OFFSET(x) offsetof(WAVDemuxContext, x)
/* Shorthand for the flag set on every option below. */
#define DEC AV_OPT_FLAG_DECODING_PARAM
/*
 * Private options of the demuxer context.
 *
 * "ignore_length" is only compiled in when CONFIG_WAV_DEMUXER is set.
 * W64_DEMUXER_OPTIONS_OFFSET expands to 1 * CONFIG_WAV_DEMUXER, i.e. the
 * number of WAV-only entries that precede "max_size" when the config macro
 * is 0 or 1.
 */
static const AVOption demux_options[] = {
#define W64_DEMUXER_OPTIONS_OFFSET (1 * CONFIG_WAV_DEMUXER)
#if CONFIG_WAV_DEMUXER
    { "ignore_length", "Ignore length", OFFSET(ignore_length), AV_OPT_TYPE_BOOL, { .i64 = 0 }, 0, 1, DEC },
#endif
    /* default 0; set_max_size() treats a value <= 0 as "pick a default" */
    { "max_size", "max size of single packet", OFFSET(max_size), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1 << 22, DEC },
    { NULL }, /* table terminator */
};
81 
82 static void set_max_size(AVStream *st, WAVDemuxContext *wav)
83 {
84  if (wav->max_size <= 0) {
85  int max_size = ff_pcm_default_packet_size(st->codecpar);
86  wav->max_size = max_size < 0 ? 4096 : max_size;
87  }
88 }
89 
91 {
92  if (CONFIG_SPDIF_DEMUXER && s->streams[0]->codecpar->codec_tag == 1) {
93  enum AVCodecID codec;
94  int len = 1<<16;
95  int ret = ffio_ensure_seekback(s->pb, len);
96 
97  if (ret >= 0) {
98  uint8_t *buf = av_malloc(len + AV_INPUT_BUFFER_PADDING_SIZE);
99  if (!buf) {
100  ret = AVERROR(ENOMEM);
101  } else {
102  int64_t pos = avio_tell(s->pb);
103  len = ret = avio_read(s->pb, buf, len);
104  if (len >= 0) {
105  ret = ff_spdif_probe(buf, len, &codec);
107  s->streams[0]->codecpar->codec_id = codec;
108  wav->spdif = 1;
109  }
110  }
111  avio_seek(s->pb, pos, SEEK_SET);
112  av_free(buf);
113  }
114  }
115 
116  if (ret < 0)
117  av_log(s, AV_LOG_WARNING, "Cannot check for SPDIF\n");
118  }
119 }
120 
121 #if CONFIG_WAV_DEMUXER
122 
123 static int64_t next_tag(AVIOContext *pb, uint32_t *tag, int big_endian)
124 {
125  *tag = avio_rl32(pb);
126  if (!big_endian) {
127  return avio_rl32(pb);
128  } else {
129  return avio_rb32(pb);
130  }
131 }
132 
133 /* RIFF chunks are always at even offsets relative to where they start. */
134 static int64_t wav_seek_tag(WAVDemuxContext * wav, AVIOContext *s, int64_t offset, int whence)
135 {
136  offset += offset < INT64_MAX && offset + wav->unaligned & 1;
137 
138  return avio_seek(s, offset, whence);
139 }
140 
141 /* return the size of the found tag */
142 static int64_t find_tag(WAVDemuxContext * wav, AVIOContext *pb, uint32_t tag1)
143 {
144  unsigned int tag;
145  int64_t size;
146 
147  for (;;) {
148  if (avio_feof(pb))
149  return AVERROR_EOF;
150  size = next_tag(pb, &tag, wav->rifx);
151  if (tag == tag1)
152  break;
153  wav_seek_tag(wav, pb, size, SEEK_CUR);
154  }
155  return size;
156 }
157 
158 static int wav_probe(const AVProbeData *p)
159 {
160  /* check file header */
161  if (p->buf_size <= 32)
162  return 0;
163  if (!memcmp(p->buf + 8, "WAVE", 4)) {
164  if (!memcmp(p->buf, "RIFF", 4) || !memcmp(p->buf, "RIFX", 4))
165  /* Since the ACT demuxer has a standard WAV header at the top of
166  * its own, the returned score is decreased to avoid a probe
167  * conflict between ACT and WAV. */
168  return AVPROBE_SCORE_MAX - 1;
169  else if ((!memcmp(p->buf, "RF64", 4) ||
170  !memcmp(p->buf, "BW64", 4)) &&
171  !memcmp(p->buf + 12, "ds64", 4))
172  return AVPROBE_SCORE_MAX;
173  }
174  return 0;
175 }
176 
177 static void handle_stream_probing(AVStream *st)
178 {
180  FFStream *const sti = ffstream(st);
182  sti->probe_packets = FFMIN(sti->probe_packets, 32);
183  }
184 }
185 
/**
 * Parse a 'fmt ' chunk into the codec parameters of st.
 *
 * @param s     demuxer context; its priv_data supplies the rifx flag
 * @param size  size of the chunk payload, forwarded to ff_get_wav_header()
 * @param st    stream whose codecpar is filled in
 * @return 0 on success, or the negative error returned by
 *         ff_get_wav_header()
 */
static int wav_parse_fmt_tag(AVFormatContext *s, int64_t size, AVStream *st)
{
    AVIOContext *pb = s->pb;
    WAVDemuxContext *wav = s->priv_data;
    int ret;

    /* parse fmt header */
    ret = ff_get_wav_header(s, pb, st->codecpar, size, wav->rifx);
    if (ret < 0)
        return ret;
    handle_stream_probing(st);

    /* NOTE(review): the embedded listing numbering skips one line here;
     * confirm against the upstream file that no statement was dropped. */

    /* timestamps are expressed in samples: time base is 1 / sample_rate */
    avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);

    return 0;
}
204 
/**
 * Parse an 'XMA2' chunk: validate its layout, read the sample rate and
 * duration, then store the whole chunk payload as extradata.
 *
 * @param s     demuxer context
 * @param size  size of the chunk payload in bytes
 * @param st    stream to fill in
 * @return 0 on success, AVERROR_INVALIDDATA on a malformed chunk, or the
 *         negative error returned by ff_get_extradata()
 */
static int wav_parse_xma2_tag(AVFormatContext *s, int64_t size, AVStream *st)
{
    AVIOContext *pb = s->pb;
    int version, num_streams, i, channels = 0, ret;

    if (size < 36)
        return AVERROR_INVALIDDATA;

    /* NOTE(review): the embedded listing numbering skips lines here;
     * confirm against the upstream file what stream setup was dropped. */

    version = avio_r8(pb);
    if (version != 3 && version != 4)
        return AVERROR_INVALIDDATA;
    num_streams = avio_r8(pb);
    /* 32 fixed bytes, 8 more unless version is 3, plus 4 bytes per stream */
    if (size != (32 + ((version==3)?0:8) + 4*num_streams))
        return AVERROR_INVALIDDATA;
    avio_skip(pb, 10);
    st->codecpar->sample_rate = avio_rb32(pb);
    if (version == 4)
        avio_skip(pb, 8);
    avio_skip(pb, 4);
    st->duration = avio_rb32(pb);
    avio_skip(pb, 8);

    /* each 4-byte stream record starts with a byte that is summed into
     * channels; the other 3 bytes are skipped */
    for (i = 0; i < num_streams; i++) {
        channels += avio_r8(pb);
        avio_skip(pb, 3);
    }

    /* NOTE(review): nothing visible here stores `channels` into ch_layout;
     * the listing numbering skips lines at this point, so verify upstream. */
    if (st->codecpar->ch_layout.nb_channels <= 0 || st->codecpar->sample_rate <= 0)
        return AVERROR_INVALIDDATA;

    avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);

    /* exactly `size` bytes were consumed above (see the size check), so
     * this rewinds to the start of the payload before copying it */
    avio_seek(pb, -size, SEEK_CUR);
    if ((ret = ff_get_extradata(s, st->codecpar, pb, size)) < 0)
        return ret;

    return 0;
}
250 
251 static inline int wav_parse_bext_string(AVFormatContext *s, const char *key,
252  int length)
253 {
254  char temp[257];
255  int ret;
256 
257  av_assert0(length < sizeof(temp));
258  if ((ret = ffio_read_size(s->pb, temp, length)) < 0)
259  return ret;
260 
261  temp[length] = 0;
262 
263  if (strlen(temp))
264  return av_dict_set(&s->metadata, key, temp, 0);
265 
266  return 0;
267 }
268 
269 static int wav_parse_bext_tag(AVFormatContext *s, int64_t size)
270 {
271  char temp[131], *coding_history;
272  int ret, x;
273  uint64_t time_reference;
274  int64_t umid_parts[8], umid_mask = 0;
275 
276  if ((ret = wav_parse_bext_string(s, "description", 256)) < 0 ||
277  (ret = wav_parse_bext_string(s, "originator", 32)) < 0 ||
278  (ret = wav_parse_bext_string(s, "originator_reference", 32)) < 0 ||
279  (ret = wav_parse_bext_string(s, "origination_date", 10)) < 0 ||
280  (ret = wav_parse_bext_string(s, "origination_time", 8)) < 0)
281  return ret;
282 
283  time_reference = avio_rl64(s->pb);
284  snprintf(temp, sizeof(temp), "%"PRIu64, time_reference);
285  if ((ret = av_dict_set(&s->metadata, "time_reference", temp, 0)) < 0)
286  return ret;
287 
288  /* check if version is >= 1, in which case an UMID may be present */
289  if (avio_rl16(s->pb) >= 1) {
290  for (x = 0; x < 8; x++)
291  umid_mask |= umid_parts[x] = avio_rb64(s->pb);
292 
293  if (umid_mask) {
294  /* the string formatting below is per SMPTE 330M-2004 Annex C */
295  if (umid_parts[4] == 0 && umid_parts[5] == 0 &&
296  umid_parts[6] == 0 && umid_parts[7] == 0) {
297  /* basic UMID */
298  snprintf(temp, sizeof(temp),
299  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
300  umid_parts[0], umid_parts[1],
301  umid_parts[2], umid_parts[3]);
302  } else {
303  /* extended UMID */
304  snprintf(temp, sizeof(temp),
305  "0x%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64
306  "%016"PRIX64"%016"PRIX64"%016"PRIX64"%016"PRIX64,
307  umid_parts[0], umid_parts[1],
308  umid_parts[2], umid_parts[3],
309  umid_parts[4], umid_parts[5],
310  umid_parts[6], umid_parts[7]);
311  }
312 
313  if ((ret = av_dict_set(&s->metadata, "umid", temp, 0)) < 0)
314  return ret;
315  }
316 
317  avio_skip(s->pb, 190);
318  } else
319  avio_skip(s->pb, 254);
320 
321  if (size > 602) {
322  /* CodingHistory present */
323  size -= 602;
324 
325  if (!(coding_history = av_malloc(size + 1)))
326  return AVERROR(ENOMEM);
327 
328  if ((ret = ffio_read_size(s->pb, coding_history, size)) < 0) {
329  av_free(coding_history);
330  return ret;
331  }
332 
333  coding_history[size] = 0;
334  if ((ret = av_dict_set(&s->metadata, "coding_history", coding_history,
336  return ret;
337  }
338 
339  return 0;
340 }
341 
/*
 * Key pairs handed to ff_metadata_conv_ctx() by the header readers.
 * NOTE(review): presumably { native key, generic key } per AVMetadataConv;
 * confirm the field order in metadata.h.
 */
static const AVMetadataConv wav_metadata_conv[] = {
    { "description", "comment" },
    { "originator", "encoded_by" },
    { "origination_date", "date" },
    { "origination_time", "creation_time" },
    { 0 }, /* table terminator */
};
349 
350 /* wav input */
351 static int wav_read_header(AVFormatContext *s)
352 {
353  int64_t size, av_uninit(data_size);
354  int64_t sample_count = 0;
355  int rf64 = 0, bw64 = 0;
356  uint32_t tag;
357  AVIOContext *pb = s->pb;
358  AVStream *st = NULL;
359  WAVDemuxContext *wav = s->priv_data;
360  int ret, got_fmt = 0, got_xma2 = 0;
361  int64_t next_tag_ofs, data_ofs = -1;
362 
363  wav->unaligned = avio_tell(s->pb) & 1;
364 
365  wav->smv_data_ofs = -1;
366 
367  /* read chunk ID */
368  tag = avio_rl32(pb);
369  switch (tag) {
370  case MKTAG('R', 'I', 'F', 'F'):
371  break;
372  case MKTAG('R', 'I', 'F', 'X'):
373  wav->rifx = 1;
374  break;
375  case MKTAG('R', 'F', '6', '4'):
376  rf64 = 1;
377  break;
378  case MKTAG('B', 'W', '6', '4'):
379  bw64 = 1;
380  break;
381  default:
382  av_log(s, AV_LOG_ERROR, "invalid start code %s in RIFF header\n",
383  av_fourcc2str(tag));
384  return AVERROR_INVALIDDATA;
385  }
386 
387  /* read chunk size */
388  avio_rl32(pb);
389 
390  /* read format */
391  if (avio_rl32(pb) != MKTAG('W', 'A', 'V', 'E')) {
392  av_log(s, AV_LOG_ERROR, "invalid format in RIFF header\n");
393  return AVERROR_INVALIDDATA;
394  }
395 
396  if (rf64 || bw64) {
397  if (avio_rl32(pb) != MKTAG('d', 's', '6', '4'))
398  return AVERROR_INVALIDDATA;
399  size = avio_rl32(pb);
400  if (size < 24)
401  return AVERROR_INVALIDDATA;
402  avio_rl64(pb); /* RIFF size */
403 
404  data_size = avio_rl64(pb);
405  sample_count = avio_rl64(pb);
406 
407  if (data_size < 0 || sample_count < 0) {
408  av_log(s, AV_LOG_ERROR, "negative data_size and/or sample_count in "
409  "ds64: data_size = %"PRId64", sample_count = %"PRId64"\n",
410  data_size, sample_count);
411  return AVERROR_INVALIDDATA;
412  }
413  avio_skip(pb, size - 24); /* skip rest of ds64 chunk */
414 
415  }
416 
417  /* Create the audio stream now so that its index is always zero */
418  st = avformat_new_stream(s, NULL);
419  if (!st)
420  return AVERROR(ENOMEM);
421 
422  for (;;) {
423  AVStream *vst;
424  size = next_tag(pb, &tag, wav->rifx);
425  next_tag_ofs = avio_tell(pb) + size;
426 
427  if (avio_feof(pb))
428  break;
429 
430  switch (tag) {
431  case MKTAG('f', 'm', 't', ' '):
432  /* only parse the first 'fmt ' tag found */
433  if (!got_xma2 && !got_fmt && (ret = wav_parse_fmt_tag(s, size, st)) < 0) {
434  return ret;
435  } else if (got_fmt)
436  av_log(s, AV_LOG_WARNING, "found more than one 'fmt ' tag\n");
437 
438  got_fmt = 1;
439  break;
440  case MKTAG('X', 'M', 'A', '2'):
441  /* only parse the first 'XMA2' tag found */
442  if (!got_fmt && !got_xma2 && (ret = wav_parse_xma2_tag(s, size, st)) < 0) {
443  return ret;
444  } else if (got_xma2)
445  av_log(s, AV_LOG_WARNING, "found more than one 'XMA2' tag\n");
446 
447  got_xma2 = 1;
448  break;
449  case MKTAG('d', 'a', 't', 'a'):
450  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) && !got_fmt && !got_xma2) {
452  "found no 'fmt ' tag before the 'data' tag\n");
453  return AVERROR_INVALIDDATA;
454  }
455 
456  if (rf64 || bw64) {
457  next_tag_ofs = wav->data_end = av_sat_add64(avio_tell(pb), data_size);
458  } else if (size != 0xFFFFFFFF) {
459  data_size = size;
460  next_tag_ofs = wav->data_end = size ? next_tag_ofs : INT64_MAX;
461  } else {
462  av_log(s, AV_LOG_WARNING, "Ignoring maximum wav data size, "
463  "file may be invalid\n");
464  data_size = 0;
465  next_tag_ofs = wav->data_end = INT64_MAX;
466  }
467 
468  data_ofs = avio_tell(pb);
469 
470  /* don't look for footer metadata if we can't seek or if we don't
471  * know where the data tag ends
472  */
473  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL) || (!(rf64 && !bw64) && !size))
474  goto break_loop;
475  break;
476  case MKTAG('f', 'a', 'c', 't'):
477  if (!sample_count)
478  sample_count = (!wav->rifx ? avio_rl32(pb) : avio_rb32(pb));
479  break;
480  case MKTAG('b', 'e', 'x', 't'):
481  if ((ret = wav_parse_bext_tag(s, size)) < 0)
482  return ret;
483  break;
484  case MKTAG('S','M','V','0'):
485  if (!got_fmt) {
486  av_log(s, AV_LOG_ERROR, "found no 'fmt ' tag before the 'SMV0' tag\n");
487  return AVERROR_INVALIDDATA;
488  }
489  // SMV file, a wav file with video appended.
490  if (size != MKTAG('0','2','0','0')) {
491  av_log(s, AV_LOG_ERROR, "Unknown SMV version found\n");
492  goto break_loop;
493  }
494  av_log(s, AV_LOG_DEBUG, "Found SMV data\n");
495  wav->smv_given_first = 0;
496  vst = avformat_new_stream(s, NULL);
497  if (!vst)
498  return AVERROR(ENOMEM);
499  wav->vst = vst;
500  avio_r8(pb);
501  vst->id = 1;
504  vst->codecpar->width = avio_rl24(pb);
505  vst->codecpar->height = avio_rl24(pb);
506  if ((ret = ff_alloc_extradata(vst->codecpar, 4)) < 0) {
507  av_log(s, AV_LOG_ERROR, "Could not allocate extradata.\n");
508  return ret;
509  }
510  size = avio_rl24(pb);
511  wav->smv_data_ofs = avio_tell(pb) + (size - 5) * 3;
512  avio_rl24(pb);
513  wav->smv_block_size = avio_rl24(pb);
514  if (!wav->smv_block_size)
515  return AVERROR_INVALIDDATA;
516  avpriv_set_pts_info(vst, 32, 1, avio_rl24(pb));
517  vst->duration = avio_rl24(pb);
518  avio_rl24(pb);
519  avio_rl24(pb);
520  wav->smv_frames_per_jpeg = avio_rl24(pb);
521  if (wav->smv_frames_per_jpeg > 65536) {
522  av_log(s, AV_LOG_ERROR, "too many frames per jpeg\n");
523  return AVERROR_INVALIDDATA;
524  }
526  goto break_loop;
527  case MKTAG('L', 'I', 'S', 'T'):
528  case MKTAG('l', 'i', 's', 't'):
529  if (size < 4) {
530  av_log(s, AV_LOG_ERROR, "too short LIST tag\n");
531  return AVERROR_INVALIDDATA;
532  }
533  switch (avio_rl32(pb)) {
534  case MKTAG('I', 'N', 'F', 'O'):
535  ff_read_riff_info(s, size - 4);
536  break;
537  case MKTAG('a', 'd', 't', 'l'):
538  if (s->nb_chapters > 0) {
539  while (avio_tell(pb) < next_tag_ofs &&
540  !avio_feof(pb)) {
541  char cue_label[512];
542  unsigned id, sub_size;
543 
544  if (avio_rl32(pb) != MKTAG('l', 'a', 'b', 'l'))
545  break;
546 
547  sub_size = avio_rl32(pb);
548  if (sub_size < 5)
549  break;
550  id = avio_rl32(pb);
551  avio_get_str(pb, sub_size - 4, cue_label, sizeof(cue_label));
552  avio_skip(pb, avio_tell(pb) & 1);
553 
554  for (int i = 0; i < s->nb_chapters; i++) {
555  if (s->chapters[i]->id == id) {
556  av_dict_set(&s->chapters[i]->metadata, "title", cue_label, 0);
557  break;
558  }
559  }
560  }
561  }
562  break;
563  }
564  break;
565  case MKTAG('I', 'D', '3', ' '):
566  case MKTAG('i', 'd', '3', ' '): {
567  ID3v2ExtraMeta *id3v2_extra_meta;
568  ff_id3v2_read(s, ID3v2_DEFAULT_MAGIC, &id3v2_extra_meta, 0);
569  if (id3v2_extra_meta) {
570  ff_id3v2_parse_apic(s, id3v2_extra_meta);
571  ff_id3v2_parse_chapters(s, id3v2_extra_meta);
572  ff_id3v2_parse_priv(s, id3v2_extra_meta);
573  }
574  ff_id3v2_free_extra_meta(&id3v2_extra_meta);
575  }
576  break;
577  case MKTAG('c', 'u', 'e', ' '):
578  if (size >= 4 && got_fmt && st->codecpar->sample_rate > 0) {
579  AVRational tb = {1, st->codecpar->sample_rate};
580  unsigned nb_cues = avio_rl32(pb);
581 
582  if (size >= nb_cues * 24LL + 4LL) {
583  for (int i = 0; i < nb_cues; i++) {
584  unsigned offset, id = avio_rl32(pb);
585 
586  if (avio_feof(pb))
587  return AVERROR_INVALIDDATA;
588 
589  avio_skip(pb, 16);
590  offset = avio_rl32(pb);
591 
593  return AVERROR(ENOMEM);
594  }
595  }
596  }
597  break;
598  }
599 
600  /* seek to next tag unless we know that we'll run into EOF */
601  if ((avio_size(pb) > 0 && next_tag_ofs >= avio_size(pb)) ||
602  wav_seek_tag(wav, pb, next_tag_ofs, SEEK_SET) < 0) {
603  break;
604  }
605  }
606 
607 break_loop:
608  if (!got_fmt && !got_xma2) {
609  av_log(s, AV_LOG_ERROR, "no 'fmt ' or 'XMA2' tag found\n");
610  return AVERROR_INVALIDDATA;
611  }
612 
613  if (data_ofs < 0) {
614  av_log(s, AV_LOG_ERROR, "no 'data' tag found\n");
615  return AVERROR_INVALIDDATA;
616  }
617 
618  avio_seek(pb, data_ofs, SEEK_SET);
619 
620  if (data_size > (INT64_MAX>>3)) {
621  av_log(s, AV_LOG_WARNING, "Data size %"PRId64" is too large\n", data_size);
622  data_size = 0;
623  }
624 
625  if ( st->codecpar->bit_rate > 0 && data_size > 0
626  && st->codecpar->sample_rate > 0
627  && sample_count > 0 && st->codecpar->ch_layout.nb_channels > 1
628  && sample_count % st->codecpar->ch_layout.nb_channels == 0) {
629  if (fabs(8.0 * data_size * st->codecpar->ch_layout.nb_channels * st->codecpar->sample_rate /
630  sample_count /st->codecpar->bit_rate - 1.0) < 0.3)
631  sample_count /= st->codecpar->ch_layout.nb_channels;
632  }
633 
634  if (data_size > 0 && sample_count && st->codecpar->ch_layout.nb_channels &&
635  (data_size << 3) / sample_count / st->codecpar->ch_layout.nb_channels > st->codecpar->bits_per_coded_sample + 1) {
636  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
637  sample_count = 0;
638  }
639 
640  /* G.729 hack (for Ticket4577)
641  * FIXME: Come up with cleaner, more general solution */
642  if (st->codecpar->codec_id == AV_CODEC_ID_G729 && sample_count && (data_size << 3) > sample_count) {
643  av_log(s, AV_LOG_WARNING, "ignoring wrong sample_count %"PRId64"\n", sample_count);
644  sample_count = 0;
645  }
646 
647  if (!sample_count || av_get_exact_bits_per_sample(st->codecpar->codec_id) > 0)
648  if ( st->codecpar->ch_layout.nb_channels
649  && data_size
651  && wav->data_end <= avio_size(pb))
652  sample_count = (data_size << 3)
653  /
655 
656  if (sample_count)
657  st->duration = sample_count;
658 
661  st->codecpar->bits_per_coded_sample == 32 &&
662  st->codecpar->extradata_size == 2 &&
663  AV_RL16(st->codecpar->extradata) == 1) {
666  } else if (st->codecpar->codec_id == AV_CODEC_ID_PCM_S24LE &&
668  st->codecpar->bits_per_coded_sample == 24) {
670  } else if (st->codecpar->codec_id == AV_CODEC_ID_XMA1 ||
672  st->codecpar->block_align = 2048;
673  } else if (st->codecpar->codec_id == AV_CODEC_ID_ADPCM_MS && st->codecpar->ch_layout.nb_channels > 2 &&
674  st->codecpar->block_align < INT_MAX / st->codecpar->ch_layout.nb_channels) {
676  }
677 
678  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
680 
681  set_spdif(s, wav);
682  set_max_size(st, wav);
683 
684  return 0;
685 }
686 
687 /**
688  * Find chunk with w64 GUID by skipping over other chunks.
689  * @return the size of the found chunk
690  */
691 static int64_t find_guid(AVIOContext *pb, const uint8_t guid1[16])
692 {
693  uint8_t guid[16];
694  int64_t size;
695 
696  while (!avio_feof(pb)) {
697  avio_read(pb, guid, 16);
698  size = avio_rl64(pb);
699  if (size <= 24 || size > INT64_MAX - 8)
700  return AVERROR_INVALIDDATA;
701  if (!memcmp(guid, guid1, 16))
702  return size;
703  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
704  }
705  return AVERROR_EOF;
706 }
707 
708 static int wav_read_packet(AVFormatContext *s, AVPacket *pkt)
709 {
710  int ret, size;
711  int64_t left;
712  WAVDemuxContext *wav = s->priv_data;
713  AVStream *st = s->streams[0];
714 
715  if (CONFIG_SPDIF_DEMUXER && wav->spdif == 1)
716  return ff_spdif_read_packet(s, pkt);
717 
718  if (wav->smv_data_ofs > 0) {
719  int64_t audio_dts, video_dts;
720  AVStream *vst = wav->vst;
721 smv_retry:
724 
726  /*We always return a video frame first to get the pixel format first*/
727  wav->smv_last_stream = wav->smv_given_first ?
729  audio_dts, st->time_base) > 0 : 0;
730  wav->smv_given_first = 1;
731  }
732  wav->smv_last_stream = !wav->smv_last_stream;
733  wav->smv_last_stream |= wav->audio_eof;
734  wav->smv_last_stream &= !wav->smv_eof;
735  if (wav->smv_last_stream) {
736  uint64_t old_pos = avio_tell(s->pb);
737  uint64_t new_pos = wav->smv_data_ofs +
738  wav->smv_block * (int64_t)wav->smv_block_size;
739  if (avio_seek(s->pb, new_pos, SEEK_SET) < 0) {
740  ret = AVERROR_EOF;
741  goto smv_out;
742  }
743  size = avio_rl24(s->pb);
744  if (size > wav->smv_block_size) {
745  ret = AVERROR_EOF;
746  goto smv_out;
747  }
748  ret = av_get_packet(s->pb, pkt, size);
749  if (ret < 0)
750  goto smv_out;
751  pkt->pos -= 3;
752  pkt->pts = wav->smv_block * wav->smv_frames_per_jpeg;
754  wav->smv_block++;
755 
756  pkt->stream_index = vst->index;
757 smv_out:
758  avio_seek(s->pb, old_pos, SEEK_SET);
759  if (ret == AVERROR_EOF) {
760  wav->smv_eof = 1;
761  goto smv_retry;
762  }
763  return ret;
764  }
765  }
766 
767  left = wav->data_end - avio_tell(s->pb);
768  if (wav->ignore_length)
769  left = INT_MAX;
770  if (left <= 0) {
771  if (CONFIG_W64_DEMUXER && wav->w64)
772  left = find_guid(s->pb, ff_w64_guid_data) - 24;
773  else
774  left = find_tag(wav, s->pb, MKTAG('d', 'a', 't', 'a'));
775  if (left < 0) {
776  wav->audio_eof = 1;
777  if (wav->smv_data_ofs > 0 && !wav->smv_eof)
778  goto smv_retry;
779  return AVERROR_EOF;
780  }
781  if (INT64_MAX - left < avio_tell(s->pb))
782  return AVERROR_INVALIDDATA;
783  wav->data_end = avio_tell(s->pb) + left;
784  }
785 
786  size = wav->max_size;
787  if (st->codecpar->block_align > 1) {
788  if (size < st->codecpar->block_align)
789  size = st->codecpar->block_align;
790  size = (size / st->codecpar->block_align) * st->codecpar->block_align;
791  }
792  size = FFMIN(size, left);
793  ret = av_get_packet(s->pb, pkt, size);
794  if (ret < 0)
795  return ret;
796  pkt->stream_index = 0;
797 
798  return ret;
799 }
800 
801 static int wav_read_seek(AVFormatContext *s,
802  int stream_index, int64_t timestamp, int flags)
803 {
804  WAVDemuxContext *wav = s->priv_data;
805  AVStream *ast = s->streams[0], *vst = wav->vst;
806  wav->smv_eof = 0;
807  wav->audio_eof = 0;
808 
809  if (stream_index != 0 && (!vst || stream_index != vst->index))
810  return AVERROR(EINVAL);
811  if (wav->smv_data_ofs > 0) {
812  int64_t smv_timestamp = timestamp;
813  if (stream_index == 0)
814  smv_timestamp = av_rescale_q(timestamp, ast->time_base, vst->time_base);
815  else
816  timestamp = av_rescale_q(smv_timestamp, vst->time_base, ast->time_base);
817  if (wav->smv_frames_per_jpeg > 0) {
818  wav->smv_block = smv_timestamp / wav->smv_frames_per_jpeg;
819  }
820  }
821 
822  switch (ast->codecpar->codec_id) {
823  case AV_CODEC_ID_MP2:
824  case AV_CODEC_ID_MP3:
825  case AV_CODEC_ID_AC3:
826  case AV_CODEC_ID_DTS:
827  case AV_CODEC_ID_XMA2:
828  /* use generic seeking with dynamically generated indexes */
829  return -1;
830  default:
831  break;
832  }
833  return ff_pcm_read_seek(s, 0, timestamp, flags);
834 }
835 
/* AVClass describing the WAV demuxer's private context; exposes demux_options. */
static const AVClass wav_demuxer_class = {
    .class_name = "WAV demuxer",
    .item_name = av_default_item_name,
    .option = demux_options,
    .version = LIBAVUTIL_VERSION_INT,
};
843  .p.name = "wav",
844  .p.long_name = NULL_IF_CONFIG_SMALL("WAV / WAVE (Waveform Audio)"),
845  .p.flags = AVFMT_GENERIC_INDEX,
846  .p.codec_tag = ff_wav_codec_tags_list,
847  .p.priv_class = &wav_demuxer_class,
848  .priv_data_size = sizeof(WAVDemuxContext),
849  .read_probe = wav_probe,
850  .read_header = wav_read_header,
851  .read_packet = wav_read_packet,
852  .read_seek = wav_read_seek,
853 };
854 #endif /* CONFIG_WAV_DEMUXER */
855 
856 #if CONFIG_W64_DEMUXER
857 static int w64_probe(const AVProbeData *p)
858 {
859  if (p->buf_size <= 40)
860  return 0;
861  if (!memcmp(p->buf, ff_w64_guid_riff, 16) &&
862  !memcmp(p->buf + 24, ff_w64_guid_wave, 16))
863  return AVPROBE_SCORE_MAX;
864  else
865  return 0;
866 }
867 
868 static int w64_read_header(AVFormatContext *s)
869 {
870  int64_t size, data_ofs = 0;
871  AVIOContext *pb = s->pb;
872  WAVDemuxContext *wav = s->priv_data;
873  AVStream *st;
874  uint8_t guid[16];
875  int ret;
876 
877  avio_read(pb, guid, 16);
878  if (memcmp(guid, ff_w64_guid_riff, 16))
879  return AVERROR_INVALIDDATA;
880 
881  /* riff + wave + fmt + sizes */
882  if (avio_rl64(pb) < 16 + 8 + 16 + 8 + 16 + 8)
883  return AVERROR_INVALIDDATA;
884 
885  avio_read(pb, guid, 16);
886  if (memcmp(guid, ff_w64_guid_wave, 16)) {
887  av_log(s, AV_LOG_ERROR, "could not find wave guid\n");
888  return AVERROR_INVALIDDATA;
889  }
890 
891  wav->w64 = 1;
892 
893  st = avformat_new_stream(s, NULL);
894  if (!st)
895  return AVERROR(ENOMEM);
896 
897  while (!avio_feof(pb)) {
898  if (avio_read(pb, guid, 16) != 16)
899  break;
900  size = avio_rl64(pb);
901  if (size <= 24 || INT64_MAX - size < avio_tell(pb)) {
902  if (data_ofs)
903  break;
904  return AVERROR_INVALIDDATA;
905  }
906 
907  if (!memcmp(guid, ff_w64_guid_fmt, 16)) {
908  /* subtract chunk header size - normal wav file doesn't count it */
909  ret = ff_get_wav_header(s, pb, st->codecpar, size - 24, 0);
910  if (ret < 0)
911  return ret;
912  avio_skip(pb, FFALIGN(size, INT64_C(8)) - size);
913  if (st->codecpar->block_align &&
915  st->codecpar->bits_per_coded_sample < 128) {
916  int block_align = st->codecpar->block_align;
917 
918  block_align = FFMAX(block_align,
919  ((st->codecpar->bits_per_coded_sample + 7) / 8) *
921  if (block_align > st->codecpar->block_align) {
922  av_log(s, AV_LOG_WARNING, "invalid block_align: %d, broken file.\n",
923  st->codecpar->block_align);
924  st->codecpar->block_align = block_align;
925  }
926  }
927  avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
928  } else if (!memcmp(guid, ff_w64_guid_fact, 16)) {
929  int64_t samples;
930 
931  samples = avio_rl64(pb);
932  if (samples > 0)
933  st->duration = samples;
934  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 32);
935  } else if (!memcmp(guid, ff_w64_guid_data, 16)) {
936  wav->data_end = avio_tell(pb) + size - 24;
937 
938  data_ofs = avio_tell(pb);
939  if (!(pb->seekable & AVIO_SEEKABLE_NORMAL))
940  break;
941 
942  avio_skip(pb, size - 24);
943  } else if (!memcmp(guid, ff_w64_guid_summarylist, 16)) {
944  int64_t start, end, cur;
945  uint32_t count, chunk_size, i;
946  int64_t filesize = avio_size(s->pb);
947 
948  start = avio_tell(pb);
949  end = start + FFALIGN(size, INT64_C(8)) - 24;
950  count = avio_rl32(pb);
951 
952  for (i = 0; i < count; i++) {
953  char chunk_key[5], *value;
954 
955  if (avio_feof(pb) || (cur = avio_tell(pb)) < 0 || cur > end - 8 /* = tag + size */)
956  break;
957 
958  chunk_key[4] = 0;
959  avio_read(pb, chunk_key, 4);
960  chunk_size = avio_rl32(pb);
961  if (chunk_size == UINT32_MAX || (filesize >= 0 && chunk_size > filesize))
962  return AVERROR_INVALIDDATA;
963 
964  value = av_malloc(chunk_size + 1);
965  if (!value)
966  return AVERROR(ENOMEM);
967 
968  ret = avio_get_str16le(pb, chunk_size, value, chunk_size);
969  if (ret < 0) {
970  av_free(value);
971  return ret;
972  }
973  avio_skip(pb, chunk_size - ret);
974 
975  av_dict_set(&s->metadata, chunk_key, value, AV_DICT_DONT_STRDUP_VAL);
976  }
977 
978  avio_skip(pb, end - avio_tell(pb));
979  } else {
980  av_log(s, AV_LOG_DEBUG, "unknown guid: "FF_PRI_GUID"\n", FF_ARG_GUID(guid));
981  avio_skip(pb, FFALIGN(size, INT64_C(8)) - 24);
982  }
983  }
984 
985  if (!data_ofs)
986  return AVERROR_EOF;
987 
988  ff_metadata_conv_ctx(s, NULL, wav_metadata_conv);
990 
991  handle_stream_probing(st);
993 
994  avio_seek(pb, data_ofs, SEEK_SET);
995 
996  set_spdif(s, wav);
997  set_max_size(st, wav);
998 
999  return 0;
1000 }
1001 
/*
 * AVClass describing the W64 demuxer's private context.
 * NOTE(review): the embedded listing numbering skips one line inside this
 * initializer; confirm against the upstream file whether a member (e.g. the
 * option table) was dropped.
 */
static const AVClass w64_demuxer_class = {
    .class_name = "W64 demuxer",
    .item_name = av_default_item_name,
    .version = LIBAVUTIL_VERSION_INT,
};
1008 
/*
 * Demuxer registration for Sony Wave64.
 * Probe and header parsing are W64-specific; packet reading and seeking
 * reuse the WAV implementations, and the private context is the same
 * WAVDemuxContext.
 */
const FFInputFormat ff_w64_demuxer = {
    .p.name = "w64",
    .p.long_name = NULL_IF_CONFIG_SMALL("Sony Wave64"),
    .p.flags = AVFMT_GENERIC_INDEX,
    .p.codec_tag = ff_wav_codec_tags_list,
    .p.priv_class = &w64_demuxer_class,
    .priv_data_size = sizeof(WAVDemuxContext),
    .read_probe = w64_probe,
    .read_header = w64_read_header,
    .read_packet = wav_read_packet, /* shared with the WAV demuxer */
    .read_seek = wav_read_seek,     /* shared with the WAV demuxer */
};
1021 #endif /* CONFIG_W64_DEMUXER */
avpriv_new_chapter
AVChapter * avpriv_new_chapter(AVFormatContext *s, int64_t id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
Definition: demux_utils.c:42
WAVDemuxContext
Definition: wavdec.c:51
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:328
WAVDemuxContext::unaligned
int unaligned
Definition: wavdec.c:67
WAVDemuxContext::smv_block
int smv_block
Definition: wavdec.c:59
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:373
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:69
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:443
AVERROR
In this document, the word "frame" indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: the query_formats method should set, for each input and each output link, the list of supported formats. For video links, that means pixel format. For audio links, that means channel layout, sample format and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
opt.h
pcm.h
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:51
AV_WL32
#define AV_WL32(p, v)
Definition: intreadwrite.h:424
av_compare_ts
int av_compare_ts(int64_t ts_a, AVRational tb_a, int64_t ts_b, AVRational tb_b)
Compare two timestamps each in its own time base.
Definition: mathematics.c:147
W64_DEMUXER_OPTIONS_OFFSET
#define W64_DEMUXER_OPTIONS_OFFSET
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const struct AVCodec *c)
Add a new stream to a media file.
AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:57
WAVDemuxContext::smv_data_ofs
int64_t smv_data_ofs
Definition: wavdec.c:56
audio_dts
int64_t audio_dts
Definition: movenc.c:62
WAVDemuxContext::smv_frames_per_jpeg
int smv_frames_per_jpeg
Definition: wavdec.c:58
id3v2.h
WAVDemuxContext::max_size
int max_size
Definition: wavdec.c:64
internal.h
AVOption
AVOption.
Definition: opt.h:346
ff_id3v2_read
void ff_id3v2_read(AVFormatContext *s, const char *magic, ID3v2ExtraMeta **extra_meta, unsigned int max_search_size)
Read an ID3v2 tag, including supported extra metadata.
Definition: id3v2.c:1140
AVMetadataConv
Definition: metadata.h:34
ff_get_wav_header
int ff_get_wav_header(void *logctx, AVIOContext *pb, AVCodecParameters *par, int size, int big_endian)
Definition: riffdec.c:95
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:542
mathematics.h
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:454
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:308
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:313
avio_size
int64_t avio_size(AVIOContext *s)
Get the filesize.
Definition: aviobuf.c:323
sample_rate
sample_rate
Definition: ffmpeg_filter.c:424
WAVDemuxContext::data_end
int64_t data_end
Definition: wavdec.c:53
video_dts
int64_t video_dts
Definition: movenc.c:62
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:30
WAVDemuxContext::w64
int w64
Definition: wavdec.c:54
ff_get_extradata
int ff_get_extradata(void *logctx, AVCodecParameters *par, AVIOContext *pb, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0 and fill it from pb.
Definition: demux_utils.c:335
AVPROBE_SCORE_MAX
#define AVPROBE_SCORE_MAX
maximum score
Definition: avformat.h:463
return
these buffered frames must be flushed immediately if a new input produces new the filter must not call request_frame to get more It must just process the frame or queue it The task of requesting more frames is left to the filter s request_frame method or the application If a filter has several the filter must be ready for frames arriving randomly on any input any filter with several inputs will most likely require some kind of queuing mechanism It is perfectly acceptable to have a limited queue and to drop frames when the inputs are too unbalanced request_frame For filters that do not use the this method is called when a frame is wanted on an output For a it should directly call filter_frame on the corresponding output For a if there are queued frames already one of these frames should be pushed If the filter should request a frame on one of its repeatedly until at least one frame has been pushed Return or at least make progress towards producing a it should return
Definition: filter_design.txt:264
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: avformat.c:853
ff_w64_guid_summarylist
const uint8_t ff_w64_guid_summarylist[16]
Definition: w64.c:47
ff_wav_demuxer
const FFInputFormat ff_wav_demuxer
ffstream
static av_always_inline FFStream * ffstream(AVStream *st)
Definition: internal.h:417
read_seek
static int read_seek(AVFormatContext *ctx, int stream_index, int64_t timestamp, int flags)
Definition: libcdio.c:151
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:494
AVFMT_GENERIC_INDEX
#define AVFMT_GENERIC_INDEX
Use generic index building code.
Definition: avformat.h:480
demux_options
static const AVOption demux_options[]
Definition: wavdec.c:73
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:441
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:802
avio_rl16
unsigned int avio_rl16(AVIOContext *s)
Definition: aviobuf.c:714
ff_id3v2_parse_chapters
int ff_id3v2_parse_chapters(AVFormatContext *s, ID3v2ExtraMeta *cur)
Create chapters for all CHAP tags found in the ID3v2 header.
Definition: id3v2.c:1193
AV_DICT_DONT_STRDUP_VAL
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that's been allocated with av_malloc() or another memory allocation function.
Definition: dict.h:79
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:547
avassert.h
avio_rb32
unsigned int avio_rb32(AVIOContext *s)
Definition: aviobuf.c:761
pkt
AVPacket * pkt
Definition: movenc.c:60
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
ID3v2ExtraMeta
Definition: id3v2.h:84
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_read_callback.c:42
avio_get_str16le
int avio_get_str16le(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a UTF-16 string from pb and convert it to UTF-8.
FF_ARG_GUID
#define FF_ARG_GUID(g)
Definition: riff.h:109
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:198
AV_CODEC_ID_XMA1
@ AV_CODEC_ID_XMA1
Definition: codec_id.h:519
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:553
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:453
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:134
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:440
AV_CHANNEL_ORDER_UNSPEC
@ AV_CHANNEL_ORDER_UNSPEC
Only the channel count is specified, without any further information about the channel order.
Definition: channel_layout.h:112
av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:40
AV_LOG_DEBUG
#define AV_LOG_DEBUG
Stuff which is only useful for libav* developers.
Definition: log.h:201
AV_CODEC_ID_PCM_F24LE
@ AV_CODEC_ID_PCM_F24LE
Definition: codec_id.h:362
channels
channels
Definition: aptx.h:31
AV_RL16
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_RL16
Definition: bytestream.h:94
av_rescale_q
int64_t av_rescale_q(int64_t a, AVRational bq, AVRational cq)
Rescale a 64-bit integer by 2 rational numbers.
Definition: mathematics.c:142
ff_read_riff_info
int ff_read_riff_info(AVFormatContext *s, int64_t size)
Definition: riffdec.c:243
key
const char * key
Definition: hwcontext_opencl.c:189
if
if(ret)
Definition: filter_design.txt:179
FFStream::need_parsing
enum AVStreamParseType need_parsing
Definition: internal.h:386
AVFormatContext
Format I/O context.
Definition: avformat.h:1255
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:766
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:550
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:66
fabs
static __device__ float fabs(float a)
Definition: cuda_runtime.h:182
AVStream::time_base
AVRational time_base
This is the fundamental unit of time (in seconds) in terms of which frame timestamps are represented.
Definition: avformat.h:782
NULL
#define NULL
Definition: coverity.c:32
ff_pcm_default_packet_size
int ff_pcm_default_packet_size(AVCodecParameters *par)
Definition: pcm.c:29
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:237
ff_id3v2_parse_apic
int ff_id3v2_parse_apic(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Create a stream for each APIC (attached picture) extracted from the ID3v2 header.
Definition: id3v2.c:1162
avio_rb64
uint64_t avio_rb64(AVIOContext *s)
Definition: aviobuf.c:908
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:451
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:180
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:461
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:184
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
ff_w64_guid_fmt
const uint8_t ff_w64_guid_fmt[16]
Definition: w64.c:33
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:73
WAVDemuxContext::smv_last_stream
int smv_last_stream
Definition: wavdec.c:60
av_get_exact_bits_per_sample
int av_get_exact_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:454
avio_rl32
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:730
AVIOContext
Bytestream IO Context.
Definition: avio.h:160
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:340
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
DEC
#define DEC
Definition: wavdec.c:72
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:261
FFStream
Definition: internal.h:193
ff_spdif_probe
int ff_spdif_probe(const uint8_t *p_buf, int buf_size, enum AVCodecID *codec)
Definition: spdifdec.c:122
WAVDemuxContext::smv_eof
int smv_eof
Definition: wavdec.c:61
AV_CODEC_ID_DTS
@ AV_CODEC_ID_DTS
Definition: codec_id.h:444
avio_get_str
int avio_get_str(AVIOContext *pb, int maxlen, char *buf, int buflen)
Read a string from pb into buf.
Definition: aviobuf.c:866
size
int size
Definition: twinvq_data.h:10344
AV_CODEC_ID_SMVJPEG
@ AV_CODEC_ID_SMVJPEG
Definition: codec_id.h:264
avio.h
ID3v2_DEFAULT_MAGIC
#define ID3v2_DEFAULT_MAGIC
Default magic bytes for ID3v2 header: "ID3".
Definition: id3v2.h:35
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:248
ff_riff_info_conv
const AVMetadataConv ff_riff_info_conv[]
Definition: riff.c:621
FFInputFormat::p
AVInputFormat p
The public AVInputFormat.
Definition: demux.h:41
avio_r8
int avio_r8(AVIOContext *s)
Definition: aviobuf.c:603
ffio_ensure_seekback
int ffio_ensure_seekback(AVIOContext *s, int64_t buf_size)
Ensures that the requested seekback buffer size will be available.
Definition: aviobuf.c:1023
offset
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf offset
Definition: writing_filters.txt:86
version
version
Definition: libkvazaar.c:321
FFStream::probe_packets
int probe_packets
Number of packets to buffer for codec probing.
Definition: internal.h:383
ff_spdif_read_packet
int ff_spdif_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: spdifdec.c:189
filesize
static int64_t filesize(AVIOContext *pb)
Definition: ffmpeg_mux.c:51
set_max_size
static void set_max_size(AVStream *st, WAVDemuxContext *wav)
Definition: wavdec.c:82
WAVDemuxContext::rifx
int rifx
Definition: wavdec.c:68
log.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will be presented to the user.
Definition: packet.h:517
avio_rl24
unsigned int avio_rl24(AVIOContext *s)
Definition: aviobuf.c:722
avio_internal.h
WAVDemuxContext::audio_eof
int audio_eof
Definition: wavdec.c:62
ff_w64_guid_wave
const uint8_t ff_w64_guid_wave[16]
Definition: w64.c:28
AVCodecParameters::height
int height
Definition: codec_par.h:135
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:191
WAVDemuxContext::smv_block_size
int smv_block_size
Definition: wavdec.c:57
value
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf default value
Definition: writing_filters.txt:86
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
tb
#define tb
Definition: regdef.h:68
demux.h
AV_CODEC_ID_PCM_F16LE
@ AV_CODEC_ID_PCM_F16LE
Definition: codec_id.h:361
ff_w64_guid_fact
const uint8_t ff_w64_guid_fact[16]
Definition: w64.c:38
len
int len
Definition: vorbis_enc_data.h:426
av_get_packet
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
Definition: utils.c:104
av_uninit
#define av_uninit(x)
Definition: attributes.h:154
tag
uint32_t tag
Definition: movenc.c:1787
AVStream::id
int id
Format-specific stream ID.
Definition: avformat.h:755
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:743
WAVDemuxContext::spdif
int spdif
Definition: wavdec.c:65
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:231
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass is associated.
Definition: log.h:71
ff_pcm_read_seek
int ff_pcm_read_seek(AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
Definition: pcm.c:73
metadata.h
pos
unsigned int pos
Definition: spdifenc.c:414
avformat.h
dict.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
id
enum AVCodecID id
Definition: dts2pts.c:365
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
av_sat_add64
#define av_sat_add64
Definition: common.h:141
set_spdif
static void set_spdif(AVFormatContext *s, WAVDemuxContext *wav)
Definition: wavdec.c:90
AVStream::index
int index
stream index in AVFormatContext
Definition: avformat.h:749
WAVDemuxContext::smv_given_first
int smv_given_first
Definition: wavdec.c:66
AV_CODEC_ID_G729
@ AV_CODEC_ID_G729
Definition: codec_id.h:493
w64.h
WAVDemuxContext::ignore_length
int ignore_length
Definition: wavdec.c:63
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
AV_OPT_TYPE_INT
@ AV_OPT_TYPE_INT
Definition: opt.h:235
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:433
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:612
temp
else temp
Definition: vf_mcdeint.c:263
AVSTREAM_PARSE_FULL_RAW
@ AVSTREAM_PARSE_FULL_RAW
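full parsing and repack with timestamp and position generation by parser for raw; this assumes that each packet in the file contains no demuxer level headers and just codec level data, otherwise position generation would fail.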
Definition: avformat.h:597
OFFSET
#define OFFSET(x)
Definition: wavdec.c:71
samples
Filter the word “frame” indicates either a video frame or a group of audio samples
Definition: filter_design.txt:8
AVPacket::stream_index
int stream_index
Definition: packet.h:526
avio_skip
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:318
AVMEDIA_TYPE_VIDEO
@ AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201
read_probe
static int read_probe(const AVProbeData *p)
Definition: cdg.c:30
ff_w64_guid_data
const uint8_t ff_w64_guid_data[16]
Definition: w64.c:42
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:336
AVCodecParameters::bits_per_coded_sample
int bits_per_coded_sample
The number of bits per sample in the coded words.
Definition: codec_par.h:110
mem.h
find_guid
static const GUIDParseTable * find_guid(ff_asf_guid guid)
Definition: asfdec_o.c:1546
AV_CODEC_ID_XMA2
@ AV_CODEC_ID_XMA2
Definition: codec_id.h:520
FFStream::request_probe
int request_probe
stream probing state -1 -> probing finished 0 -> no probing requested rest -> perform probing with request_probe being the minimum score to accept.
Definition: internal.h:263
ff_w64_guid_riff
const uint8_t ff_w64_guid_riff[16]
Definition: w64.c:23
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:55
AVPacket
This structure stores compressed data.
Definition: packet.h:501
AV_OPT_TYPE_BOOL
@ AV_OPT_TYPE_BOOL
Definition: opt.h:251
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:88
riff.h
ff_id3v2_free_extra_meta
void ff_id3v2_free_extra_meta(ID3v2ExtraMeta **extra_meta)
Free memory allocated parsing special (non-text) metadata.
Definition: id3v2.c:1146
FFStream::cur_dts
int64_t cur_dts
Definition: internal.h:410
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:544
FFInputFormat
Definition: demux.h:37
avio_rl64
uint64_t avio_rl64(AVIOContext *s)
Definition: aviobuf.c:738
int32_t
int32_t
Definition: audioconvert.c:56
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:474
AVCodecParameters::bit_rate
int64_t bit_rate
The average bitrate of the encoded data (in bits per second).
Definition: codec_par.h:97
ff_id3v2_parse_priv
int ff_id3v2_parse_priv(AVFormatContext *s, ID3v2ExtraMeta *extra_meta)
Add metadata for all PRIV tags in the ID3v2 header.
Definition: id3v2.c:1258
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
MKTAG
#define MKTAG(a, b, c, d)
Definition: macros.h:55
ffio_read_size
int ffio_read_size(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:662
FF_SANE_NB_CHANNELS
#define FF_SANE_NB_CHANNELS
Definition: internal.h:37
snprintf
#define snprintf
Definition: snprintf.h:34
WAVDemuxContext::vst
AVStream * vst
Definition: wavdec.c:55
ff_w64_demuxer
const FFInputFormat ff_w64_demuxer
spdif.h
FF_PRI_GUID
#define FF_PRI_GUID
Definition: riff.h:105
ff_wav_codec_tags_list
const AVCodecTag *const ff_wav_codec_tags_list[]
ff_metadata_conv_ctx
void ff_metadata_conv_ctx(AVFormatContext *ctx, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: metadata.c:59
av_fourcc2str
#define av_fourcc2str(fourcc)
Definition: avutil.h:345
ff_alloc_extradata
int ff_alloc_extradata(AVCodecParameters *par, int size)
Allocate extradata with additional AV_INPUT_BUFFER_PADDING_SIZE at end which is always set to 0.
Definition: utils.c:240
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:346