FFmpeg
cafenc.c
Go to the documentation of this file.
1 /*
2  * Core Audio Format muxer
3  * Copyright (c) 2011 Carl Eugen Hoyos
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "avformat.h"
23 #include "caf.h"
24 #include "isom.h"
25 #include "avio_internal.h"
26 #include "mux.h"
27 #include "libavutil/intfloat.h"
28 #include "libavutil/dict.h"
29 
30 #define FRAME_SIZE_OFFSET 40
31 
/**
 * Private state of the CAF muxer.
 *
 * The packet-size table itself lives in the stream's priv_data; this
 * struct only tracks its capacity and fill level.
 */
typedef struct {
    int64_t data;                  ///< file offset of the 'data' chunk size field, patched in the trailer
    unsigned int size_buffer_size; ///< capacity in bytes of the packet-size table (updated by av_fast_realloc())
    int size_entries_used;         ///< bytes of the packet-size table currently filled
    int packets;                   ///< number of packets recorded in the packet-size table
} CAFContext;
38 
39 static uint32_t codec_flags(enum AVCodecID codec_id) {
40  switch (codec_id) {
43  return 1; //< kCAFLinearPCMFormatFlagIsFloat
47  return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian
50  return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian
51  default:
52  return 0;
53  }
54 }
55 
56 static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels, int block_align) {
57  switch (codec_id) {
58  case AV_CODEC_ID_PCM_S8:
71  return 1;
72  case AV_CODEC_ID_MACE3:
73  case AV_CODEC_ID_MACE6:
74  return 6;
76  return 64;
77  case AV_CODEC_ID_AMR_NB:
78  case AV_CODEC_ID_GSM:
79  case AV_CODEC_ID_ILBC:
80  case AV_CODEC_ID_QCELP:
81  return 160;
82  case AV_CODEC_ID_GSM_MS:
83  return 320;
84  case AV_CODEC_ID_MP1:
85  return 384;
86  case AV_CODEC_ID_MP2:
87  case AV_CODEC_ID_MP3:
88  return 1152;
89  case AV_CODEC_ID_AC3:
90  return 1536;
91  case AV_CODEC_ID_QDM2:
92  case AV_CODEC_ID_QDMC:
93  return 2048 * channels;
94  case AV_CODEC_ID_ALAC:
95  return 4096;
97  return (block_align - 4 * channels) * 8 / (4 * channels) + 1;
99  return (block_align - 7 * channels) * 2 / channels + 2;
100  default:
101  return 0;
102  }
103 }
104 
106 {
107  AVIOContext *pb = s->pb;
108  AVCodecParameters *par = s->streams[0]->codecpar;
109  CAFContext *caf = s->priv_data;
110  AVDictionaryEntry *t = NULL;
111  unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, par->codec_id);
112  int64_t chunk_size = 0;
113  int frame_size = par->frame_size;
114 
115  if (s->nb_streams != 1) {
116  av_log(s, AV_LOG_ERROR, "CAF files have exactly one stream\n");
117  return AVERROR(EINVAL);
118  }
119 
120  switch (par->codec_id) {
121  case AV_CODEC_ID_AAC:
122  av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n");
123  return AVERROR_PATCHWELCOME;
124  }
125 
126  if (par->codec_id == AV_CODEC_ID_OPUS && par->ch_layout.nb_channels > 2) {
127  av_log(s, AV_LOG_ERROR, "Only mono and stereo are supported for Opus\n");
128  return AVERROR_INVALIDDATA;
129  }
130 
131  if (!codec_tag) {
132  av_log(s, AV_LOG_ERROR, "unsupported codec\n");
133  return AVERROR_INVALIDDATA;
134  }
135 
136  if (!par->block_align && !(pb->seekable & AVIO_SEEKABLE_NORMAL)) {
137  av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n");
138  return AVERROR_INVALIDDATA;
139  }
140 
141  if (par->codec_id != AV_CODEC_ID_MP3 || frame_size != 576)
143 
144  ffio_wfourcc(pb, "caff"); //< mFileType
145  avio_wb16(pb, 1); //< mFileVersion
146  avio_wb16(pb, 0); //< mFileFlags
147 
148  ffio_wfourcc(pb, "desc"); //< Audio Description chunk
149  avio_wb64(pb, 32); //< mChunkSize
150  avio_wb64(pb, av_double2int(par->sample_rate)); //< mSampleRate
151  avio_wl32(pb, codec_tag); //< mFormatID
152  avio_wb32(pb, codec_flags(par->codec_id)); //< mFormatFlags
153  avio_wb32(pb, par->block_align); //< mBytesPerPacket
154  avio_wb32(pb, frame_size); //< mFramesPerPacket
155  avio_wb32(pb, par->ch_layout.nb_channels); //< mChannelsPerFrame
156  avio_wb32(pb, av_get_bits_per_sample(par->codec_id)); //< mBitsPerChannel
157 
159  ffio_wfourcc(pb, "chan");
160  avio_wb64(pb, 12);
161  ff_mov_write_chan(pb, par->ch_layout.u.mask);
162  }
163 
164  if (par->codec_id == AV_CODEC_ID_ALAC) {
165  ffio_wfourcc(pb, "kuki");
166  avio_wb64(pb, 12 + par->extradata_size);
167  avio_write(pb, "\0\0\0\14frmaalac", 12);
168  avio_write(pb, par->extradata, par->extradata_size);
169  } else if (par->codec_id == AV_CODEC_ID_AMR_NB) {
170  ffio_wfourcc(pb, "kuki");
171  avio_wb64(pb, 29);
172  avio_write(pb, "\0\0\0\14frmasamr", 12);
173  avio_wb32(pb, 0x11); /* size */
174  avio_write(pb, "samrFFMP", 8);
175  avio_w8(pb, 0); /* decoder version */
176 
177  avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
178  avio_w8(pb, 0x00); /* Mode change period (no restriction) */
179  avio_w8(pb, 0x01); /* Frames per sample */
180  } else if (par->codec_id == AV_CODEC_ID_QDM2 || par->codec_id == AV_CODEC_ID_QDMC) {
181  ffio_wfourcc(pb, "kuki");
182  avio_wb64(pb, par->extradata_size);
183  avio_write(pb, par->extradata, par->extradata_size);
184  }
185 
187  if (av_dict_count(s->metadata)) {
188  ffio_wfourcc(pb, "info"); //< Information chunk
189  while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
190  chunk_size += strlen(t->key) + strlen(t->value) + 2;
191  }
192  avio_wb64(pb, chunk_size + 4);
193  avio_wb32(pb, av_dict_count(s->metadata));
194  t = NULL;
195  while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
196  avio_put_str(pb, t->key);
197  avio_put_str(pb, t->value);
198  }
199  }
200 
201  ffio_wfourcc(pb, "data"); //< Audio Data chunk
202  caf->data = avio_tell(pb);
203  avio_wb64(pb, -1); //< mChunkSize
204  avio_wb32(pb, 0); //< mEditCount
205 
206  return 0;
207 }
208 
210 {
211  CAFContext *caf = s->priv_data;
212  AVStream *const st = s->streams[0];
213 
214  if (!st->codecpar->block_align) {
215  uint8_t *pkt_sizes;
216  int i, alloc_size = caf->size_entries_used + 5U;
217  if (alloc_size < 0)
218  return AVERROR(ERANGE);
219 
220  pkt_sizes = av_fast_realloc(st->priv_data,
221  &caf->size_buffer_size,
222  alloc_size);
223  if (!pkt_sizes)
224  return AVERROR(ENOMEM);
225  st->priv_data = pkt_sizes;
226  for (i = 4; i > 0; i--) {
227  unsigned top = pkt->size >> i * 7;
228  if (top)
229  pkt_sizes[caf->size_entries_used++] = 128 | top;
230  }
231  pkt_sizes[caf->size_entries_used++] = pkt->size & 127;
232  caf->packets++;
233  }
234  avio_write(s->pb, pkt->data, pkt->size);
235  return 0;
236 }
237 
239 {
240  CAFContext *caf = s->priv_data;
241  AVIOContext *pb = s->pb;
242  AVStream *st = s->streams[0];
243  AVCodecParameters *par = st->codecpar;
244 
245  if (pb->seekable & AVIO_SEEKABLE_NORMAL) {
246  int64_t file_size = avio_tell(pb);
247 
248  avio_seek(pb, caf->data, SEEK_SET);
249  avio_wb64(pb, file_size - caf->data - 8);
250  if (!par->block_align) {
251  int packet_size = samples_per_packet(par->codec_id, par->ch_layout.nb_channels, par->block_align);
252  if (!packet_size) {
253  packet_size = st->duration / (caf->packets - 1);
254  avio_seek(pb, FRAME_SIZE_OFFSET, SEEK_SET);
255  avio_wb32(pb, packet_size);
256  }
257  avio_seek(pb, file_size, SEEK_SET);
258  ffio_wfourcc(pb, "pakt");
259  avio_wb64(pb, caf->size_entries_used + 24U);
260  avio_wb64(pb, caf->packets); ///< mNumberPackets
261  avio_wb64(pb, caf->packets * packet_size); ///< mNumberValidFrames
262  avio_wb32(pb, 0); ///< mPrimingFrames
263  avio_wb32(pb, 0); ///< mRemainderFrames
264  avio_write(pb, st->priv_data, caf->size_entries_used);
265  }
266  }
267  return 0;
268 }
269 
271  .name = "caf",
272  .long_name = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"),
273  .mime_type = "audio/x-caf",
274  .extensions = "caf",
275  .priv_data_size = sizeof(CAFContext),
276  .audio_codec = AV_CODEC_ID_PCM_S16BE,
277  .video_codec = AV_CODEC_ID_NONE,
281  .codec_tag = ff_caf_codec_tags_list,
282 };
CAFContext::data
int64_t data
Definition: cafenc.c:33
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:318
AV_CODEC_ID_MACE6
@ AV_CODEC_ID_MACE6
Definition: codec_id.h:437
AV_CODEC_ID_PCM_F32BE
@ AV_CODEC_ID_PCM_F32BE
Definition: codec_id.h:338
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:75
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:363
AV_CODEC_ID_ADPCM_IMA_QT
@ AV_CODEC_ID_ADPCM_IMA_QT
Definition: codec_id.h:357
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:430
AVOutputFormat::name
const char * name
Definition: avformat.h:510
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
ffio_wfourcc
static av_always_inline void ffio_wfourcc(AVIOContext *pb, const uint8_t *s)
Definition: avio_internal.h:116
caf.h
AVCodecParameters
This struct describes the properties of an encoded stream.
Definition: codec_par.h:53
caf_write_packet
static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)
Definition: cafenc.c:209
AVStream::priv_data
void * priv_data
Definition: avformat.h:964
av_dict_count
int av_dict_count(const AVDictionary *m)
Get number of entries in dictionary.
Definition: dict.c:35
AVPacket::data
uint8_t * data
Definition: packet.h:374
AV_CODEC_ID_ALAC
@ AV_CODEC_ID_ALAC
Definition: codec_id.h:443
AV_DICT_IGNORE_SUFFIX
#define AV_DICT_IGNORE_SUFFIX
Return first entry in a dictionary whose first part corresponds to the search key,...
Definition: dict.h:68
AV_CODEC_ID_AMR_NB
@ AV_CODEC_ID_AMR_NB
Definition: codec_id.h:410
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:295
CAFContext::size_entries_used
int size_entries_used
Definition: cafenc.c:35
AVChannelLayout::mask
uint64_t mask
This member must be used for AV_CHANNEL_ORDER_NATIVE, and may be used for AV_CHANNEL_ORDER_AMBISONIC ...
Definition: channel_layout.h:322
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:300
intfloat.h
AV_CODEC_ID_PCM_S16BE
@ AV_CODEC_ID_PCM_S16BE
Definition: codec_id.h:319
U
#define U(x)
Definition: vp56_arith.h:37
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:505
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:428
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:998
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:586
AV_CODEC_ID_PCM_S8
@ AV_CODEC_ID_PCM_S8
Definition: codec_id.h:322
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
AV_CODEC_ID_MACE3
@ AV_CODEC_ID_MACE3
Definition: codec_id.h:436
AV_CHANNEL_ORDER_NATIVE
@ AV_CHANNEL_ORDER_NATIVE
The native channel order, i.e.
Definition: channel_layout.h:112
AVCodecParameters::frame_size
int frame_size
Audio only.
Definition: codec_par.h:188
av_dict_get
AVDictionaryEntry * av_dict_get(const AVDictionary *m, const char *key, const AVDictionaryEntry *prev, int flags)
Get a dictionary entry with matching key.
Definition: dict.c:40
av_fast_realloc
void * av_fast_realloc(void *ptr, unsigned int *size, size_t min_size)
Reallocate the given buffer if it is not large enough, otherwise do nothing.
Definition: mem.c:505
s
#define s(width, name)
Definition: cbs_vp9.c:256
AVDictionaryEntry::key
char * key
Definition: dict.h:80
frame_size
int frame_size
Definition: mxfenc.c:2201
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:427
channels
channels
Definition: aptx.h:32
AV_CODEC_ID_PCM_MULAW
@ AV_CODEC_ID_PCM_MULAW
Definition: codec_id.h:324
codec_id
enum AVCodecID codec_id
Definition: vaapi_decode.c:371
caf_write_header
static int caf_write_header(AVFormatContext *s)
Definition: cafenc.c:105
AVFormatContext
Format I/O context.
Definition: avformat.h:1213
AV_CODEC_ID_PCM_ALAW
@ AV_CODEC_ID_PCM_ALAW
Definition: codec_id.h:325
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1108
AVChannelLayout::u
union AVChannelLayout::@296 u
Details about which channels are present in this layout.
samples_per_packet
static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels, int block_align)
Definition: cafenc.c:56
NULL
#define NULL
Definition: coverity.c:32
AVERROR_PATCHWELCOME
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
Definition: error.h:64
isom.h
write_trailer
static int write_trailer(AVFormatContext *s1)
Definition: v4l2enc.c:100
avio_w8
void avio_w8(AVIOContext *s, int b)
Definition: aviobuf.c:210
AV_CODEC_ID_QDM2
@ AV_CODEC_ID_QDM2
Definition: codec_id.h:446
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:212
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:177
AV_CODEC_ID_GSM
@ AV_CODEC_ID_GSM
as in Berlin toast format
Definition: codec_id.h:445
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:47
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:79
AV_CODEC_ID_AAC
@ AV_CODEC_ID_AAC
Definition: codec_id.h:429
AV_CODEC_ID_QCELP
@ AV_CODEC_ID_QCELP
Definition: codec_id.h:451
AVIOContext
Bytestream IO Context.
Definition: avio.h:162
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:330
AVPacket::size
int size
Definition: packet.h:375
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:117
ff_caf_muxer
const AVOutputFormat ff_caf_muxer
Definition: cafenc.c:270
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:263
ff_standardize_creation_time
int ff_standardize_creation_time(AVFormatContext *s)
Standardize creation_time metadata in AVFormatContext to an ISO-8601 timestamp string.
Definition: mux_utils.c:169
FRAME_SIZE_OFFSET
#define FRAME_SIZE_OFFSET
Definition: cafenc.c:30
AV_CODEC_ID_QDMC
@ AV_CODEC_ID_QDMC
Definition: codec_id.h:477
AV_CODEC_ID_OPUS
@ AV_CODEC_ID_OPUS
Definition: codec_id.h:487
avio_write
void avio_write(AVIOContext *s, const unsigned char *buf, int size)
Definition: aviobuf.c:232
avio_wb32
void avio_wb32(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:394
avio_wl32
void avio_wl32(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:386
av_double2int
static av_always_inline uint64_t av_double2int(double f)
Reinterpret a double as a 64-bit integer.
Definition: intfloat.h:70
AV_CODEC_ID_NONE
@ AV_CODEC_ID_NONE
Definition: codec_id.h:48
AVOutputFormat
Definition: avformat.h:509
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:269
avio_internal.h
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:184
AV_CODEC_ID_PCM_F64BE
@ AV_CODEC_ID_PCM_F64BE
Definition: codec_id.h:340
AV_CODEC_ID_PCM_S32BE
@ AV_CODEC_ID_PCM_S32BE
Definition: codec_id.h:327
ff_codec_caf_tags
const AVCodecTag ff_codec_caf_tags[]
Known codec tags for CAF.
Definition: caf.c:34
caf_write_trailer
static int caf_write_trailer(AVFormatContext *s)
Definition: cafenc.c:238
AV_CODEC_ID_GSM_MS
@ AV_CODEC_ID_GSM_MS
Definition: codec_id.h:457
AVStream
Stream structure.
Definition: avformat.h:948
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:260
avformat.h
dict.h
ff_caf_codec_tags_list
const AVCodecTag *const ff_caf_codec_tags_list[]
Definition: caf.c:82
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
ff_codec_get_tag
unsigned int ff_codec_get_tag(const AVCodecTag *tags, enum AVCodecID id)
Definition: utils.c:134
CAFContext::packets
int packets
Definition: cafenc.c:36
avio_wb64
void avio_wb64(AVIOContext *s, uint64_t val)
Definition: aviobuf.c:460
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:326
AV_CODEC_ID_PCM_F64LE
@ AV_CODEC_ID_PCM_F64LE
Definition: codec_id.h:341
AVDictionaryEntry
Definition: dict.h:79
CAFContext
Definition: cafenc.c:32
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:61
AVPacket
This structure stores compressed data.
Definition: packet.h:351
AV_CODEC_ID_ADPCM_IMA_WAV
@ AV_CODEC_ID_ADPCM_IMA_WAV
Definition: codec_id.h:358
AV_CODEC_ID_ILBC
@ AV_CODEC_ID_ILBC
Definition: codec_id.h:486
CAFContext::size_buffer_size
int size_buffer_size
Definition: cafenc.c:34
avio_wb16
void avio_wb16(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:472
AV_CODEC_ID_PCM_F32LE
@ AV_CODEC_ID_PCM_F32LE
Definition: codec_id.h:339
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
codec_flags
static uint32_t codec_flags(enum AVCodecID codec_id)
Definition: cafenc.c:39
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
AVDictionaryEntry::value
char * value
Definition: dict.h:81
write_packet
static int write_packet(AVFormatContext *s1, AVPacket *pkt)
Definition: v4l2enc.c:92
write_header
static void write_header(FFV1Context *f)
Definition: ffv1enc.c:346
ff_mov_write_chan
void ff_mov_write_chan(AVIOContext *pb, int64_t channel_layout)
Definition: isom.c:413
avio_put_str
int avio_put_str(AVIOContext *s, const char *str)
Write a NULL-terminated string.
Definition: aviobuf.c:402
AV_CODEC_ID_MP1
@ AV_CODEC_ID_MP1
Definition: codec_id.h:469
AV_CODEC_ID_PCM_S24BE
@ AV_CODEC_ID_PCM_S24BE
Definition: codec_id.h:331
mux.h