FFmpeg
cafenc.c
Go to the documentation of this file.
1 /*
2  * Core Audio Format muxer
3  * Copyright (c) 2011 Carl Eugen Hoyos
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "avformat.h"
23 #include "caf.h"
24 #include "isom.h"
25 #include "avio_internal.h"
26 #include "mux.h"
27 #include "libavutil/intfloat.h"
28 #include "libavutil/dict.h"
29 
30 #define FRAME_SIZE_OFFSET 40
31 
/**
 * Muxer-private state shared by the header, packet and trailer callbacks.
 */
typedef struct {
    int64_t data;                  ///< offset of the "data" chunk's mChunkSize field, patched by the trailer
    unsigned int size_buffer_size; ///< allocated size of the packet-size table (unsigned, as av_fast_realloc() expects)
    int size_entries_used;         ///< number of bytes of the packet-size table in use
    int packets;                   ///< number of packets recorded in the packet-size table
} CAFContext;
38 
39 static uint32_t codec_flags(enum AVCodecID codec_id) {
40  switch (codec_id) {
43  return 1; //< kCAFLinearPCMFormatFlagIsFloat
47  return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian
50  return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian
51  default:
52  return 0;
53  }
54 }
55 
56 static uint32_t samples_per_packet(const AVCodecParameters *par) {
57  enum AVCodecID codec_id = par->codec_id;
58  int channels = par->ch_layout.nb_channels, block_align = par->block_align;
59  int frame_size = par->frame_size, sample_rate = par->sample_rate;
60 
61  switch (codec_id) {
62  case AV_CODEC_ID_PCM_S8:
75  return 1;
76  case AV_CODEC_ID_MACE3:
77  case AV_CODEC_ID_MACE6:
78  return 6;
80  return 64;
81  case AV_CODEC_ID_AMR_NB:
82  case AV_CODEC_ID_GSM:
83  case AV_CODEC_ID_ILBC:
84  case AV_CODEC_ID_QCELP:
85  return 160;
86  case AV_CODEC_ID_GSM_MS:
87  return 320;
88  case AV_CODEC_ID_MP1:
89  return 384;
90  case AV_CODEC_ID_OPUS:
91  return frame_size * 48000 / sample_rate;
92  case AV_CODEC_ID_MP2:
93  case AV_CODEC_ID_MP3:
94  return 1152;
95  case AV_CODEC_ID_AC3:
96  return 1536;
97  case AV_CODEC_ID_QDM2:
98  case AV_CODEC_ID_QDMC:
99  return 2048 * channels;
100  case AV_CODEC_ID_ALAC:
101  return 4096;
103  return (block_align - 4 * channels) * 8 / (4 * channels) + 1;
105  return (block_align - 7 * channels) * 2 / channels + 2;
106  default:
107  return 0;
108  }
109 }
110 
112 {
113  AVIOContext *pb = s->pb;
114  AVCodecParameters *par = s->streams[0]->codecpar;
115  CAFContext *caf = s->priv_data;
116  const AVDictionaryEntry *t = NULL;
117  unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, par->codec_id);
118  int64_t chunk_size = 0;
119  int frame_size = par->frame_size, sample_rate = par->sample_rate;
120 
121  if (s->nb_streams != 1) {
122  av_log(s, AV_LOG_ERROR, "CAF files have exactly one stream\n");
123  return AVERROR(EINVAL);
124  }
125 
126  switch (par->codec_id) {
127  case AV_CODEC_ID_AAC:
128  av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n");
129  return AVERROR_PATCHWELCOME;
130  }
131 
132  if (par->codec_id == AV_CODEC_ID_OPUS && par->ch_layout.nb_channels > 2) {
133  av_log(s, AV_LOG_ERROR, "Only mono and stereo are supported for Opus\n");
134  return AVERROR_INVALIDDATA;
135  }
136 
137  if (!codec_tag) {
138  av_log(s, AV_LOG_ERROR, "unsupported codec\n");
139  return AVERROR_INVALIDDATA;
140  }
141 
142  if (!par->block_align && !(pb->seekable & AVIO_SEEKABLE_NORMAL)) {
143  av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n");
144  return AVERROR_INVALIDDATA;
145  }
146 
147  if (par->codec_id != AV_CODEC_ID_MP3 || frame_size != 576)
149 
150  if (par->codec_id == AV_CODEC_ID_OPUS)
151  sample_rate = 48000;
152 
153  ffio_wfourcc(pb, "caff"); //< mFileType
154  avio_wb16(pb, 1); //< mFileVersion
155  avio_wb16(pb, 0); //< mFileFlags
156 
157  ffio_wfourcc(pb, "desc"); //< Audio Description chunk
158  avio_wb64(pb, 32); //< mChunkSize
159  avio_wb64(pb, av_double2int(sample_rate)); //< mSampleRate
160  avio_wl32(pb, codec_tag); //< mFormatID
161  avio_wb32(pb, codec_flags(par->codec_id)); //< mFormatFlags
162  avio_wb32(pb, par->block_align); //< mBytesPerPacket
163  avio_wb32(pb, frame_size); //< mFramesPerPacket
164  avio_wb32(pb, par->ch_layout.nb_channels); //< mChannelsPerFrame
165  avio_wb32(pb, av_get_bits_per_sample(par->codec_id)); //< mBitsPerChannel
166 
168  ffio_wfourcc(pb, "chan");
169  avio_wb64(pb, 12);
170  ff_mov_write_chan(pb, par->ch_layout.u.mask);
171  }
172 
173  if (par->codec_id == AV_CODEC_ID_ALAC) {
174  ffio_wfourcc(pb, "kuki");
175  avio_wb64(pb, 12 + par->extradata_size);
176  avio_write(pb, "\0\0\0\14frmaalac", 12);
177  avio_write(pb, par->extradata, par->extradata_size);
178  } else if (par->codec_id == AV_CODEC_ID_AMR_NB) {
179  ffio_wfourcc(pb, "kuki");
180  avio_wb64(pb, 29);
181  avio_write(pb, "\0\0\0\14frmasamr", 12);
182  avio_wb32(pb, 0x11); /* size */
183  avio_write(pb, "samrFFMP", 8);
184  avio_w8(pb, 0); /* decoder version */
185 
186  avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
187  avio_w8(pb, 0x00); /* Mode change period (no restriction) */
188  avio_w8(pb, 0x01); /* Frames per sample */
189  } else if (par->codec_id == AV_CODEC_ID_QDM2 || par->codec_id == AV_CODEC_ID_QDMC) {
190  ffio_wfourcc(pb, "kuki");
191  avio_wb64(pb, par->extradata_size);
192  avio_write(pb, par->extradata, par->extradata_size);
193  }
194 
196  if (av_dict_count(s->metadata)) {
197  ffio_wfourcc(pb, "info"); //< Information chunk
198  while ((t = av_dict_iterate(s->metadata, t))) {
199  chunk_size += strlen(t->key) + strlen(t->value) + 2;
200  }
201  avio_wb64(pb, chunk_size + 4);
202  avio_wb32(pb, av_dict_count(s->metadata));
203  t = NULL;
204  while ((t = av_dict_iterate(s->metadata, t))) {
205  avio_put_str(pb, t->key);
206  avio_put_str(pb, t->value);
207  }
208  }
209 
210  ffio_wfourcc(pb, "data"); //< Audio Data chunk
211  caf->data = avio_tell(pb);
212  avio_wb64(pb, -1); //< mChunkSize
213  avio_wb32(pb, 0); //< mEditCount
214 
215  return 0;
216 }
217 
219 {
220  CAFContext *caf = s->priv_data;
221  AVStream *const st = s->streams[0];
222 
223  if (!st->codecpar->block_align) {
224  uint8_t *pkt_sizes;
225  int i, alloc_size = caf->size_entries_used + 5U;
226  if (alloc_size < 0)
227  return AVERROR(ERANGE);
228 
229  pkt_sizes = av_fast_realloc(st->priv_data,
230  &caf->size_buffer_size,
231  alloc_size);
232  if (!pkt_sizes)
233  return AVERROR(ENOMEM);
234  st->priv_data = pkt_sizes;
235  for (i = 4; i > 0; i--) {
236  unsigned top = pkt->size >> i * 7;
237  if (top)
238  pkt_sizes[caf->size_entries_used++] = 128 | top;
239  }
240  pkt_sizes[caf->size_entries_used++] = pkt->size & 127;
241  caf->packets++;
242  }
243  avio_write(s->pb, pkt->data, pkt->size);
244  return 0;
245 }
246 
248 {
249  CAFContext *caf = s->priv_data;
250  AVIOContext *pb = s->pb;
251  AVStream *st = s->streams[0];
252  AVCodecParameters *par = st->codecpar;
253 
254  if (pb->seekable & AVIO_SEEKABLE_NORMAL) {
255  int64_t file_size = avio_tell(pb);
256 
257  avio_seek(pb, caf->data, SEEK_SET);
258  avio_wb64(pb, file_size - caf->data - 8);
259  if (!par->block_align) {
260  int packet_size = samples_per_packet(par);
261  if (!packet_size) {
262  packet_size = st->duration / (caf->packets - 1);
263  avio_seek(pb, FRAME_SIZE_OFFSET, SEEK_SET);
264  avio_wb32(pb, packet_size);
265  }
266  avio_seek(pb, file_size, SEEK_SET);
267  ffio_wfourcc(pb, "pakt");
268  avio_wb64(pb, caf->size_entries_used + 24U);
269  avio_wb64(pb, caf->packets); ///< mNumberPackets
270  avio_wb64(pb, caf->packets * packet_size); ///< mNumberValidFrames
271  avio_wb32(pb, 0); ///< mPrimingFrames
272  avio_wb32(pb, 0); ///< mRemainderFrames
273  avio_write(pb, st->priv_data, caf->size_entries_used);
274  }
275  }
276  return 0;
277 }
278 
280  .p.name = "caf",
281  .p.long_name = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"),
282  .p.mime_type = "audio/x-caf",
283  .p.extensions = "caf",
284  .priv_data_size = sizeof(CAFContext),
285  .p.audio_codec = AV_CODEC_ID_PCM_S16BE,
286  .p.video_codec = AV_CODEC_ID_NONE,
287  .write_header = caf_write_header,
288  .write_packet = caf_write_packet,
289  .write_trailer = caf_write_trailer,
290  .p.codec_tag = ff_caf_codec_tags_list,
291 };
CAFContext::data
int64_t data
Definition: cafenc.c:33
AV_CODEC_ID_PCM_S16LE
@ AV_CODEC_ID_PCM_S16LE
Definition: codec_id.h:330
AV_CODEC_ID_MACE6
@ AV_CODEC_ID_MACE6
Definition: codec_id.h:452
AV_CODEC_ID_PCM_F32BE
@ AV_CODEC_ID_PCM_F32BE
Definition: codec_id.h:350
AVCodecParameters::extradata
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: codec_par.h:69
AV_CODEC_ID_ADPCM_MS
@ AV_CODEC_ID_ADPCM_MS
Definition: codec_id.h:375
AV_CODEC_ID_ADPCM_IMA_QT
@ AV_CODEC_ID_ADPCM_IMA_QT
Definition: codec_id.h:369
AV_CODEC_ID_AC3
@ AV_CODEC_ID_AC3
Definition: codec_id.h:445
AVOutputFormat::name
const char * name
Definition: avformat.h:511
AVERROR
Filter: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format: for each input and each output, the list of supported formats. For video that means pixel format. For audio that means channel layout, sample format and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions.
ffio_wfourcc
static av_always_inline void ffio_wfourcc(AVIOContext *pb, const uint8_t *s)
Definition: avio_internal.h:128
caf.h
AVCodecParameters
This struct describes the properties of an encoded stream.
Definition: codec_par.h:47
caf_write_packet
static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)
Definition: cafenc.c:218
AVStream::priv_data
void * priv_data
Definition: avformat.h:866
av_dict_count
int av_dict_count(const AVDictionary *m)
Get number of entries in dictionary.
Definition: dict.c:39
AVPacket::data
uint8_t * data
Definition: packet.h:491
AV_CODEC_ID_ALAC
@ AV_CODEC_ID_ALAC
Definition: codec_id.h:458
AV_CODEC_ID_AMR_NB
@ AV_CODEC_ID_AMR_NB
Definition: codec_id.h:423
AVChannelLayout::order
enum AVChannelOrder order
Channel order used in this layout.
Definition: channel_layout.h:312
CAFContext::size_entries_used
int size_entries_used
Definition: cafenc.c:35
AVChannelLayout::mask
uint64_t mask
This member must be used for AV_CHANNEL_ORDER_NATIVE, and may be used for AV_CHANNEL_ORDER_AMBISONIC ...
Definition: channel_layout.h:339
AVChannelLayout::nb_channels
int nb_channels
Number of channels in this layout.
Definition: channel_layout.h:317
intfloat.h
sample_rate
sample_rate
Definition: ffmpeg_filter.c:368
FFOutputFormat::p
AVOutputFormat p
The public AVOutputFormat.
Definition: mux.h:36
AV_CODEC_ID_PCM_S16BE
@ AV_CODEC_ID_PCM_S16BE
Definition: codec_id.h:331
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:513
AVChannelLayout::u
union AVChannelLayout::@332 u
Details about which channels are present in this layout.
AV_CODEC_ID_MP3
@ AV_CODEC_ID_MP3
preferred ID for decoding MPEG audio layer 1, 2 or 3
Definition: codec_id.h:443
AVStream::duration
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:900
av_get_bits_per_sample
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
Definition: utils.c:558
AV_CODEC_ID_PCM_S8
@ AV_CODEC_ID_PCM_S8
Definition: codec_id.h:334
pkt
AVPacket * pkt
Definition: movenc.c:59
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
AV_CODEC_ID_MACE3
@ AV_CODEC_ID_MACE3
Definition: codec_id.h:451
AVCodecParameters::frame_size
int frame_size
Audio only.
Definition: codec_par.h:182
av_fast_realloc
void * av_fast_realloc(void *ptr, unsigned int *size, size_t min_size)
Reallocate the given buffer if it is not large enough, otherwise do nothing.
Definition: mem.c:495
s
#define s(width, name)
Definition: cbs_vp9.c:198
AVDictionaryEntry::key
char * key
Definition: dict.h:90
frame_size
int frame_size
Definition: mxfenc.c:2311
AV_CODEC_ID_MP2
@ AV_CODEC_ID_MP2
Definition: codec_id.h:442
channels
channels
Definition: aptx.h:31
AV_CODEC_ID_PCM_MULAW
@ AV_CODEC_ID_PCM_MULAW
Definition: codec_id.h:336
codec_id
enum AVCodecID codec_id
Definition: vaapi_decode.c:389
caf_write_header
static int caf_write_header(AVFormatContext *s)
Definition: cafenc.c:111
AVFormatContext
Format I/O context.
Definition: avformat.h:1115
AV_CODEC_ID_PCM_ALAW
@ AV_CODEC_ID_PCM_ALAW
Definition: codec_id.h:337
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:864
NULL
#define NULL
Definition: coverity.c:32
AVERROR_PATCHWELCOME
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
Definition: error.h:64
isom.h
FFOutputFormat
Definition: mux.h:32
avio_w8
void avio_w8(AVIOContext *s, int b)
Definition: aviobuf.c:226
AV_CODEC_ID_QDM2
@ AV_CODEC_ID_QDM2
Definition: codec_id.h:461
AVCodecParameters::ch_layout
AVChannelLayout ch_layout
Audio only.
Definition: codec_par.h:206
AVCodecParameters::sample_rate
int sample_rate
Audio only.
Definition: codec_par.h:171
AV_CODEC_ID_GSM
@ AV_CODEC_ID_GSM
as in Berlin toast format
Definition: codec_id.h:460
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:49
AVCodecParameters::extradata_size
int extradata_size
Size of the extradata content in bytes.
Definition: codec_par.h:73
AV_CODEC_ID_AAC
@ AV_CODEC_ID_AAC
Definition: codec_id.h:444
AV_CODEC_ID_QCELP
@ AV_CODEC_ID_QCELP
Definition: codec_id.h:466
AVIOContext
Bytestream IO Context.
Definition: avio.h:166
AV_CODEC_ID_PCM_S24LE
@ AV_CODEC_ID_PCM_S24LE
Definition: codec_id.h:342
AVPacket::size
int size
Definition: packet.h:492
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:106
AVIOContext::seekable
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:271
ff_standardize_creation_time
int ff_standardize_creation_time(AVFormatContext *s)
Standardize creation_time metadata in AVFormatContext to an ISO-8601 timestamp string.
Definition: mux_utils.c:143
FRAME_SIZE_OFFSET
#define FRAME_SIZE_OFFSET
Definition: cafenc.c:30
AV_CODEC_ID_QDMC
@ AV_CODEC_ID_QDMC
Definition: codec_id.h:492
AV_CODEC_ID_OPUS
@ AV_CODEC_ID_OPUS
Definition: codec_id.h:502
avio_write
void avio_write(AVIOContext *s, const unsigned char *buf, int size)
Definition: aviobuf.c:248
avio_wb32
void avio_wb32(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:412
avio_wl32
void avio_wl32(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:404
AV_CHANNEL_ORDER_NATIVE
@ AV_CHANNEL_ORDER_NATIVE
The native channel order, i.e.
Definition: channel_layout.h:118
av_double2int
static av_always_inline uint64_t av_double2int(double f)
Reinterpret a double as a 64-bit integer.
Definition: intfloat.h:70
AV_CODEC_ID_NONE
@ AV_CODEC_ID_NONE
Definition: codec_id.h:50
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
avio_internal.h
AVCodecParameters::block_align
int block_align
Audio only.
Definition: codec_par.h:178
AV_CODEC_ID_PCM_F64BE
@ AV_CODEC_ID_PCM_F64BE
Definition: codec_id.h:352
AV_CODEC_ID_PCM_S32BE
@ AV_CODEC_ID_PCM_S32BE
Definition: codec_id.h:339
ff_codec_caf_tags
const AVCodecTag ff_codec_caf_tags[]
Known codec tags for CAF.
Definition: caf.c:34
caf_write_trailer
static int caf_write_trailer(AVFormatContext *s)
Definition: cafenc.c:247
AV_CODEC_ID_GSM_MS
@ AV_CODEC_ID_GSM_MS
Definition: codec_id.h:472
AVStream
Stream structure.
Definition: avformat.h:841
avio_seek
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:278
avformat.h
dict.h
U
#define U(x)
Definition: vpx_arith.h:37
ff_caf_codec_tags_list
const AVCodecTag *const ff_caf_codec_tags_list[]
Definition: caf.c:82
AVIO_SEEKABLE_NORMAL
#define AVIO_SEEKABLE_NORMAL
Seeking works like for a local file.
Definition: avio.h:41
ff_codec_get_tag
unsigned int ff_codec_get_tag(const AVCodecTag *tags, enum AVCodecID id)
Definition: utils.c:135
CAFContext::packets
int packets
Definition: cafenc.c:36
avio_wb64
void avio_wb64(AVIOContext *s, uint64_t val)
Definition: aviobuf.c:478
AV_CODEC_ID_PCM_S32LE
@ AV_CODEC_ID_PCM_S32LE
Definition: codec_id.h:338
AV_CODEC_ID_PCM_F64LE
@ AV_CODEC_ID_PCM_F64LE
Definition: codec_id.h:353
AVDictionaryEntry
Definition: dict.h:89
CAFContext
Definition: cafenc.c:32
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:55
AVPacket
This structure stores compressed data.
Definition: packet.h:468
AV_CODEC_ID_ADPCM_IMA_WAV
@ AV_CODEC_ID_ADPCM_IMA_WAV
Definition: codec_id.h:370
AV_CODEC_ID_ILBC
@ AV_CODEC_ID_ILBC
Definition: codec_id.h:501
CAFContext::size_buffer_size
int size_buffer_size
Definition: cafenc.c:34
avio_wb16
void avio_wb16(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:490
AV_CODEC_ID_PCM_F32LE
@ AV_CODEC_ID_PCM_F32LE
Definition: codec_id.h:351
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
codec_flags
static uint32_t codec_flags(enum AVCodecID codec_id)
Definition: cafenc.c:39
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
ff_caf_muxer
const FFOutputFormat ff_caf_muxer
Definition: cafenc.c:279
AVDictionaryEntry::value
char * value
Definition: dict.h:91
ff_mov_write_chan
void ff_mov_write_chan(AVIOContext *pb, int64_t channel_layout)
Definition: isom.c:413
avio_put_str
int avio_put_str(AVIOContext *s, const char *str)
Write a NULL-terminated string.
Definition: aviobuf.c:420
AV_CODEC_ID_MP1
@ AV_CODEC_ID_MP1
Definition: codec_id.h:484
samples_per_packet
static uint32_t samples_per_packet(const AVCodecParameters *par)
Definition: cafenc.c:56
AV_CODEC_ID_PCM_S24BE
@ AV_CODEC_ID_PCM_S24BE
Definition: codec_id.h:343
av_dict_iterate
const AVDictionaryEntry * av_dict_iterate(const AVDictionary *m, const AVDictionaryEntry *prev)
Iterate over a dictionary.
Definition: dict.c:44
mux.h