cafenc.c
Go to the documentation of this file.
1 /*
2  * Core Audio Format muxer
3  * Copyright (c) 2011 Carl Eugen Hoyos
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "avformat.h"
23 #include "caf.h"
24 #include "isom.h"
25 #include "avio_internal.h"
26 #include "libavutil/intfloat.h"
27 #include "libavutil/dict.h"
28 
/**
 * Private state of the CAF muxer; the functions below obtain it from
 * s->priv_data.
 *
 * NOTE(review): source lines 31-33 are missing from this listing. The
 * cross-reference index at the end of the listing attributes
 * "uint8_t *pkt_sizes" (line 31), "int size_buffer_size" (line 32) and
 * "int size_entries_used" (line 33) to them, and the packet/trailer code
 * uses those three members -- confirm against the real file.
 */
29 typedef struct {
30  int64_t data; /* output position taken right after the "data" fourcc is written; the trailer seeks back to it to patch the chunk size */
34  int packets; /* incremented once per packet, but only when the stream's block_align is 0 */
35 } CAFContext;
36 
/**
 * Return the value the header writer stores as mFormatFlags in the
 * "desc" chunk for a given codec.
 *
 * @param codec_id codec being muxed
 * @return 1, 2 or 3 for the flag combinations named next to each return
 *         statement, 0 for every codec that reaches the default label
 *
 * NOTE(review): the case labels (source lines 39-40, 42-44 and 46-47) are
 * missing from this listing, so which codec IDs select each non-zero value
 * cannot be confirmed from here.
 */
37 static uint32_t codec_flags(enum AVCodecID codec_id) {
38  switch (codec_id) {
 /* case labels for this return are not visible in the listing */
41  return 1; //< kCAFLinearPCMFormatFlagIsFloat
 /* case labels for this return are not visible in the listing */
45  return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian
 /* case labels for this return are not visible in the listing */
48  return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian
49  default:
50  return 0;
51  }
52 }
53 
/**
 * Return the per-packet sample count for a codec.
 *
 * The header writer stores the result as mFramesPerPacket, and the trailer
 * multiplies it by the packet count to produce mNumberValidFrames.
 *
 * @param codec_id codec being muxed
 * @param channels channel count; only used by the two formula-based returns
 * @return the sample count, or 0 for codecs that reach the default label
 *
 * NOTE(review): several case labels (source lines 57-68, 73, 92 and 94) are
 * missing from this listing, so the codecs behind "return 64" and the two
 * formulas are not visible here.
 * NOTE(review): both formulas divide by a multiple of channels; presumably
 * callers guarantee channels > 0 -- confirm.
 */
54 static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels) {
55  switch (codec_id) {
56  case AV_CODEC_ID_PCM_S8:
 /* further labels sharing this return (source lines 57-68) are not visible */
69  return 1;
70  case AV_CODEC_ID_MACE3:
71  case AV_CODEC_ID_MACE6:
72  return 6;
 /* label for this return (source line 73) is not visible */
74  return 64;
75  case AV_CODEC_ID_AMR_NB:
76  case AV_CODEC_ID_GSM:
77  case AV_CODEC_ID_ILBC:
78  case AV_CODEC_ID_QCELP:
79  return 160;
80  case AV_CODEC_ID_GSM_MS:
81  return 320;
82  case AV_CODEC_ID_MP1:
83  return 384;
84  case AV_CODEC_ID_MP2:
85  case AV_CODEC_ID_MP3:
86  return 1152;
87  case AV_CODEC_ID_AC3:
88  return 1536;
89  case AV_CODEC_ID_ALAC:
90  case AV_CODEC_ID_QDM2:
91  return 4096;
 /* label for this formula (source line 92) is not visible */
93  return (1024 - 4 * channels) * 8 / (4 * channels) + 1;
 /* label for this formula (source line 94) is not visible */
95  return (1024 - 7 * channels) * 2 / channels + 2;
96  default:
97  return 0;
98  }
99 }
100 
/*
 * Body of the header writer. The signature line (source line 101) is missing
 * from this listing; the cross-reference index gives it as
 * "static int caf_write_header(AVFormatContext *s)".
 *
 * Writes, in order: the file header, the "desc" chunk, an optional "chan"
 * chunk, an optional "kuki" chunk (ALAC, AMR-NB, QDM2), an optional "info"
 * chunk built from s->metadata, and the start of the "data" chunk.
 * Only streams[0] is consulted.
 *
 * Returns 0 on success, AVERROR_PATCHWELCOME for AAC and AC3, and
 * AVERROR_INVALIDDATA when no codec tag is found or when block_align is 0
 * on a non-seekable output.
 */
102 {
103  AVIOContext *pb = s->pb;
104  AVCodecContext *enc = s->streams[0]->codec;
105  CAFContext *caf = s->priv_data;
 /* NOTE(review): source line 106 is missing; presumably it declares the dictionary iterator "t" used by the "info" loops below, initialised to NULL -- confirm */
107  unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, enc->codec_id);
108  int64_t chunk_size = 0;
109 
 /* Refuse codecs this muxer cannot write yet, before any byte is emitted. */
110  switch (enc->codec_id) {
111  case AV_CODEC_ID_AAC:
112  case AV_CODEC_ID_AC3:
113  av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n");
114  return AVERROR_PATCHWELCOME;
115  }
116 
 /* Override the looked-up tag with 'lpcm'. Further case labels (source lines 119-130) are missing from this listing. */
117  switch (enc->codec_id) {
118  case AV_CODEC_ID_PCM_S8:
131  codec_tag = MKTAG('l','p','c','m');
132  }
133 
134  if (!codec_tag) {
135  av_log(s, AV_LOG_ERROR, "unsupported codec\n");
136  return AVERROR_INVALIDDATA;
137  }
138 
 /* With block_align == 0 the packet sizes are only written by the trailer, inside its seekable-only branch. */
139  if (!enc->block_align && !pb->seekable) {
140  av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n");
141  return AVERROR_INVALIDDATA;
142  }
143 
144  ffio_wfourcc(pb, "caff"); //< mFileType
145  avio_wb16(pb, 1); //< mFileVersion
146  avio_wb16(pb, 0); //< mFileFlags
147 
 /* The chunk size 32 equals the bytes written by the seven fields that follow: 8 + 6 * 4. */
148  ffio_wfourcc(pb, "desc"); //< Audio Description chunk
149  avio_wb64(pb, 32); //< mChunkSize
 /* The sample rate is stored as the bit pattern of a double, not as an integer. */
150  avio_wb64(pb, av_double2int(enc->sample_rate)); //< mSampleRate
 /* This is the only field in the chunk written with avio_wl32; all others use the wb variants. */
151  avio_wl32(pb, codec_tag); //< mFormatID
152  avio_wb32(pb, codec_flags(enc->codec_id)); //< mFormatFlags
153  avio_wb32(pb, enc->block_align); //< mBytesPerPacket
154  avio_wb32(pb, samples_per_packet(enc->codec_id, enc->channels)); //< mFramesPerPacket
155  avio_wb32(pb, enc->channels); //< mChannelsPerFrame
156  avio_wb32(pb, av_get_bits_per_sample(enc->codec_id)); //< mBitsPerChannel
157 
 /* Channel layout chunk with a declared payload of 12 bytes. */
158  if (enc->channel_layout) {
159  ffio_wfourcc(pb, "chan");
160  avio_wb64(pb, 12);
 /* NOTE(review): source line 161, which must emit the 12 payload bytes, is missing; the index lists ff_mov_write_chan(pb, channel_layout), presumably called here -- confirm */
162  }
163 
 /* Codec-specific "kuki" chunk. */
164  if (enc->codec_id == AV_CODEC_ID_ALAC) {
165  ffio_wfourcc(pb, "kuki");
 /* 12 = length of the fixed prefix written next ("\14" is octal for 12); extradata is appended unchanged */
166  avio_wb64(pb, 12 + enc->extradata_size);
167  avio_write(pb, "\0\0\0\14frmaalac", 12);
168  avio_write(pb, enc->extradata, enc->extradata_size);
169  } else if (enc->codec_id == AV_CODEC_ID_AMR_NB) {
170  ffio_wfourcc(pb, "kuki");
 /* 29 = 12 (prefix) + 4 (size) + 8 ("samrFFMP") + 1 + 2 + 1 + 1 bytes written below */
171  avio_wb64(pb, 29);
172  avio_write(pb, "\0\0\0\14frmasamr", 12);
173  avio_wb32(pb, 0x11); /* size */
174  avio_write(pb, "samrFFMP", 8);
175  avio_w8(pb, 0); /* decoder version */
176 
177  avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */
178  avio_w8(pb, 0x00); /* Mode change period (no restriction) */
179  avio_w8(pb, 0x01); /* Frames per sample */
180  } else if (enc->codec_id == AV_CODEC_ID_QDM2) {
 /* QDM2: the chunk payload is the extradata alone, with no prefix */
181  ffio_wfourcc(pb, "kuki");
182  avio_wb64(pb, enc->extradata_size);
183  avio_write(pb, enc->extradata, enc->extradata_size);
184  }
185 
 /* Metadata: the first pass sums the payload size, the second pass writes the strings. */
186  if (av_dict_count(s->metadata)) {
187  ffio_wfourcc(pb, "info"); //< Information chunk
188  while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
 /* +2: one terminator byte each for key and value (the index describes avio_put_str as writing a terminated string) */
189  chunk_size += strlen(t->key) + strlen(t->value) + 2;
190  }
 /* NOTE(review): the extra 4 bytes presumably cover a 32-bit entry count written on the missing source line 192 -- confirm */
191  avio_wb64(pb, chunk_size + 4);
 /* restart the iteration from the first entry */
193  t = NULL;
194  while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) {
195  avio_put_str(pb, t->key);
196  avio_put_str(pb, t->value);
197  }
198  }
199 
200  ffio_wfourcc(pb, "data"); //< Audio Data chunk
 /* Remember where the 8-byte size field sits; -1 is written as a placeholder and the trailer overwrites it only when the output is seekable. */
201  caf->data = avio_tell(pb);
202  avio_wb64(pb, -1); //< mChunkSize
203  avio_wb32(pb, 0); //< mEditCount
204 
205  avio_flush(pb);
206  return 0;
207 }
208 
/*
 * Body of the packet writer. The signature line (source line 209) is missing
 * from this listing; the cross-reference index gives it as
 * "static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)".
 *
 * Writes the packet payload to the output unchanged. When streams[0] has
 * block_align == 0, it also appends the packet size to caf->pkt_sizes in a
 * variable-length form (7 bits per byte, most significant group first, bit 7
 * set on every byte except the last) for the trailer to emit.
 *
 * Returns 0 on success, AVERROR(ENOMEM) if the size table cannot grow.
 */
210 {
211  CAFContext *caf = s->priv_data;
212 
213  avio_write(s->pb, pkt->data, pkt->size);
214  if (!s->streams[0]->codec->block_align) {
 /* keep the old pointer so it can still be freed if the reallocation below yields NULL */
215  void *pkt_sizes = caf->pkt_sizes;
 /* +5: the loop below emits at most 4 continuation bytes plus 1 final byte */
216  int i, alloc_size = caf->size_entries_used + 5;
 /* a negative result is treated as an allocation failure */
217  if (alloc_size < 0) {
218  caf->pkt_sizes = NULL;
219  } else {
220  caf->pkt_sizes = av_fast_realloc(caf->pkt_sizes,
221  &caf->size_buffer_size,
222  alloc_size);
223  }
224  if (!caf->pkt_sizes) {
225  av_free(pkt_sizes);
226  return AVERROR(ENOMEM);
227  }
 /* Emit the groups above the low 7 bits, highest first, skipping leading groups where no higher bits are set. */
228  for (i = 4; i > 0; i--) {
229  unsigned top = pkt->size >> i * 7;
 /* NOTE(review): top still holds every higher bit; this relies on the store narrowing to one byte (the index lists pkt_sizes as uint8_t *) -- confirm */
230  if (top)
231  caf->pkt_sizes[caf->size_entries_used++] = 128 | top;
232  }
 /* final byte: low 7 bits, continuation bit clear */
233  caf->pkt_sizes[caf->size_entries_used++] = pkt->size & 127;
234  caf->packets++;
235  }
236  return 0;
237 }
238 
/*
 * Body of the trailer writer. The signature line (source line 239) is
 * missing from this listing; the cross-reference index gives it as
 * "static int caf_write_trailer(AVFormatContext *s)".
 *
 * On seekable output it patches the "data" chunk size left as a placeholder
 * by the header writer and, when block_align is 0, appends a "pakt" chunk
 * holding the packet sizes collected by the packet writer. The size table is
 * freed in every case. Always returns 0.
 */
240 {
241  CAFContext *caf = s->priv_data;
242  AVIOContext *pb = s->pb;
243  AVCodecContext *enc = s->streams[0]->codec;
244 
245  if (pb->seekable) {
246  int64_t file_size = avio_tell(pb);
247 
 /* caf->data is the offset of the 8-byte size field, so the value written counts every byte after that field up to the current end of output */
248  avio_seek(pb, caf->data, SEEK_SET);
249  avio_wb64(pb, file_size - caf->data - 8);
250  avio_seek(pb, file_size, SEEK_SET);
251  if (!enc->block_align) {
252  ffio_wfourcc(pb, "pakt");
 /* 24 = the four fixed fields written below (8 + 8 + 4 + 4), followed by the size table */
253  avio_wb64(pb, caf->size_entries_used + 24);
254  avio_wb64(pb, caf->packets); ///< mNumberPackets
 /* NOTE(review): packets is int and samples_per_packet() returns uint32_t, so with a 32-bit int this product is formed in 32 bits before widening and may wrap on very long streams -- consider widening one operand first */
255  avio_wb64(pb, caf->packets * samples_per_packet(enc->codec_id, enc->channels)); ///< mNumberValidFrames
256  avio_wb32(pb, 0); ///< mPrimingFrames
257  avio_wb32(pb, 0); ///< mRemainderFrames
258  avio_write(pb, caf->pkt_sizes, caf->size_entries_used);
259  caf->size_buffer_size = 0;
260  }
261  avio_flush(pb);
262  }
 /* released whether or not the table was written */
263  av_freep(&caf->pkt_sizes);
264  return 0;
265 }
266 
/*
 * Initializer of the muxer description. The declaration line (source line
 * 267) is missing from this listing; the cross-reference index gives it as
 * "AVOutputFormat ff_caf_muxer".
 *
 * NOTE(review): source lines 275-277 are also missing; presumably they set
 * the write_header / write_packet / write_trailer callbacks to the three
 * functions above -- confirm against the real file.
 */
268  .name = "caf",
269  .long_name = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"),
270  .mime_type = "audio/x-caf",
271  .extensions = "caf",
 /* size of the private CAFContext state */
272  .priv_data_size = sizeof(CAFContext),
 /* default audio codec; no video codec is set */
273  .audio_codec = AV_CODEC_ID_PCM_S16BE,
274  .video_codec = AV_CODEC_ID_NONE,
 /* zero-terminated list holding the same tag table the header writer passes to ff_codec_get_tag() */
278  .codec_tag = (const AVCodecTag* const []){ff_codec_caf_tags, 0},
279 };
void avio_wb64(AVIOContext *s, uint64_t val)
Definition: aviobuf.c:361
const char * s
Definition: avisynth_c.h:668
Bytestream IO Context.
Definition: avio.h:68
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
int packets
Definition: cafenc.c:34
static int write_packet(AVFormatContext *s, AVPacket *pkt)
int av_dict_count(const AVDictionary *m)
Get number of entries in dictionary.
Definition: dict.c:33
int64_t avio_seek(AVIOContext *s, int64_t offset, int whence)
fseek() equivalent for AVIOContext.
Definition: aviobuf.c:199
CAF common code.
static av_always_inline uint64_t av_double2int(double f)
Reinterpret a double as a 64-bit integer.
Definition: intfloat.h:70
unsigned int ff_codec_get_tag(const AVCodecTag *tags, enum AVCodecID id)
AVDictionaryEntry * av_dict_get(AVDictionary *m, const char *key, const AVDictionaryEntry *prev, int flags)
Get a dictionary entry with matching key.
Definition: dict.c:39
int block_align
number of bytes per packet if constant and known or 0 Used by some WAV based audio codecs...
void av_freep(void *arg)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc() and set the pointer ...
Definition: mem.c:198
Format I/O context.
Definition: avformat.h:944
Public dictionary API.
void avio_wl32(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:291
uint8_t
static AVPacket pkt
Definition: demuxing.c:56
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
AVStream ** streams
Definition: avformat.h:992
uint8_t * pkt_sizes
Definition: cafenc.c:31
uint8_t * data
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:248
void avio_write(AVIOContext *s, const unsigned char *buf, int size)
Definition: aviobuf.c:173
static av_always_inline void ffio_wfourcc(AVIOContext *pb, const uint8_t *s)
Definition: avio_internal.h:50
static int write_trailer(AVFormatContext *s)
AVCodecID
Identify the syntax and semantics of the bitstream.
int size_entries_used
Definition: cafenc.c:33
AVDictionary * metadata
Definition: avformat.h:1092
int av_get_bits_per_sample(enum AVCodecID codec_id)
Return codec bits per sample.
void av_free(void *ptr)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc(). ...
Definition: mem.c:183
void * av_fast_realloc(void *ptr, unsigned int *size, size_t min_size)
Reallocate the given block if it is not large enough, otherwise do nothing.
static int caf_write_header(AVFormatContext *s)
Definition: cafenc.c:101
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
preferred ID for decoding MPEG audio layer 1, 2 or 3
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:246
enum AVCodecID codec_id
Definition: mov_chan.c:433
uint64_t channel_layout
Audio channel layout.
AVCodecContext * codec
Codec context associated with this stream.
Definition: avformat.h:662
int seekable
A combination of AVIO_SEEKABLE_ flags or 0 when the stream is not seekable.
Definition: avio.h:117
int void avio_flush(AVIOContext *s)
Force flushing of buffered data to the output s.
Definition: aviobuf.c:193
AVOutputFormat ff_caf_muxer
Definition: cafenc.c:267
t
Definition: genspecsines3.m:6
const char * name
Definition: avformat.h:378
static uint32_t codec_flags(enum AVCodecID codec_id)
Definition: cafenc.c:37
int avio_put_str(AVIOContext *s, const char *str)
Write a NULL-terminated string.
Definition: aviobuf.c:307
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
Definition: error.h:62
NULL
Definition: eval.c:55
enum AVCodecID codec_id
int sample_rate
samples per second
AVIOContext * pb
I/O context.
Definition: avformat.h:977
void avio_w8(AVIOContext *s, int b)
Definition: aviobuf.c:151
main external API structure.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:148
synthesis window for stochastic i
static int caf_write_packet(AVFormatContext *s, AVPacket *pkt)
Definition: cafenc.c:209
Filter: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFilterBuffer structure. Format: for each input and each output, the list of supported formats. For video that means pixel format. For audio that means channel layout and sample format; they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Buffer references: ownership and permissions.
void avio_wb16(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:373
static int caf_write_trailer(AVFormatContext *s)
Definition: cafenc.c:239
static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels)
Definition: cafenc.c:54
void ff_mov_write_chan(AVIOContext *pb, int64_t channel_layout)
Definition: isom.c:552
Main libavformat public API header.
int64_t data
Definition: cafenc.c:30
int size_buffer_size
Definition: cafenc.c:32
char * key
Definition: dict.h:81
char * value
Definition: dict.h:82
as in Berlin toast format
int channels
number of audio channels
void * priv_data
Format private data.
Definition: avformat.h:964
static void write_header(FFV1Context *f)
Definition: ffv1enc.c:470
void avio_wb32(AVIOContext *s, unsigned int val)
Definition: aviobuf.c:299
#define AV_DICT_IGNORE_SUFFIX
Definition: dict.h:68
const AVCodecTag ff_codec_caf_tags[]
Known codec tags for CAF.
Definition: caf.c:34
#define MKTAG(a, b, c, d)
Definition: common.h:282
This structure stores compressed data.