blob: 7aa9e8cee1095d2865dceef63850225e1753ac72
1 | /* |
2 | * Core Audio Format muxer |
3 | * Copyright (c) 2011 Carl Eugen Hoyos |
4 | * |
5 | * This file is part of FFmpeg. |
6 | * |
7 | * FFmpeg is free software; you can redistribute it and/or |
8 | * modify it under the terms of the GNU Lesser General Public |
9 | * License as published by the Free Software Foundation; either |
10 | * version 2.1 of the License, or (at your option) any later version. |
11 | * |
12 | * FFmpeg is distributed in the hope that it will be useful, |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 | * Lesser General Public License for more details. |
16 | * |
17 | * You should have received a copy of the GNU Lesser General Public |
18 | * License along with FFmpeg; if not, write to the Free Software |
19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
20 | */ |
21 | |
22 | #include "avformat.h" |
23 | #include "caf.h" |
24 | #include "isom.h" |
25 | #include "avio_internal.h" |
26 | #include "libavutil/intfloat.h" |
27 | #include "libavutil/dict.h" |
28 | |
/**
 * Private state of the CAF muxer.
 */
typedef struct {
    int64_t data;                  ///< file offset of the "data" chunk's mChunkSize field (patched in the trailer)
    uint8_t *pkt_sizes;            ///< variable-length encoded packet sizes, written out as the "pakt" chunk
    unsigned int size_buffer_size; ///< allocated size of pkt_sizes; unsigned because its address is handed to av_fast_realloc()
    int size_entries_used;         ///< number of bytes of pkt_sizes currently in use
    int packets;                   ///< number of packets whose size has been recorded
} CAFContext;
36 | |
37 | static uint32_t codec_flags(enum AVCodecID codec_id) { |
38 | switch (codec_id) { |
39 | case AV_CODEC_ID_PCM_F32BE: |
40 | case AV_CODEC_ID_PCM_F64BE: |
41 | return 1; //< kCAFLinearPCMFormatFlagIsFloat |
42 | case AV_CODEC_ID_PCM_S16LE: |
43 | case AV_CODEC_ID_PCM_S24LE: |
44 | case AV_CODEC_ID_PCM_S32LE: |
45 | return 2; //< kCAFLinearPCMFormatFlagIsLittleEndian |
46 | case AV_CODEC_ID_PCM_F32LE: |
47 | case AV_CODEC_ID_PCM_F64LE: |
48 | return 3; //< kCAFLinearPCMFormatFlagIsFloat | kCAFLinearPCMFormatFlagIsLittleEndian |
49 | default: |
50 | return 0; |
51 | } |
52 | } |
53 | |
54 | static uint32_t samples_per_packet(enum AVCodecID codec_id, int channels, int block_align) { |
55 | switch (codec_id) { |
56 | case AV_CODEC_ID_PCM_S8: |
57 | case AV_CODEC_ID_PCM_S16LE: |
58 | case AV_CODEC_ID_PCM_S16BE: |
59 | case AV_CODEC_ID_PCM_S24LE: |
60 | case AV_CODEC_ID_PCM_S24BE: |
61 | case AV_CODEC_ID_PCM_S32LE: |
62 | case AV_CODEC_ID_PCM_S32BE: |
63 | case AV_CODEC_ID_PCM_F32LE: |
64 | case AV_CODEC_ID_PCM_F32BE: |
65 | case AV_CODEC_ID_PCM_F64LE: |
66 | case AV_CODEC_ID_PCM_F64BE: |
67 | case AV_CODEC_ID_PCM_ALAW: |
68 | case AV_CODEC_ID_PCM_MULAW: |
69 | return 1; |
70 | case AV_CODEC_ID_MACE3: |
71 | case AV_CODEC_ID_MACE6: |
72 | return 6; |
73 | case AV_CODEC_ID_ADPCM_IMA_QT: |
74 | return 64; |
75 | case AV_CODEC_ID_AMR_NB: |
76 | case AV_CODEC_ID_GSM: |
77 | case AV_CODEC_ID_ILBC: |
78 | case AV_CODEC_ID_QCELP: |
79 | return 160; |
80 | case AV_CODEC_ID_GSM_MS: |
81 | return 320; |
82 | case AV_CODEC_ID_MP1: |
83 | return 384; |
84 | case AV_CODEC_ID_MP2: |
85 | case AV_CODEC_ID_MP3: |
86 | return 1152; |
87 | case AV_CODEC_ID_AC3: |
88 | return 1536; |
89 | case AV_CODEC_ID_QDM2: |
90 | case AV_CODEC_ID_QDMC: |
91 | return 2048 * channels; |
92 | case AV_CODEC_ID_ALAC: |
93 | return 4096; |
94 | case AV_CODEC_ID_ADPCM_IMA_WAV: |
95 | return (block_align - 4 * channels) * 8 / (4 * channels) + 1; |
96 | case AV_CODEC_ID_ADPCM_MS: |
97 | return (block_align - 7 * channels) * 2 / channels + 2; |
98 | default: |
99 | return 0; |
100 | } |
101 | } |
102 | |
103 | static int caf_write_header(AVFormatContext *s) |
104 | { |
105 | AVIOContext *pb = s->pb; |
106 | AVCodecParameters *par = s->streams[0]->codecpar; |
107 | CAFContext *caf = s->priv_data; |
108 | AVDictionaryEntry *t = NULL; |
109 | unsigned int codec_tag = ff_codec_get_tag(ff_codec_caf_tags, par->codec_id); |
110 | int64_t chunk_size = 0; |
111 | int frame_size = par->frame_size; |
112 | |
113 | if (s->nb_streams != 1) { |
114 | av_log(s, AV_LOG_ERROR, "CAF files have exactly one stream\n"); |
115 | return AVERROR(EINVAL); |
116 | } |
117 | |
118 | switch (par->codec_id) { |
119 | case AV_CODEC_ID_AAC: |
120 | av_log(s, AV_LOG_ERROR, "muxing codec currently unsupported\n"); |
121 | return AVERROR_PATCHWELCOME; |
122 | } |
123 | |
124 | if (!codec_tag) { |
125 | av_log(s, AV_LOG_ERROR, "unsupported codec\n"); |
126 | return AVERROR_INVALIDDATA; |
127 | } |
128 | |
129 | if (!par->block_align && !(pb->seekable & AVIO_SEEKABLE_NORMAL)) { |
130 | av_log(s, AV_LOG_ERROR, "Muxing variable packet size not supported on non seekable output\n"); |
131 | return AVERROR_INVALIDDATA; |
132 | } |
133 | |
134 | if (par->codec_id != AV_CODEC_ID_MP3 || frame_size != 576) |
135 | frame_size = samples_per_packet(par->codec_id, par->channels, par->block_align); |
136 | |
137 | ffio_wfourcc(pb, "caff"); //< mFileType |
138 | avio_wb16(pb, 1); //< mFileVersion |
139 | avio_wb16(pb, 0); //< mFileFlags |
140 | |
141 | ffio_wfourcc(pb, "desc"); //< Audio Description chunk |
142 | avio_wb64(pb, 32); //< mChunkSize |
143 | avio_wb64(pb, av_double2int(par->sample_rate)); //< mSampleRate |
144 | avio_wl32(pb, codec_tag); //< mFormatID |
145 | avio_wb32(pb, codec_flags(par->codec_id)); //< mFormatFlags |
146 | avio_wb32(pb, par->block_align); //< mBytesPerPacket |
147 | avio_wb32(pb, frame_size); //< mFramesPerPacket |
148 | avio_wb32(pb, par->channels); //< mChannelsPerFrame |
149 | avio_wb32(pb, av_get_bits_per_sample(par->codec_id)); //< mBitsPerChannel |
150 | |
151 | if (par->channel_layout) { |
152 | ffio_wfourcc(pb, "chan"); |
153 | avio_wb64(pb, 12); |
154 | ff_mov_write_chan(pb, par->channel_layout); |
155 | } |
156 | |
157 | if (par->codec_id == AV_CODEC_ID_ALAC) { |
158 | ffio_wfourcc(pb, "kuki"); |
159 | avio_wb64(pb, 12 + par->extradata_size); |
160 | avio_write(pb, "\0\0\0\14frmaalac", 12); |
161 | avio_write(pb, par->extradata, par->extradata_size); |
162 | } else if (par->codec_id == AV_CODEC_ID_AMR_NB) { |
163 | ffio_wfourcc(pb, "kuki"); |
164 | avio_wb64(pb, 29); |
165 | avio_write(pb, "\0\0\0\14frmasamr", 12); |
166 | avio_wb32(pb, 0x11); /* size */ |
167 | avio_write(pb, "samrFFMP", 8); |
168 | avio_w8(pb, 0); /* decoder version */ |
169 | |
170 | avio_wb16(pb, 0x81FF); /* Mode set (all modes for AMR_NB) */ |
171 | avio_w8(pb, 0x00); /* Mode change period (no restriction) */ |
172 | avio_w8(pb, 0x01); /* Frames per sample */ |
173 | } else if (par->codec_id == AV_CODEC_ID_QDM2 || par->codec_id == AV_CODEC_ID_QDMC) { |
174 | ffio_wfourcc(pb, "kuki"); |
175 | avio_wb64(pb, par->extradata_size); |
176 | avio_write(pb, par->extradata, par->extradata_size); |
177 | } |
178 | |
179 | ff_standardize_creation_time(s); |
180 | if (av_dict_count(s->metadata)) { |
181 | ffio_wfourcc(pb, "info"); //< Information chunk |
182 | while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) { |
183 | chunk_size += strlen(t->key) + strlen(t->value) + 2; |
184 | } |
185 | avio_wb64(pb, chunk_size + 4); |
186 | avio_wb32(pb, av_dict_count(s->metadata)); |
187 | t = NULL; |
188 | while ((t = av_dict_get(s->metadata, "", t, AV_DICT_IGNORE_SUFFIX))) { |
189 | avio_put_str(pb, t->key); |
190 | avio_put_str(pb, t->value); |
191 | } |
192 | } |
193 | |
194 | ffio_wfourcc(pb, "data"); //< Audio Data chunk |
195 | caf->data = avio_tell(pb); |
196 | avio_wb64(pb, -1); //< mChunkSize |
197 | avio_wb32(pb, 0); //< mEditCount |
198 | |
199 | avio_flush(pb); |
200 | return 0; |
201 | } |
202 | |
203 | static int caf_write_packet(AVFormatContext *s, AVPacket *pkt) |
204 | { |
205 | CAFContext *caf = s->priv_data; |
206 | |
207 | avio_write(s->pb, pkt->data, pkt->size); |
208 | if (!s->streams[0]->codecpar->block_align) { |
209 | void *pkt_sizes = caf->pkt_sizes; |
210 | int i, alloc_size = caf->size_entries_used + 5; |
211 | if (alloc_size < 0) { |
212 | caf->pkt_sizes = NULL; |
213 | } else { |
214 | caf->pkt_sizes = av_fast_realloc(caf->pkt_sizes, |
215 | &caf->size_buffer_size, |
216 | alloc_size); |
217 | } |
218 | if (!caf->pkt_sizes) { |
219 | av_free(pkt_sizes); |
220 | return AVERROR(ENOMEM); |
221 | } |
222 | for (i = 4; i > 0; i--) { |
223 | unsigned top = pkt->size >> i * 7; |
224 | if (top) |
225 | caf->pkt_sizes[caf->size_entries_used++] = 128 | top; |
226 | } |
227 | caf->pkt_sizes[caf->size_entries_used++] = pkt->size & 127; |
228 | caf->packets++; |
229 | } |
230 | return 0; |
231 | } |
232 | |
233 | static int caf_write_trailer(AVFormatContext *s) |
234 | { |
235 | CAFContext *caf = s->priv_data; |
236 | AVIOContext *pb = s->pb; |
237 | AVCodecParameters *par = s->streams[0]->codecpar; |
238 | |
239 | if (pb->seekable & AVIO_SEEKABLE_NORMAL) { |
240 | int64_t file_size = avio_tell(pb); |
241 | |
242 | avio_seek(pb, caf->data, SEEK_SET); |
243 | avio_wb64(pb, file_size - caf->data - 8); |
244 | avio_seek(pb, file_size, SEEK_SET); |
245 | if (!par->block_align) { |
246 | ffio_wfourcc(pb, "pakt"); |
247 | avio_wb64(pb, caf->size_entries_used + 24); |
248 | avio_wb64(pb, caf->packets); ///< mNumberPackets |
249 | avio_wb64(pb, caf->packets * samples_per_packet(par->codec_id, par->channels, par->block_align)); ///< mNumberValidFrames |
250 | avio_wb32(pb, 0); ///< mPrimingFrames |
251 | avio_wb32(pb, 0); ///< mRemainderFrames |
252 | avio_write(pb, caf->pkt_sizes, caf->size_entries_used); |
253 | caf->size_buffer_size = 0; |
254 | } |
255 | avio_flush(pb); |
256 | } |
257 | av_freep(&caf->pkt_sizes); |
258 | return 0; |
259 | } |
260 | |
261 | AVOutputFormat ff_caf_muxer = { |
262 | .name = "caf", |
263 | .long_name = NULL_IF_CONFIG_SMALL("Apple CAF (Core Audio Format)"), |
264 | .mime_type = "audio/x-caf", |
265 | .extensions = "caf", |
266 | .priv_data_size = sizeof(CAFContext), |
267 | .audio_codec = AV_CODEC_ID_PCM_S16BE, |
268 | .video_codec = AV_CODEC_ID_NONE, |
269 | .write_header = caf_write_header, |
270 | .write_packet = caf_write_packet, |
271 | .write_trailer = caf_write_trailer, |
272 | .codec_tag = (const AVCodecTag* const []){ff_codec_caf_tags, 0}, |
273 | }; |
274 |