2 * Audio Toolbox system codecs
4 * copyright (c) 2016 rcombs
6 * This file is part of FFmpeg.
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23 #include <AudioToolbox/AudioToolbox.h>
27 #include "ac3_parser_internal.h"
28 #include "bytestream.h"
30 #include "mpegaudiodecheader.h"
31 #include "libavutil/avassert.h"
32 #include "libavutil/opt.h"
33 #include "libavutil/log.h"
/* Provide kAudioFormatEnhancedAC3 as the four-character code 'ec-3' when the
 * minimum required Mac OS X version macro is below 101100 -- presumably
 * because SDK headers for those targets do not declare it (TODO confirm). */
35 #if __MAC_OS_X_VERSION_MIN_REQUIRED < 101100
36 #define kAudioFormatEnhancedAC3 'ec-3'
/* Private decoder state, reached through AVCodecContext.priv_data by every
 * function in this file. */
39 typedef struct ATDecodeContext {
/* Converter handle filled in by AudioConverterNew() in ffat_create_decoder(). */
42 AudioConverterRef converter;
/* Packet description handed to the converter by ffat_decode_callback(). */
43 AudioStreamPacketDescription pkt_desc;
/*
 * Map an FFmpeg codec ID to the AudioToolbox format ID that
 * ffat_create_decoder() stores in the input description's mFormatID.
 *
 * codec:   codec ID to translate.
 * profile: codec profile; passed by the caller but not referenced by the
 *          mapping lines below.
 *
 * Returns the matching kAudioFormat* constant. An av_assert0() carrying the
 * message "Invalid codec ID!" is present for codec IDs without a mapping.
 */
56 static UInt32 ffat_get_format_id(enum AVCodecID codec, int profile)
60 return kAudioFormatMPEG4AAC;
62 return kAudioFormatAC3;
63 case AV_CODEC_ID_ADPCM_IMA_QT:
64 return kAudioFormatAppleIMA4;
65 case AV_CODEC_ID_ALAC:
66 return kAudioFormatAppleLossless;
67 case AV_CODEC_ID_AMR_NB:
68 return kAudioFormatAMR;
/* kAudioFormatEnhancedAC3 may come from the fallback #define near the top of
 * this file rather than from the SDK headers. */
69 case AV_CODEC_ID_EAC3:
70 return kAudioFormatEnhancedAC3;
71 case AV_CODEC_ID_GSM_MS:
72 return kAudioFormatMicrosoftGSM;
73 case AV_CODEC_ID_ILBC:
74 return kAudioFormatiLBC;
76 return kAudioFormatMPEGLayer1;
78 return kAudioFormatMPEGLayer2;
80 return kAudioFormatMPEGLayer3;
81 case AV_CODEC_ID_PCM_ALAW:
82 return kAudioFormatALaw;
83 case AV_CODEC_ID_PCM_MULAW:
84 return kAudioFormatULaw;
85 case AV_CODEC_ID_QDMC:
86 return kAudioFormatQDesign;
87 case AV_CODEC_ID_QDM2:
88 return kAudioFormatQDesign2;
90 av_assert0(!"Invalid codec ID!");
/*
 * Translate an AudioToolbox channel label into a channel id.
 *
 * ffat_update_ctx() uses the returned id as a bit position in the FFmpeg
 * channel-layout mask, and ffat_compare_channel_descriptions() uses it as a
 * sort key. The label is tested against an ascending ladder of
 * kAudioChannelLabel_* boundaries; LFE2 and Mono are handled explicitly and
 * map to the bit indices (count of trailing zeros) of AV_CH_LOW_FREQUENCY_2
 * and AV_CH_FRONT_CENTER.
 */
95 static int ffat_get_channel_id(AudioChannelLabel label)
99 else if (label <= kAudioChannelLabel_LFEScreen)
101 else if (label <= kAudioChannelLabel_RightSurround)
103 else if (label <= kAudioChannelLabel_CenterSurround)
105 else if (label <= kAudioChannelLabel_RightSurroundDirect)
107 else if (label <= kAudioChannelLabel_TopBackRight)
/* Strict '<' here: labels below RearSurroundLeft that were not caught by the
 * earlier rungs form their own range. */
109 else if (label < kAudioChannelLabel_RearSurroundLeft)
111 else if (label <= kAudioChannelLabel_RearSurroundRight)
113 else if (label <= kAudioChannelLabel_RightWide)
115 else if (label == kAudioChannelLabel_LFE2)
116 return ff_ctzll(AV_CH_LOW_FREQUENCY_2);
117 else if (label == kAudioChannelLabel_Mono)
118 return ff_ctzll(AV_CH_FRONT_CENTER);
/*
 * qsort() comparator for AudioChannelDescription entries.
 *
 * Orders two descriptions by the channel id that ffat_get_channel_id()
 * derives from their mChannelLabel; the result is the difference of the two
 * ids (negative, zero or positive).
 */
123 static int ffat_compare_channel_descriptions(const void* a, const void* b)
125 const AudioChannelDescription* da = a;
126 const AudioChannelDescription* db = b;
127 return ffat_get_channel_id(da->mChannelLabel) - ffat_get_channel_id(db->mChannelLabel);
/*
 * Produce a channel layout expressed as explicit channel descriptions.
 *
 * layout: layout to convert; its mChannelLayoutTag selects the path.
 * size:   in/out; receives the byte size reported by
 *         AudioFormatGetPropertyInfo() and is passed on to
 *         AudioFormatGetProperty().
 *
 * For a bitmap layout the conversion is keyed on mChannelBitmap, otherwise on
 * the layout tag itself. The new layout is allocated with av_malloc() and its
 * tag is forced to kAudioChannelLayoutTag_UseChannelDescriptions.
 * ffat_update_ctx() treats a NULL result as an allocation failure.
 *
 * NOTE(review): the statuses returned by AudioFormatGetPropertyInfo() and
 * AudioFormatGetProperty() are not checked here.
 */
130 static AudioChannelLayout *ffat_convert_layout(AudioChannelLayout *layout, UInt32* size)
132 AudioChannelLayoutTag tag = layout->mChannelLayoutTag;
133 AudioChannelLayout *new_layout;
/* Step 1: find out how large the converted layout will be. */
134 if (tag == kAudioChannelLayoutTag_UseChannelDescriptions)
136 else if (tag == kAudioChannelLayoutTag_UseChannelBitmap)
137 AudioFormatGetPropertyInfo(kAudioFormatProperty_ChannelLayoutForBitmap,
138 sizeof(UInt32), &layout->mChannelBitmap, size);
140 AudioFormatGetPropertyInfo(kAudioFormatProperty_ChannelLayoutForTag,
141 sizeof(AudioChannelLayoutTag), &tag, size);
142 new_layout = av_malloc(*size);
/* Step 2: fetch the description-based layout into the new buffer. */
147 if (tag == kAudioChannelLayoutTag_UseChannelBitmap)
148 AudioFormatGetProperty(kAudioFormatProperty_ChannelLayoutForBitmap,
149 sizeof(UInt32), &layout->mChannelBitmap, size, new_layout);
151 AudioFormatGetProperty(kAudioFormatProperty_ChannelLayoutForTag,
152 sizeof(AudioChannelLayoutTag), &tag, size, new_layout);
/* Mark the result as description-based so callers can walk
 * mChannelDescriptions directly. */
153 new_layout->mChannelLayoutTag = kAudioChannelLayoutTag_UseChannelDescriptions;
/*
 * Synchronise the codec context with the converter's current state.
 *
 *  1. Read the converter's current input stream description and copy sample
 *     rate (when non-zero), channel count, default channel layout and frame
 *     size into avctx.
 *  2. Read the current output stream description, overwrite its sample rate
 *     and channel count with the avctx values and write it back.
 *  3. If the converter reports an output channel layout, convert it to
 *     channel descriptions, build avctx->channel_layout as a bit mask of the
 *     channel ids, and fill at->channel_map with the original description
 *     index of each channel after sorting the descriptions by channel id.
 *  4. Fall back to a frame size of 2048 when none was reported.
 *
 * Returns AVERROR(ENOMEM) when a layout buffer cannot be allocated.
 */
158 static int ffat_update_ctx(AVCodecContext *avctx)
160 ATDecodeContext *at = avctx->priv_data;
161 AudioStreamBasicDescription format;
162 UInt32 size = sizeof(format);
163 if (!AudioConverterGetProperty(at->converter,
164 kAudioConverterCurrentInputStreamDescription,
166 if (format.mSampleRate)
167 avctx->sample_rate = format.mSampleRate;
168 avctx->channels = format.mChannelsPerFrame;
169 avctx->channel_layout = av_get_default_channel_layout(avctx->channels);
170 avctx->frame_size = format.mFramesPerPacket;
173 if (!AudioConverterGetProperty(at->converter,
174 kAudioConverterCurrentOutputStreamDescription,
176 format.mSampleRate = avctx->sample_rate;
177 format.mChannelsPerFrame = avctx->channels;
178 AudioConverterSetProperty(at->converter,
179 kAudioConverterCurrentOutputStreamDescription,
183 if (!AudioConverterGetPropertyInfo(at->converter, kAudioConverterOutputChannelLayout,
184 &size, NULL) && size) {
185 AudioChannelLayout *layout = av_malloc(size);
186 uint64_t layout_mask = 0;
189 return AVERROR(ENOMEM);
190 AudioConverterGetProperty(at->converter, kAudioConverterOutputChannelLayout,
192 if (!(layout = ffat_convert_layout(layout, &size)))
193 return AVERROR(ENOMEM);
194 for (i = 0; i < layout->mNumberChannelDescriptions; i++) {
195 int id = ffat_get_channel_id(layout->mChannelDescriptions[i].mChannelLabel);
/* The mask is 64 bits wide and channel ids can exceed the width of int (for
 * example the bit index of AV_CH_LOW_FREQUENCY_2), so the bit must be built
 * with a 64-bit shift; a plain `1 << id` is undefined for such ids. */
198 if (layout_mask & (1ULL << id))
200 layout_mask |= 1ULL << id;
201 layout->mChannelDescriptions[i].mChannelFlags = i; // Abusing flags as index
203 avctx->channel_layout = layout_mask;
/* Sort by channel id; the original position of each description survives in
 * mChannelFlags and becomes the channel map used by COPY_SAMPLES. */
204 qsort(layout->mChannelDescriptions, layout->mNumberChannelDescriptions,
205 sizeof(AudioChannelDescription), &ffat_compare_channel_descriptions);
206 for (i = 0; i < layout->mNumberChannelDescriptions; i++)
207 at->channel_map[i] = layout->mChannelDescriptions[i].mChannelFlags;
/* Default used when the converter did not report frames per packet. */
212 if (!avctx->frame_size)
213 avctx->frame_size = 2048;
/*
 * Write a descriptor header to pb: the tag byte followed by the size split
 * into 7-bit groups. Every size byte except the last has bit 0x80 set; the
 * last one carries the low 7 bits only.
 *
 * ffat_get_magic_cookie() budgets 5 bytes per header, which presumably means
 * one tag byte plus four size bytes (confirm against the loop bounds).
 */
218 static void put_descr(PutByteContext *pb, int tag, unsigned int size)
221 bytestream2_put_byte(pb, tag);
223 bytestream2_put_byte(pb, (size >> (7 * i)) | 0x80);
224 bytestream2_put_byte(pb, size & 0x7F);
/*
 * Build the "magic cookie" handed to AudioToolbox for this stream.
 *
 * avctx:       codec context; the private extradata copy is the payload.
 * cookie_size: out; receives the size of the returned buffer in bytes.
 *
 * For AAC the extradata is wrapped in a descriptor chain written into a
 * freshly av_malloc()ed buffer: ES descriptor (tag 0x03) -> DecoderConfig
 * descriptor (tag 0x04) -> DecoderSpecific info (tag 0x05). For every other
 * codec at->extradata itself is returned. Callers compare the result with
 * at->extradata to tell the two cases apart, and treat a failed allocation
 * as AVERROR(ENOMEM).
 */
227 static uint8_t* ffat_get_magic_cookie(AVCodecContext *avctx, UInt32 *cookie_size)
229 ATDecodeContext *at = avctx->priv_data;
230 if (avctx->codec_id == AV_CODEC_ID_AAC) {
/* Size budget: 5 bytes per descriptor header (three headers), 3 bytes of ES
 * fields (be16 + byte), 13 bytes of DecoderConfig fields (1 + 1 + 3 + 4 + 4),
 * then the extradata itself. */
233 *cookie_size = 5 + 3 + 5+13 + 5+at->extradata_size;
234 if (!(extradata = av_malloc(*cookie_size)))
237 bytestream2_init_writer(&pb, extradata, *cookie_size);
/* ES descriptor: covers everything that follows its own header. */
240 put_descr(&pb, 0x03, 3 + 5+13 + 5+at->extradata_size);
241 bytestream2_put_be16(&pb, 0);
242 bytestream2_put_byte(&pb, 0x00); // flags (= no flags)
244 // DecoderConfig descriptor
245 put_descr(&pb, 0x04, 13 + 5+at->extradata_size);
247 // Object type indication
248 bytestream2_put_byte(&pb, 0x40);
250 bytestream2_put_byte(&pb, 0x15); // flags (= Audiostream)
252 bytestream2_put_be24(&pb, 0); // Buffersize DB
254 bytestream2_put_be32(&pb, 0); // maxbitrate
255 bytestream2_put_be32(&pb, 0); // avgbitrate
257 // DecoderSpecific info descriptor
258 put_descr(&pb, 0x05, at->extradata_size);
259 bytestream2_put_buffer(&pb, at->extradata, at->extradata_size);
/* Non-AAC: the extradata is used as the cookie unchanged (no copy). */
262 *cookie_size = at->extradata_size;
263 return at->extradata;
/*
 * Tell whether the private extradata copy can serve as a magic cookie.
 *
 * Returns non-zero only when at->extradata_size is non-zero and the codec is
 * ALAC, QDM2, QDMC or AAC; zero otherwise.
 */
267 static av_cold int ffat_usable_extradata(AVCodecContext *avctx)
269 ATDecodeContext *at = avctx->priv_data;
270 return at->extradata_size &&
271 (avctx->codec_id == AV_CODEC_ID_ALAC ||
272 avctx->codec_id == AV_CODEC_ID_QDM2 ||
273 avctx->codec_id == AV_CODEC_ID_QDMC ||
274 avctx->codec_id == AV_CODEC_ID_AAC);
/*
 * Hand the stream's magic cookie to the converter.
 *
 * Does the cookie work only when ffat_usable_extradata() accepts the
 * extradata. The cookie from ffat_get_magic_cookie() is set as
 * kAudioConverterDecompressionMagicCookie; an AudioToolbox status from that
 * call is reported through a warning-level log message. Returns
 * AVERROR(ENOMEM) when the cookie could not be built.
 */
277 static int ffat_set_extradata(AVCodecContext *avctx)
279 ATDecodeContext *at = avctx->priv_data;
280 if (ffat_usable_extradata(avctx)) {
283 uint8_t *cookie = ffat_get_magic_cookie(avctx, &cookie_size);
285 return AVERROR(ENOMEM);
287 status = AudioConverterSetProperty(at->converter,
288 kAudioConverterDecompressionMagicCookie,
289 cookie_size, cookie);
291 av_log(avctx, AV_LOG_WARNING, "AudioToolbox cookie error: %i\n", (int)status);
/* A cookie that differs from at->extradata is the temporary AAC wrapper built
 * by ffat_get_magic_cookie(), not the long-lived extradata copy. */
293 if (cookie != at->extradata)
/*
 * Create and configure the AudioConverter for this stream.
 *
 * The input description is filled from the first source that applies:
 *   - the magic cookie, when ffat_usable_extradata() accepts the extradata
 *     (parsed by AudioToolbox via kAudioFormatProperty_FormatInfo);
 *   - the MPEG audio header at the start of pkt (MP1/MP2/MP3, at least 4
 *     bytes), when those decoders are compiled in;
 *   - the (E-)AC-3 header at the start of pkt (at least 7 bytes), when those
 *     decoders are compiled in;
 *   - avctx->sample_rate and avctx->channels, with 44100 and 1 substituted
 *     for zero values.
 * Output is packed signed-integer linear PCM: 32-bit when
 * avctx->bits_per_raw_sample is 32, 16-bit otherwise.
 *
 * pkt is tested for NULL before use; ffat_init_decoder() passes NULL and
 * ffat_decode() passes the current packet.
 *
 * Error returns: AVERROR(ENOMEM) for allocation failures,
 * AVERROR_INVALIDDATA for an unparsable packet header, AVERROR_UNKNOWN for
 * AudioToolbox failures (which are also logged).
 */
299 static av_cold int ffat_create_decoder(AVCodecContext *avctx,
302 ATDecodeContext *at = avctx->priv_data;
/* Only a declared 32-bit stream is decoded to S32; everything else to S16. */
306 enum AVSampleFormat sample_fmt = (avctx->bits_per_raw_sample == 32) ?
307 AV_SAMPLE_FMT_S32 : AV_SAMPLE_FMT_S16;
/* iLBC takes its bytes-per-packet from block_align; all other codecs use 0. */
309 AudioStreamBasicDescription in_format = {
310 .mFormatID = ffat_get_format_id(avctx->codec_id, avctx->profile),
311 .mBytesPerPacket = (avctx->codec_id == AV_CODEC_ID_ILBC) ? avctx->block_align : 0,
313 AudioStreamBasicDescription out_format = {
314 .mFormatID = kAudioFormatLinearPCM,
315 .mFormatFlags = kAudioFormatFlagIsSignedInteger | kAudioFormatFlagIsPacked,
316 .mFramesPerPacket = 1,
317 .mBitsPerChannel = av_get_bytes_per_sample(sample_fmt) * 8,
320 avctx->sample_fmt = sample_fmt;
/* Source 1: let AudioToolbox fill in_format from the magic cookie. */
322 if (ffat_usable_extradata(avctx)) {
323 UInt32 format_size = sizeof(in_format);
325 uint8_t *cookie = ffat_get_magic_cookie(avctx, &cookie_size);
327 return AVERROR(ENOMEM);
328 status = AudioFormatGetProperty(kAudioFormatProperty_FormatInfo,
329 cookie_size, cookie, &format_size, &in_format);
330 if (cookie != at->extradata)
333 av_log(avctx, AV_LOG_ERROR, "AudioToolbox header-parse error: %i\n", (int)status);
334 return AVERROR_UNKNOWN;
/* Source 2: parse the 32-bit MPEG audio frame header of the packet. */
336 #if CONFIG_MP1_AT_DECODER || CONFIG_MP2_AT_DECODER || CONFIG_MP3_AT_DECODER
337 } else if (pkt && pkt->size >= 4 &&
338 (avctx->codec_id == AV_CODEC_ID_MP1 ||
339 avctx->codec_id == AV_CODEC_ID_MP2 ||
340 avctx->codec_id == AV_CODEC_ID_MP3)) {
341 enum AVCodecID codec_id;
343 if (ff_mpa_decode_header(AV_RB32(pkt->data), &avctx->sample_rate,
344 &in_format.mChannelsPerFrame, &avctx->frame_size,
345 &bit_rate, &codec_id) < 0)
346 return AVERROR_INVALIDDATA;
347 avctx->bit_rate = bit_rate;
348 in_format.mSampleRate = avctx->sample_rate;
/* Source 3: parse the AC-3 / E-AC-3 sync frame header of the packet. */
350 #if CONFIG_AC3_AT_DECODER || CONFIG_EAC3_AT_DECODER
351 } else if (pkt && pkt->size >= 7 &&
352 (avctx->codec_id == AV_CODEC_ID_AC3 ||
353 avctx->codec_id == AV_CODEC_ID_EAC3)) {
356 init_get_bits(&gbc, pkt->data, pkt->size);
357 if (ff_ac3_parse_header(&gbc, &hdr) < 0)
358 return AVERROR_INVALIDDATA;
359 in_format.mSampleRate = hdr.sample_rate;
360 in_format.mChannelsPerFrame = hdr.channels;
361 avctx->frame_size = hdr.num_blocks * 256;
362 avctx->bit_rate = hdr.bit_rate;
/* Source 4: caller-supplied parameters, defaulting to 44100 and 1 channel. */
365 in_format.mSampleRate = avctx->sample_rate ? avctx->sample_rate : 44100;
366 in_format.mChannelsPerFrame = avctx->channels ? avctx->channels : 1;
/* Output mirrors the input's sample rate and channel count. */
369 avctx->sample_rate = out_format.mSampleRate = in_format.mSampleRate;
370 avctx->channels = out_format.mChannelsPerFrame = in_format.mChannelsPerFrame;
372 if (avctx->codec_id == AV_CODEC_ID_ADPCM_IMA_QT)
373 in_format.mFramesPerPacket = 64;
375 status = AudioConverterNew(&in_format, &out_format, &at->converter);
378 av_log(avctx, AV_LOG_ERROR, "AudioToolbox init error: %i\n", (int)status);
379 return AVERROR_UNKNOWN;
382 if ((status = ffat_set_extradata(avctx)) < 0)
/* Start from an identity channel map; ffat_update_ctx() may replace it. */
385 for (i = 0; i < (sizeof(at->channel_map) / sizeof(at->channel_map[0])); i++)
386 at->channel_map[i] = i;
/* NOTE(review): the return value of ffat_update_ctx() is discarded here even
 * though that function can return AVERROR(ENOMEM). */
388 ffat_update_ctx(avctx);
/* Scratch buffer holding frame_size samples for every channel. */
390 if(!(at->decoded_data = av_malloc(av_get_bytes_per_sample(avctx->sample_fmt)
391 * avctx->frame_size * avctx->channels)))
392 return AVERROR(ENOMEM);
/* No packet timestamp has been recorded yet. */
394 at->last_pts = AV_NOPTS_VALUE;
/*
 * Codec init callback.
 *
 * Copies avctx->extradata into a zeroed private buffer with
 * AV_INPUT_BUFFER_PADDING_SIZE bytes of padding. The converter is created
 * right away (without a packet) when both channel count and sample rate are
 * already known or the extradata is usable as a magic cookie; otherwise
 * ffat_decode() creates it when it finds no converter.
 *
 * Returns AVERROR(ENOMEM) if the extradata copy cannot be allocated, or the
 * result of ffat_create_decoder() when that is called.
 */
399 static av_cold int ffat_init_decoder(AVCodecContext *avctx)
401 ATDecodeContext *at = avctx->priv_data;
402 if (avctx->extradata_size) {
403 at->extradata = av_mallocz(avctx->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
405 return AVERROR(ENOMEM);
406 at->extradata_size = avctx->extradata_size;
407 memcpy(at->extradata, avctx->extradata, avctx->extradata_size);
410 if ((avctx->channels && avctx->sample_rate) || ffat_usable_extradata(avctx))
411 return ffat_create_decoder(avctx, NULL);
/*
 * Input callback passed to AudioConverterFillComplexBuffer() by
 * ffat_decode(); the user pointer is the AVCodecContext.
 *
 * Promotes the pending packet (new_in_pkt) to the current packet (in_pkt)
 * and exposes its bytes to the converter as a single buffer, described by
 * at->pkt_desc.
 */
416 static OSStatus ffat_decode_callback(AudioConverterRef converter, UInt32 *nb_packets,
417 AudioBufferList *data,
418 AudioStreamPacketDescription **packets,
421 AVCodecContext *avctx = inctx;
422 ATDecodeContext *at = avctx->priv_data;
/* Zero-length packet description; NOTE(review): presumably the end-of-stream
 * path -- confirm against the guarding condition. */
427 *packets = &at->pkt_desc;
428 at->pkt_desc.mDataByteSize = 0;
/* Drop the previously consumed packet and take ownership of the new one. */
433 av_packet_unref(&at->in_pkt);
434 av_packet_move_ref(&at->in_pkt, &at->new_in_pkt);
436 if (!at->in_pkt.data) {
/* Point the converter at the packet payload; no copy is made. */
441 data->mNumberBuffers = 1;
442 data->mBuffers[0].mNumberChannels = 0;
443 data->mBuffers[0].mDataByteSize = at->in_pkt.size;
444 data->mBuffers[0].mData = at->in_pkt.data;
448 *packets = &at->pkt_desc;
449 at->pkt_desc.mDataByteSize = at->in_pkt.size;
/*
 * Copy frame->nb_samples sample groups of the given integer type from
 * at->decoded_data to frame->data[0], reordering channels on the way:
 * output channel c is taken from input channel at->channel_map[c].
 * Expects `at`, `avctx` and `frame` to be in scope at the expansion site.
 */
455 #define COPY_SAMPLES(type) \
456 type *in_ptr = (type*)at->decoded_data; \
457 type *end_ptr = in_ptr + frame->nb_samples * avctx->channels; \
458 type *out_ptr = (type*)frame->data[0]; \
459 for (; in_ptr < end_ptr; in_ptr += avctx->channels, out_ptr += avctx->channels) { \
461 for (c = 0; c < avctx->channels; c++) \
462 out_ptr[c] = in_ptr[at->channel_map[c]]; \
/*
 * Move the decoded samples from the scratch buffer into the output frame,
 * applying the channel map. Uses 32-bit samples when the context's sample
 * format is AV_SAMPLE_FMT_S32 and 16-bit samples otherwise.
 */
465 static void ffat_copy_samples(AVCodecContext *avctx, AVFrame *frame)
467 ATDecodeContext *at = avctx->priv_data;
468 if (avctx->sample_fmt == AV_SAMPLE_FMT_S32) {
469 COPY_SAMPLES(int32_t);
471 COPY_SAMPLES(int16_t);
/*
 * Decode callback: hand one packet to the converter and emit at most one
 * frame.
 *
 * avctx:         codec context.
 * data:          the AVFrame to fill.
 * got_frame_ptr: output flag for "a frame was produced".
 * avpkt:         input packet.
 *
 * The converter is created here, using the packet for header sniffing, when
 * none exists yet. The packet is referenced into at->new_in_pkt, from where
 * ffat_decode_callback() picks it up while AudioConverterFillComplexBuffer()
 * runs. Converter statuses 0 and 1 are both treated as non-errors; any other
 * non-zero status is logged as a warning.
 *
 * Returns a negative AVERROR on allocation or setup failures.
 */
475 static int ffat_decode(AVCodecContext *avctx, void *data,
476 int *got_frame_ptr, AVPacket *avpkt)
478 ATDecodeContext *at = avctx->priv_data;
479 AVFrame *frame = data;
480 int pkt_size = avpkt->size;
482 AudioBufferList out_buffers;
/* AAC without extradata so far: adopt extradata delivered as packet side
 * data (AV_PKT_DATA_NEW_EXTRADATA), copied into a zeroed, padded buffer. */
484 if (avctx->codec_id == AV_CODEC_ID_AAC) {
485 if (!at->extradata_size) {
487 size_t side_data_size;
489 side_data = av_packet_get_side_data(avpkt, AV_PKT_DATA_NEW_EXTRADATA,
491 if (side_data_size) {
492 at->extradata = av_mallocz(side_data_size + AV_INPUT_BUFFER_PADDING_SIZE);
494 return AVERROR(ENOMEM);
495 at->extradata_size = side_data_size;
496 memcpy(at->extradata, side_data, side_data_size);
/* Lazy creation for streams whose parameters were unknown at init time. */
501 if (!at->converter) {
502 if ((ret = ffat_create_decoder(avctx, avpkt)) < 0) {
/* Describe the scratch buffer the converter decodes into. */
507 out_buffers = (AudioBufferList){
511 .mNumberChannels = avctx->channels,
512 .mDataByteSize = av_get_bytes_per_sample(avctx->sample_fmt) * avctx->frame_size
/* Replace any packet still pending for the callback with the new one. */
518 av_packet_unref(&at->new_in_pkt);
521 if ((ret = av_packet_ref(&at->new_in_pkt, avpkt)) < 0) {
528 frame->sample_rate = avctx->sample_rate;
/* In: capacity in samples; out: number of samples actually produced. */
530 frame->nb_samples = avctx->frame_size;
532 out_buffers.mBuffers[0].mData = at->decoded_data;
534 ret = AudioConverterFillComplexBuffer(at->converter, ffat_decode_callback, avctx,
535 &frame->nb_samples, &out_buffers, NULL);
536 if ((!ret || ret == 1) && frame->nb_samples) {
537 if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
539 ffat_copy_samples(avctx, frame);
/* The frame is stamped with the pts remembered from an earlier packet, and
 * the current packet's pts is remembered in turn. */
541 if (at->last_pts != AV_NOPTS_VALUE) {
542 frame->pts = at->last_pts;
543 at->last_pts = avpkt->pts;
545 } else if (ret && ret != 1) {
546 av_log(avctx, AV_LOG_WARNING, "Decode error: %i\n", ret);
548 at->last_pts = avpkt->pts;
/*
 * Flush callback: reset the converter and drop both the pending and the
 * current input packet.
 *
 * NOTE(review): at->converter is passed to AudioConverterReset() without a
 * NULL check, while ffat_decode() shows the converter may not exist yet --
 * confirm that a flush before the first packet is harmless.
 */
554 static av_cold void ffat_decode_flush(AVCodecContext *avctx)
556 ATDecodeContext *at = avctx->priv_data;
557 AudioConverterReset(at->converter);
558 av_packet_unref(&at->new_in_pkt);
559 av_packet_unref(&at->in_pkt);
/*
 * Close callback: dispose of the converter, release both packet references
 * and free the scratch sample buffer and the private extradata copy
 * (av_freep() also resets the pointers to NULL).
 */
562 static av_cold int ffat_close_decoder(AVCodecContext *avctx)
564 ATDecodeContext *at = avctx->priv_data;
566 AudioConverterDispose(at->converter);
567 av_packet_unref(&at->new_in_pkt);
568 av_packet_unref(&at->in_pkt);
569 av_freep(&at->decoded_data);
570 av_freep(&at->extradata);
/*
 * Define the AVClass for one AudioToolbox decoder. NAME is pasted into the
 * variable name (ffat_<NAME>_dec_class) and stringified into the class name
 * ("at_<NAME>_dec").
 */
574 #define FFAT_DEC_CLASS(NAME) \
575 static const AVClass ffat_##NAME##_dec_class = { \
576 .class_name = "at_" #NAME "_dec", \
577 .version = LIBAVUTIL_VERSION_INT, \
/*
 * Define one AudioToolbox decoder: its AVClass (via FFAT_DEC_CLASS) and the
 * AVCodec ff_<NAME>_at_decoder, named "<NAME>_at". All decoders share the
 * same init/close/decode/flush callbacks and private context type.
 *
 * NAME:     codec short name, used for identifiers and strings.
 * ID:       codec ID of the decoder.
 * bsf_name: bitstream filter name or NULL; its use is not shown in the lines
 *           below.
 */
580 #define FFAT_DEC(NAME, ID, bsf_name) \
581 FFAT_DEC_CLASS(NAME) \
582 AVCodec ff_##NAME##_at_decoder = { \
583 .name = #NAME "_at", \
584 .long_name = NULL_IF_CONFIG_SMALL(#NAME " (AudioToolbox)"), \
585 .type = AVMEDIA_TYPE_AUDIO, \
587 .priv_data_size = sizeof(ATDecodeContext), \
588 .init = ffat_init_decoder, \
589 .close = ffat_close_decoder, \
590 .decode = ffat_decode, \
591 .flush = ffat_decode_flush, \
592 .priv_class = &ffat_##NAME##_dec_class, \
594 .capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY | AV_CODEC_CAP_CHANNEL_CONF, \
595 .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_INIT_CLEANUP, \
596 .wrapper_name = "at", \
/* One decoder definition per codec handled by ffat_get_format_id(). Only the
 * AAC entry names a bitstream filter ("aac_adtstoasc"); all others pass NULL. */
599 FFAT_DEC(aac, AV_CODEC_ID_AAC, "aac_adtstoasc")
600 FFAT_DEC(ac3, AV_CODEC_ID_AC3, NULL)
601 FFAT_DEC(adpcm_ima_qt, AV_CODEC_ID_ADPCM_IMA_QT, NULL)
602 FFAT_DEC(alac, AV_CODEC_ID_ALAC, NULL)
603 FFAT_DEC(amr_nb, AV_CODEC_ID_AMR_NB, NULL)
604 FFAT_DEC(eac3, AV_CODEC_ID_EAC3, NULL)
605 FFAT_DEC(gsm_ms, AV_CODEC_ID_GSM_MS, NULL)
606 FFAT_DEC(ilbc, AV_CODEC_ID_ILBC, NULL)
607 FFAT_DEC(mp1, AV_CODEC_ID_MP1, NULL)
608 FFAT_DEC(mp2, AV_CODEC_ID_MP2, NULL)
609 FFAT_DEC(mp3, AV_CODEC_ID_MP3, NULL)
610 FFAT_DEC(pcm_alaw, AV_CODEC_ID_PCM_ALAW, NULL)
611 FFAT_DEC(pcm_mulaw, AV_CODEC_ID_PCM_MULAW, NULL)
612 FFAT_DEC(qdmc, AV_CODEC_ID_QDMC, NULL)
613 FFAT_DEC(qdm2, AV_CODEC_ID_QDM2, NULL)