doxygen/4.1/audiotoolboxenc_8c_source.html

 /*

  * Audio Toolbox system codecs

  *

  * copyright (c) 2016 Rodger Combs

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 #include <AudioToolbox/AudioToolbox.h>


 #define FF_BUFQUEUE_SIZE 256

 #include "libavfilter/bufferqueue.h"


 #include "config.h"

 #include "audio_frame_queue.h"

 #include "avcodec.h"

 #include "bytestream.h"

 #include "internal.h"

 #include "libavformat/isom.h"

 #include "libavutil/avassert.h"

 #include "libavutil/opt.h"

 #include "libavutil/log.h"


 /*
  * Private state of the AudioToolbox encoder wrappers.
  *
  * The type is named "Decode" although this file only uses it for encoding;
  * it is referenced through avctx->priv_data and by the option table via
  * offsetof().
  */
 typedef struct ATDecodeContext {

     /* Class pointer; kept as the first member. */
     AVClass *av_class;

     /* Rate-control mode ("aac_at_mode" option); -1 means "pick automatically". */
     int mode;

     /* "aac_at_quality" option (0..2); remapped to 96 - quality * 32 at init. */
     int quality;


     /* Converter created by AudioConverterNew() in ffat_init_encoder(). */
     AudioConverterRef converter;

     /* Cloned input frames waiting to be pulled by the converter callback. */
     struct FFBufQueue frame_queue;

     /* Frames already handed to the converter; discarded after each encode call. */
     struct FFBufQueue used_frame_queue;


     /* Output packet buffer size used for ff_alloc_packet2(). */
     unsigned pkt_size;

     /* Tracks queued input samples so pts/duration can be derived for packets. */
     AudioFrameQueue afq;

     /* Set once ffat_encode() has been called with a NULL frame. */
     int eof;

     /* Copy of avctx->frame_size taken before the A-law/mu-law x1024 scaling. */
     int frame_size;


     /* Extra reference to the frame most recently passed to the converter. */
     AVFrame* encoding_frame;

 } ATDecodeContext;


 /*
  * Translate an FFmpeg codec ID (and, for AAC, the requested profile) into
  * the matching AudioToolbox format identifier.
  *
  * Any AAC profile other than HE, HE v2, LD or ELD selects plain MPEG-4 AAC.
  * An unsupported codec ID trips av_assert0(); 0 is returned after it only
  * to satisfy the function's return type.
  */
 static UInt32 ffat_get_format_id(enum AVCodecID codec, int profile)
 {
     if (codec == AV_CODEC_ID_AAC) {
         if (profile == FF_PROFILE_AAC_HE)
             return kAudioFormatMPEG4AAC_HE;
         if (profile == FF_PROFILE_AAC_HE_V2)
             return kAudioFormatMPEG4AAC_HE_V2;
         if (profile == FF_PROFILE_AAC_LD)
             return kAudioFormatMPEG4AAC_LD;
         if (profile == FF_PROFILE_AAC_ELD)
             return kAudioFormatMPEG4AAC_ELD;
         /* FF_PROFILE_AAC_LOW and everything else. */
         return kAudioFormatMPEG4AAC;
     }

     switch (codec) {
     case AV_CODEC_ID_ADPCM_IMA_QT:
         return kAudioFormatAppleIMA4;
     case AV_CODEC_ID_ALAC:
         return kAudioFormatAppleLossless;
     case AV_CODEC_ID_ILBC:
         return kAudioFormatiLBC;
     case AV_CODEC_ID_PCM_ALAW:
         return kAudioFormatALaw;
     case AV_CODEC_ID_PCM_MULAW:
         return kAudioFormatULaw;
     default:
         av_assert0(!"Invalid codec ID!");
         return 0;
     }
 }


 /*
  * Refresh the codec context from the properties reported by the converter:
  * maximum output packet size, priming (leading) frames and the output
  * stream description.
  *
  * For A-law / mu-law both the packet buffer size and avctx->frame_size are
  * multiplied by 1024, while at->frame_size keeps the unscaled value.
  */
 static void ffat_update_ctx(AVCodecContext *avctx)
 {
     ATDecodeContext *at = avctx->priv_data;
     AudioStreamBasicDescription out_desc;
     AudioConverterPrimeInfo priming;
     UInt32 prop_size;

     /* Maximum output packet size; the result of the query is not checked. */
     prop_size = sizeof(unsigned);
     AudioConverterGetProperty(at->converter,
                               kAudioConverterPropertyMaximumOutputPacketSize,
                               &prop_size, &at->pkt_size);

     /* Fall back to a fixed buffer size when no size is known. */
     if (!at->pkt_size)
         at->pkt_size = 1024 * 50;

     /* Encoder delay, only taken over when the query succeeds. */
     prop_size = sizeof(priming);
     if (AudioConverterGetProperty(at->converter,
                                   kAudioConverterPrimeInfo,
                                   &prop_size, &priming) == 0) {
         avctx->initial_padding = priming.leadingFrames;
     }

     /* Frame size and (iLBC only) block alignment from the output format. */
     prop_size = sizeof(out_desc);
     if (AudioConverterGetProperty(at->converter,
                                   kAudioConverterCurrentOutputStreamDescription,
                                   &prop_size, &out_desc) == 0) {
         if (out_desc.mFramesPerPacket)
             avctx->frame_size = out_desc.mFramesPerPacket;
         if (avctx->codec_id == AV_CODEC_ID_ILBC && out_desc.mBytesPerPacket)
             avctx->block_align = out_desc.mBytesPerPacket;
     }

     /* Remember the unscaled frame size before the PCM scaling below. */
     at->frame_size = avctx->frame_size;

     switch (avctx->codec_id) {
     case AV_CODEC_ID_PCM_MULAW:
     case AV_CODEC_ID_PCM_ALAW:
         at->pkt_size      *= 1024;
         avctx->frame_size *= 1024;
         break;
     default:
         break;
     }
 }


 /*
  * Read one descriptor header from the byte stream: a one-byte tag followed
  * by a length stored 7 bits per byte, where a set top bit means another
  * length byte follows. At most four length bytes are consumed.
  *
  * The tag is written to *tag; the decoded length is returned.
  */
 static int read_descr(GetByteContext *gb, int *tag)
 {
     int length = 0;
     int i;

     *tag = bytestream2_get_byte(gb);

     for (i = 0; i < 4; i++) {
         int byte = bytestream2_get_byte(gb);

         length = (length << 7) | (byte & 0x7f);
         if ((byte & 0x80) == 0)
             break;
     }

     return length;
 }


 /*
  * Pick the iLBC mode value (20 or 30).
  *
  * A block_align of 38 selects 20 and 50 selects 30. Otherwise the bit rate
  * decides: anything above 14000 selects 20, everything else (including an
  * unset bit rate) selects 30.
  */
 static int get_ilbc_mode(AVCodecContext *avctx)
 {
     if (avctx->block_align == 38)
         return 20;
     if (avctx->block_align == 50)
         return 30;

     /* A bit rate above 14000 is necessarily positive. */
     if (avctx->bit_rate > 14000)
         return 20;

     return 30;
 }


 /*
  * Map an FFmpeg channel bit index (bit position inside a channel layout
  * mask) to an AudioToolbox channel label.
  *
  * Each branch covers a contiguous run of FFmpeg channel bits and applies a
  * fixed offset to the bit index.
  * NOTE(review): the offsets presumably mirror the numeric values of the
  * kAudioChannelLabel_* constants - confirm against CoreAudioTypes.h.
  *
  * Returns the label, or -1 when the channel has no mapping (this includes
  * the stereo downmix channels and any index outside 0..63).
  */
 static av_cold int get_channel_label(int channel)
 {
     uint64_t map;

     /* A 64-bit mask cannot describe any other index; also keeps the shift defined. */
     if (channel < 0 || channel >= 64)
         return -1;

     /*
      * Shift in 64 bits: with a plain int "1", bit 31 sign-extends and
      * indices >= 32 are undefined, which mislabelled the wide,
      * surround-direct and LFE2 channels.
      */
     map = (uint64_t)1 << channel;

     if (map <= AV_CH_LOW_FREQUENCY)
         return channel + 1;
     else if (map <= AV_CH_BACK_RIGHT)
         return channel + 29;
     else if (map <= AV_CH_BACK_CENTER)
         return channel - 1;
     else if (map <= AV_CH_SIDE_RIGHT)
         return channel - 4;
     else if (map <= AV_CH_TOP_BACK_RIGHT)
         return channel + 1;
     else if (map <= AV_CH_STEREO_RIGHT)
         return -1;
     else if (map <= AV_CH_WIDE_RIGHT)
         return channel + 4;
     else if (map <= AV_CH_SURROUND_DIRECT_RIGHT)
         return channel - 23;
     else if (map == AV_CH_LOW_FREQUENCY_2)
         return kAudioChannelLabel_LFE2;
     else
         return -1;
 }


 /*
  * Fill an AudioChannelLayout with one channel description per channel set
  * in in_layout, in ascending bit order.
  *
  * layout    - destination; must have room for count channel descriptions.
  * in_layout - FFmpeg channel layout mask.
  * count     - number of channels to describe.
  *
  * Returns 0 on success, or AVERROR(EINVAL) when the mask has fewer than
  * count bits set or a channel has no AudioToolbox label.
  */
 static int remap_layout(AudioChannelLayout *layout, uint64_t in_layout, int count)
 {
     int i;
     int c = 0;

     layout->mChannelLayoutTag = kAudioChannelLayoutTag_UseChannelDescriptions;
     layout->mNumberChannelDescriptions = count;

     for (i = 0; i < count; i++) {
         int label;

         /*
          * Find the next set bit. The bound is tested first and the mask is
          * built in 64 bits, so the shift is always well defined (an int
          * shift is undefined from bit 31 upwards).
          */
         while (c < 64 && !(in_layout & ((uint64_t)1 << c)))
             c++;
         if (c == 64)
             return AVERROR(EINVAL); // This should never happen

         label = get_channel_label(c);
         layout->mChannelDescriptions[i].mChannelLabel = label;
         if (label < 0)
             return AVERROR(EINVAL);
         c++;
     }

     return 0;
 }


 /*
  * Look up the AudioToolbox channel layout tag used for AAC output for a
  * given FFmpeg channel layout mask.
  *
  * Returns the tag, or 0 when the layout has no dedicated tag.
  */
 static int get_aac_tag(uint64_t in_layout)
 {
     static const struct {
         uint64_t layout;
         int      tag;
     } aac_tags[] = {
         { AV_CH_LAYOUT_MONO,              kAudioChannelLayoutTag_Mono             },
         { AV_CH_LAYOUT_STEREO,            kAudioChannelLayoutTag_Stereo           },
         { AV_CH_LAYOUT_QUAD,              kAudioChannelLayoutTag_AAC_Quadraphonic },
         { AV_CH_LAYOUT_OCTAGONAL,         kAudioChannelLayoutTag_AAC_Octagonal    },
         { AV_CH_LAYOUT_SURROUND,          kAudioChannelLayoutTag_AAC_3_0          },
         { AV_CH_LAYOUT_4POINT0,           kAudioChannelLayoutTag_AAC_4_0          },
         { AV_CH_LAYOUT_5POINT0,           kAudioChannelLayoutTag_AAC_5_0          },
         { AV_CH_LAYOUT_5POINT1,           kAudioChannelLayoutTag_AAC_5_1          },
         { AV_CH_LAYOUT_6POINT0,           kAudioChannelLayoutTag_AAC_6_0          },
         { AV_CH_LAYOUT_6POINT1,           kAudioChannelLayoutTag_AAC_6_1          },
         { AV_CH_LAYOUT_7POINT0,           kAudioChannelLayoutTag_AAC_7_0          },
         { AV_CH_LAYOUT_7POINT1_WIDE_BACK, kAudioChannelLayoutTag_AAC_7_1          },
         { AV_CH_LAYOUT_7POINT1,           kAudioChannelLayoutTag_MPEG_7_1_C       },
     };
     unsigned idx;

     for (idx = 0; idx < sizeof(aac_tags) / sizeof(aac_tags[0]); idx++) {
         if (aac_tags[idx].layout == in_layout)
             return aac_tags[idx].tag;
     }

     /* No dedicated tag for this layout. */
     return 0;
 }


 /*
  * Encoder init callback: create and configure the AudioConverter.
  *
  * Steps, in order: describe the PCM input and the compressed output,
  * create the converter, set input/output channel layouts, pass the bit
  * depth hint, configure rate control (VBR quality or bit rate), set the
  * codec quality, fetch the magic cookie into avctx->extradata, refresh the
  * context via ffat_update_ctx(), optionally limit the VBR packet size, and
  * finally set up the audio frame queue and the reference frame.
  *
  * Returns 0 on success. On failure returns AVERROR(ENOMEM),
  * AVERROR(EINVAL), AVERROR_UNKNOWN or the error from remap_layout().
  *
  * NOTE(review): the error returns after AudioConverterNew() succeeded do
  * not dispose at->converter here; whether the close callback runs after a
  * failed init is not visible in this file - confirm.
  */
 static av_cold int ffat_init_encoder(AVCodecContext *avctx)

 {

     ATDecodeContext *at = avctx->priv_data;

     OSStatus status;


     /*
      * Input: packed linear PCM with one frame per packet. Float flag for
      * FLT/DBL, no sign flag for U8, signed integer for everything else.
      */
     AudioStreamBasicDescription in_format = {

         .mSampleRate = avctx->sample_rate,

         .mFormatID = kAudioFormatLinearPCM,

         .mFormatFlags = ((avctx->sample_fmt == AV_SAMPLE_FMT_FLT ||

                           avctx->sample_fmt == AV_SAMPLE_FMT_DBL) ? kAudioFormatFlagIsFloat

                         : avctx->sample_fmt == AV_SAMPLE_FMT_U8 ? 0

                         : kAudioFormatFlagIsSignedInteger)

                         | kAudioFormatFlagIsPacked,

         .mBytesPerPacket = av_get_bytes_per_sample(avctx->sample_fmt) * avctx->channels,

         .mFramesPerPacket = 1,

         .mBytesPerFrame = av_get_bytes_per_sample(avctx->sample_fmt) * avctx->channels,

         .mChannelsPerFrame = avctx->channels,

         .mBitsPerChannel = av_get_bytes_per_sample(avctx->sample_fmt) * 8,

     };

     /* Output: same rate and channel count; the remaining fields stay zero. */
     AudioStreamBasicDescription out_format = {

         .mSampleRate = avctx->sample_rate,

         .mFormatID = ffat_get_format_id(avctx->codec_id, avctx->profile),

         .mChannelsPerFrame = in_format.mChannelsPerFrame,

     };

     /* Layout header plus one channel description per channel. */
     UInt32 layout_size = sizeof(AudioChannelLayout) +

                          sizeof(AudioChannelDescription) * avctx->channels;

     AudioChannelLayout *channel_layout = av_malloc(layout_size);


     if (!channel_layout)

         return AVERROR(ENOMEM);


     /* iLBC: mode 20 gives 160 frames / 38 bytes, mode 30 gives 240 frames / 50 bytes per packet. */
     if (avctx->codec_id == AV_CODEC_ID_ILBC) {

         int mode = get_ilbc_mode(avctx);

         out_format.mFramesPerPacket  = 8000 * mode / 1000;

         out_format.mBytesPerPacket   = (mode == 20 ? 38 : 50);

     }


     status = AudioConverterNew(&in_format, &out_format, &at->converter);


     if (status != 0) {

         av_log(avctx, AV_LOG_ERROR, "AudioToolbox init error: %i\n", (int)status);

         av_free(channel_layout);

         return AVERROR_UNKNOWN;

     }


     /* No layout given by the caller: use the default one for the channel count. */
     if (!avctx->channel_layout)

         avctx->channel_layout = av_get_default_channel_layout(avctx->channels);


     /* Describe the input layout channel by channel. */
     if ((status = remap_layout(channel_layout, avctx->channel_layout, avctx->channels)) < 0) {

         av_log(avctx, AV_LOG_ERROR, "Invalid channel layout\n");

         av_free(channel_layout);

         return status;

     }


     if (AudioConverterSetProperty(at->converter, kAudioConverterInputChannelLayout,

                                   layout_size, channel_layout)) {

         av_log(avctx, AV_LOG_ERROR, "Unsupported input channel layout\n");

         av_free(channel_layout);

         return AVERROR(EINVAL);

     }

     /*
      * For AAC the output layout is expressed through a layout tag (with no
      * channel descriptions) whenever get_aac_tag() knows one; otherwise the
      * same per-channel description as for the input is reused.
      */
     if (avctx->codec_id == AV_CODEC_ID_AAC) {

         int tag = get_aac_tag(avctx->channel_layout);

         if (tag) {

             channel_layout->mChannelLayoutTag = tag;

             channel_layout->mNumberChannelDescriptions = 0;

         }

     }

     if (AudioConverterSetProperty(at->converter, kAudioConverterOutputChannelLayout,

                                   layout_size, channel_layout)) {

         av_log(avctx, AV_LOG_ERROR, "Unsupported output channel layout\n");

         av_free(channel_layout);

         return AVERROR(EINVAL);

     }

     av_free(channel_layout);


     /* Optional bit depth hint; the result of the call is ignored. */
     if (avctx->bits_per_raw_sample)

         AudioConverterSetProperty(at->converter,

                                   kAudioConverterPropertyBitDepthHint,

                                   sizeof(avctx->bits_per_raw_sample),

                                   &avctx->bits_per_raw_sample);


 #if !TARGET_OS_IPHONE

     /* Mode -1 (auto): VBR when the qscale flag is set, CBR otherwise. */
     if (at->mode == -1)

         at->mode = (avctx->flags & AV_CODEC_FLAG_QSCALE) ?

                    kAudioCodecBitRateControlMode_Variable :

                    kAudioCodecBitRateControlMode_Constant;


     AudioConverterSetProperty(at->converter, kAudioCodecPropertyBitRateControlMode,

                               sizeof(at->mode), &at->mode);


     if (at->mode == kAudioCodecBitRateControlMode_Variable) {

         /* global_quality in lambda units -> 0..14, clamped with a warning. */
         int q = avctx->global_quality / FF_QP2LAMBDA;

         if (q < 0 || q > 14) {

             av_log(avctx, AV_LOG_WARNING,

                    "VBR quality %d out of range, should be 0-14\n", q);

             q = av_clip(q, 0, 14);

         }

         /* 0..14 becomes 127..1 (lower q means a higher value). */
         q = 127 - q * 9;

         AudioConverterSetProperty(at->converter, kAudioCodecPropertySoundQualityForVBR,

                                   sizeof(q), &q);

     /*
      * The "else" below pairs with the "if (avctx->bit_rate > 0)" that
      * follows the #endif; when TARGET_OS_IPHONE is set that "if" stands
      * alone.
      */
     } else

 #endif

     if (avctx->bit_rate > 0) {

         UInt32 rate = avctx->bit_rate;

         UInt32 size;

         /* Ask for the size of the list of applicable bit rate ranges. */
         status = AudioConverterGetPropertyInfo(at->converter,

                                                kAudioConverterApplicableEncodeBitRates,

                                                &size, NULL);

         if (!status && size) {

             UInt32 new_rate = rate;

             int count;

             int i;

             AudioValueRange *ranges = av_malloc(size);

             if (!ranges)

                 return AVERROR(ENOMEM);

             /* The result of this fetch is not checked. */
             AudioConverterGetProperty(at->converter,

                                       kAudioConverterApplicableEncodeBitRates,

                                       &size, ranges);

             count = size / sizeof(AudioValueRange);

             /*
              * Walk the ranges: stop at the first range containing the
              * rate; remember the maximum of a range lying below the rate
              * and keep looking; stop at the minimum of the first range
              * lying above the rate.
              * NOTE(review): this presumably relies on the ranges being
              * sorted in ascending order - confirm.
              */
             for (i = 0; i < count; i++) {

                 AudioValueRange *range = &ranges[i];

                 if (rate >= range->mMinimum && rate <= range->mMaximum) {

                     new_rate = rate;

                     break;

                 } else if (rate > range->mMaximum) {

                     new_rate = range->mMaximum;

                 } else {

                     new_rate = range->mMinimum;

                     break;

                 }

             }

             if (new_rate != rate) {

                 av_log(avctx, AV_LOG_WARNING,

                        "Bitrate %u not allowed; changing to %u\n", rate, new_rate);

                 rate = new_rate;

             }

             av_free(ranges);

         }

         AudioConverterSetProperty(at->converter, kAudioConverterEncodeBitRate,

                                   sizeof(rate), &rate);

     }


     /*
      * Option value 0..2 becomes 96, 64, 32; the option field itself is
      * overwritten with the remapped value.
      * NOTE(review): presumably these match AudioConverter quality
      * constants - confirm.
      */
     at->quality = 96 - at->quality * 32;

     AudioConverterSetProperty(at->converter, kAudioConverterCodecQuality,

                               sizeof(at->quality), &at->quality);


     /*
      * Magic cookie -> extradata. The cookie size is queried straight into
      * avctx->extradata_size (an int passed where the other size queries
      * in this function use a UInt32).
      */
     if (!AudioConverterGetPropertyInfo(at->converter, kAudioConverterCompressionMagicCookie,

                                        &avctx->extradata_size, NULL) &&

         avctx->extradata_size) {

         int extradata_size = avctx->extradata_size;

         uint8_t *extradata;

         if (!(avctx->extradata = av_mallocz(avctx->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE)))

             return AVERROR(ENOMEM);

         if (avctx->codec_id == AV_CODEC_ID_ALAC) {

             /*
              * ALAC: write a 0x24 size field and the 'alac' tag at the
              * start, leave bytes 8..11 zero (buffer is zero-allocated) and
              * fetch the cookie at offset 12. extradata_size is assigned
              * 0x24 twice; the second assignment is redundant.
              */
             avctx->extradata_size = 0x24;

             AV_WB32(avctx->extradata,     0x24);

             AV_WB32(avctx->extradata + 4, MKBETAG('a','l','a','c'));

             extradata = avctx->extradata + 12;

             avctx->extradata_size = 0x24;

         } else {

             extradata = avctx->extradata;

         }

         status = AudioConverterGetProperty(at->converter,

                                            kAudioConverterCompressionMagicCookie,

                                            &extradata_size, extradata);

         if (status != 0) {

             av_log(avctx, AV_LOG_ERROR, "AudioToolbox cookie error: %i\n", (int)status);

             return AVERROR_UNKNOWN;

         } else if (avctx->codec_id == AV_CODEC_ID_AAC) {

             /*
              * AAC: walk the descriptors in the cookie until the decoder
              * specific payload is found, then move that payload to the
              * start of extradata and shrink extradata_size to its length.
              */
             GetByteContext gb;

             int tag, len;

             bytestream2_init(&gb, extradata, extradata_size);

             do {

                 len = read_descr(&gb, &tag);

                 if (tag == MP4DecConfigDescrTag) {

                     /* Skip the 13 fixed bytes that precede the nested descriptor. */
                     bytestream2_skip(&gb, 13);

                     len = read_descr(&gb, &tag);

                     if (tag == MP4DecSpecificDescrTag) {

                         /* Never copy more than what is left in the cookie. */
                         len = FFMIN(gb.buffer_end - gb.buffer, len);

                         memmove(extradata, gb.buffer, len);

                         avctx->extradata_size = len;

                         break;

                     }

                 } else if (tag == MP4ESDescrTag) {

                     int flags;

                     /* Skip two bytes, then read the flags byte and skip the optional fields it announces. */
                     bytestream2_skip(&gb, 2);

                     flags = bytestream2_get_byte(&gb);

                     if (flags & 0x80) //streamDependenceFlag

                         bytestream2_skip(&gb, 2);

                     if (flags & 0x40) //URL_Flag

                         bytestream2_skip(&gb, bytestream2_get_byte(&gb));

                     if (flags & 0x20) //OCRstreamFlag

                         bytestream2_skip(&gb, 2);

                 }

             } while (bytestream2_get_bytes_left(&gb));

         } else if (avctx->codec_id != AV_CODEC_ID_ALAC) {

             /* Other codecs: the cookie is used as is, with the size actually returned. */
             avctx->extradata_size = extradata_size;

         }

     }


     /* Pull packet size, padding and frame size from the configured converter. */
     ffat_update_ctx(avctx);


 #if !TARGET_OS_IPHONE && defined(__MAC_10_9)

     /* VBR with a maximum rate: limit the packet size to rc_max_rate * frame_size / sample_rate. */
     if (at->mode == kAudioCodecBitRateControlMode_Variable && avctx->rc_max_rate) {

         UInt32 max_size = avctx->rc_max_rate * avctx->frame_size / avctx->sample_rate;

         if (max_size)

             AudioConverterSetProperty(at->converter, kAudioCodecPropertyPacketSizeLimitForVBR,

                                       sizeof(max_size), &max_size);

     }

 #endif


     ff_af_queue_init(avctx, &at->afq);


     /* Holder for the extra reference taken in the converter input callback. */
     at->encoding_frame = av_frame_alloc();

     if (!at->encoding_frame)

         return AVERROR(ENOMEM);


     return 0;

 }


 /*
  * Input callback passed to AudioConverterFillComplexBuffer(): supplies the
  * next queued input frame to the converter.
  *
  * converter  - unused.
  * nb_packets - in: number of packets requested; out: number supplied
  *              (at most the frame's sample count, 0 when nothing is given).
  * data       - buffer list filled to point at the frame's sample data.
  * packets    - unused.
  * inctx      - the AVCodecContext.
  *
  * Returns 0 on success and also at end of stream (with 0 packets), 1 when
  * no frame is queued yet but more input is expected, or a negative AVERROR
  * code when referencing the frame fails.
  */
 static OSStatus ffat_encode_callback(AudioConverterRef converter, UInt32 *nb_packets,
                                      AudioBufferList *data,
                                      AudioStreamPacketDescription **packets,
                                      void *inctx)
 {
     AVCodecContext *avctx = inctx;
     ATDecodeContext *at = avctx->priv_data;
     AVFrame *frame;
     int ret;

     if (!at->frame_queue.available) {
         *nb_packets = 0;
         /* 0 tells the converter the stream is over; 1 means "no data right now". */
         return at->eof ? 0 : 1;
     }

     frame = ff_bufqueue_get(&at->frame_queue);

     /*
      * Park the frame in the used queue immediately. ffat_encode() empties
      * that queue once the converter call returns, so the frame is released
      * on every path, including the av_frame_ref() failure below, where it
      * used to be leaked.
      */
     ff_bufqueue_add(avctx, &at->used_frame_queue, frame);

     data->mNumberBuffers              = 1;
     data->mBuffers[0].mNumberChannels = avctx->channels;
     data->mBuffers[0].mDataByteSize   = frame->nb_samples *
                                         av_get_bytes_per_sample(avctx->sample_fmt) *
                                         avctx->channels;
     data->mBuffers[0].mData           = frame->data[0];
     if (*nb_packets > frame->nb_samples)
         *nb_packets = frame->nb_samples;

     /* Keep an extra reference to the samples in encoding_frame. */
     av_frame_unref(at->encoding_frame);
     ret = av_frame_ref(at->encoding_frame, frame);
     if (ret < 0) {
         *nb_packets = 0;
         return ret;
     }

     return 0;
 }


 /*
  * encode2 callback: queue the input frame (or note end of stream when
  * frame is NULL), then ask the converter for output into avpkt.
  *
  * *got_packet_ptr is preset to avctx->frame_size / at->frame_size and
  * handed to the converter as the packet count, which the converter
  * updates. When packets were produced, the packet size, pts and duration
  * are filled in.
  *
  * Returns a negative error code if queueing the frame or allocating the
  * packet fails. A converter error other than status 1 is only logged as a
  * warning and 0 is still returned.
  */
 static int ffat_encode(AVCodecContext *avctx, AVPacket *avpkt,
                        const AVFrame *frame, int *got_packet_ptr)
 {
     ATDecodeContext *at = avctx->priv_data;
     AudioStreamPacketDescription out_pkt_desc = {0};
     AudioBufferList out_buffers = {
         .mNumberBuffers = 1,
         .mBuffers = {
             {
                 .mNumberChannels = avctx->channels,
                 .mDataByteSize   = at->pkt_size,
             }
         }
     };
     OSStatus ret;

     if (!frame) {
         at->eof = 1;
     } else {
         AVFrame *queued;

         if (ff_bufqueue_is_full(&at->frame_queue)) {
             /*
              * The queue is far bigger than what is needed in practice,
              * but there is no clear way to know the minimum number of
              * samples AudioConverterFillComplexBuffer() needs before it
              * produces output.
              */
             av_log(avctx, AV_LOG_ERROR, "Bug: frame queue is too small.\n");
             return AVERROR_BUG;
         }

         ret = ff_af_queue_add(&at->afq, frame);
         if (ret < 0)
             return ret;

         queued = av_frame_clone(frame);
         if (!queued)
             return AVERROR(ENOMEM);

         ff_bufqueue_add(avctx, &at->frame_queue, queued);
     }

     ret = ff_alloc_packet2(avctx, avpkt, at->pkt_size, 0);
     if (ret < 0)
         return ret;

     out_buffers.mBuffers[0].mData = avpkt->data;

     /* Number of converter packets requested per output packet. */
     *got_packet_ptr = avctx->frame_size / at->frame_size;

     /* Packet descriptions are only requested when one converter packet is produced per call. */
     ret = AudioConverterFillComplexBuffer(at->converter, ffat_encode_callback, avctx,
                                           got_packet_ptr, &out_buffers,
                                           (avctx->frame_size > at->frame_size) ? NULL : &out_pkt_desc);

     /* The converter is done with the frames it pulled during this call. */
     ff_bufqueue_discard_all(&at->used_frame_queue);

     if (ret && ret != 1) {
         av_log(avctx, AV_LOG_WARNING, "Encode error: %i\n", ret);
     } else if (*got_packet_ptr) {
         int nb_samples = out_pkt_desc.mVariableFramesInPacket ?
                          out_pkt_desc.mVariableFramesInPacket :
                          avctx->frame_size;

         avpkt->size = out_buffers.mBuffers[0].mDataByteSize;
         ff_af_queue_remove(&at->afq, nb_samples, &avpkt->pts, &avpkt->duration);
     }

     return 0;
 }


 /*
  * Flush callback: reset the converter and drop every frame still held in
  * the pending and used frame queues.
  */
 static av_cold void ffat_encode_flush(AVCodecContext *avctx)
 {
     ATDecodeContext *at = avctx->priv_data;
     struct FFBufQueue *queues[] = { &at->frame_queue, &at->used_frame_queue };
     unsigned idx;

     AudioConverterReset(at->converter);

     for (idx = 0; idx < sizeof(queues) / sizeof(queues[0]); idx++)
         ff_bufqueue_discard_all(queues[idx]);
 }


 /*
  * Close callback: dispose of the converter and release everything the
  * private context still holds (queued frames, the audio frame queue and
  * the reference frame). Always returns 0.
  */
 static av_cold int ffat_close_encoder(AVCodecContext *avctx)
 {
     ATDecodeContext *ctx = avctx->priv_data;

     /* Tear down the converter first. */
     AudioConverterDispose(ctx->converter);

     /* Frames not yet consumed, then frames already handed out. */
     ff_bufqueue_discard_all(&ctx->frame_queue);
     ff_bufqueue_discard_all(&ctx->used_frame_queue);

     /* Timestamp bookkeeping and the extra frame reference. */
     ff_af_queue_close(&ctx->afq);
     av_frame_free(&ctx->encoding_frame);

     return 0;
 }


 /*
  * AAC profiles advertised by the aac_at encoder, with their display names.
  * These are the same profiles that ffat_get_format_id() distinguishes.
  * The list is terminated by an FF_PROFILE_UNKNOWN entry.
  */
 static const AVProfile aac_profiles[] = {

     { FF_PROFILE_AAC_LOW,   "LC"       },

     { FF_PROFILE_AAC_HE,    "HE-AAC"   },

     { FF_PROFILE_AAC_HE_V2, "HE-AACv2" },

     { FF_PROFILE_AAC_LD,    "LD"       },

     { FF_PROFILE_AAC_ELD,   "ELD"      },

     { FF_PROFILE_UNKNOWN },

 };


 /* Flags shared by every option below: audio parameter, encoding parameter. */
 #define AE AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM

 /*
  * Private options. The same table is attached to every encoder class
  * generated by FFAT_ENC_CLASS(), even though the option names carry an
  * "aac_at_" prefix.
  *
  *  - aac_at_mode: rate-control mode, default -1 (auto); the named
  *    constants that follow belong to the "mode" unit. Not available when
  *    TARGET_OS_IPHONE is set.
  *  - aac_at_quality: integer 0..2, default 0.
  */
 static const AVOption options[] = {

 #if !TARGET_OS_IPHONE

     {"aac_at_mode", "ratecontrol mode", offsetof(ATDecodeContext, mode), AV_OPT_TYPE_INT, {.i64 = -1}, -1, kAudioCodecBitRateControlMode_Variable, AE, "mode"},

         {"auto", "VBR if global quality is given; CBR otherwise", 0, AV_OPT_TYPE_CONST, {.i64 = -1}, INT_MIN, INT_MAX, AE, "mode"},

         {"cbr",  "constant bitrate", 0, AV_OPT_TYPE_CONST, {.i64 = kAudioCodecBitRateControlMode_Constant}, INT_MIN, INT_MAX, AE, "mode"},

         {"abr",  "long-term average bitrate", 0, AV_OPT_TYPE_CONST, {.i64 = kAudioCodecBitRateControlMode_LongTermAverage}, INT_MIN, INT_MAX, AE, "mode"},

         {"cvbr", "constrained variable bitrate", 0, AV_OPT_TYPE_CONST, {.i64 = kAudioCodecBitRateControlMode_VariableConstrained}, INT_MIN, INT_MAX, AE, "mode"},

         {"vbr" , "variable bitrate", 0, AV_OPT_TYPE_CONST, {.i64 = kAudioCodecBitRateControlMode_Variable}, INT_MIN, INT_MAX, AE, "mode"},

 #endif

     {"aac_at_quality", "quality vs speed control", offsetof(ATDecodeContext, quality), AV_OPT_TYPE_INT, {.i64 = 0}, 0, 2, AE},

     { NULL },

 };


 /*
  * Define the AVClass "ffat_<NAME>_enc_class" for one encoder. The class is
  * named "at_<NAME>_enc" and exposes the shared options[] table.
  */
 #define FFAT_ENC_CLASS(NAME) \

     static const AVClass ffat_##NAME##_enc_class = { \

         .class_name = "at_" #NAME "_enc", \

         .item_name  = av_default_item_name, \

         .option     = options, \

         .version    = LIBAVUTIL_VERSION_INT, \

     };


 /*
  * Define the AVClass and the AVCodec "ff_<NAME>_at_encoder" for one codec.
  *
  * NAME     - codec name; the encoder is registered as "<NAME>_at".
  * ID       - AVCodecID of the codec.
  * PROFILES - profile table, or NULL.
  * ...      - pasted verbatim right after the base capabilities, so it can
  *            OR in further capability flags ("| FLAG") and/or append more
  *            designated initializers (", .field = value").
  *
  * All encoders share the same init/close/encode/flush callbacks and accept
  * S16 and U8 input samples.
  */
 #define FFAT_ENC(NAME, ID, PROFILES, ...) \

     FFAT_ENC_CLASS(NAME) \

     AVCodec ff_##NAME##_at_encoder = { \

         .name           = #NAME "_at", \

         .long_name      = NULL_IF_CONFIG_SMALL(#NAME " (AudioToolbox)"), \

         .type           = AVMEDIA_TYPE_AUDIO, \

         .id             = ID, \

         .priv_data_size = sizeof(ATDecodeContext), \

         .init           = ffat_init_encoder, \

         .close          = ffat_close_encoder, \

         .encode2        = ffat_encode, \

         .flush          = ffat_encode_flush, \

         .priv_class     = &ffat_##NAME##_enc_class, \

         .capabilities   = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY __VA_ARGS__, \

         .sample_fmts    = (const enum AVSampleFormat[]) { \

             AV_SAMPLE_FMT_S16, \

             AV_SAMPLE_FMT_U8,  AV_SAMPLE_FMT_NONE \

         }, \

         .caps_internal  = FF_CODEC_CAP_INIT_THREADSAFE, \

         .profiles       = PROFILES, \

         .wrapper_name   = "at", \

     };


 /*
  * Channel layouts advertised by the aac_at encoder, terminated by 0.
  * Every entry has a dedicated tag in get_aac_tag(). AV_CH_LAYOUT_7POINT1
  * also has a tag there but is not listed here.
  */
 static const uint64_t aac_at_channel_layouts[] = {

     AV_CH_LAYOUT_MONO,

     AV_CH_LAYOUT_STEREO,

     AV_CH_LAYOUT_SURROUND,

     AV_CH_LAYOUT_4POINT0,

     AV_CH_LAYOUT_5POINT0,

     AV_CH_LAYOUT_5POINT1,

     AV_CH_LAYOUT_6POINT0,

     AV_CH_LAYOUT_6POINT1,

     AV_CH_LAYOUT_7POINT0,

     AV_CH_LAYOUT_7POINT1_WIDE_BACK,

     AV_CH_LAYOUT_QUAD,

     AV_CH_LAYOUT_OCTAGONAL,

     0,

 };


 /*
  * Encoder definitions.
  *
  * aac:  the empty fourth argument adds no capability flags; the fifth
  *       appends the .channel_layouts initializer.
  * alac: adds the variable-frame-size and lossless capabilities.
  * The adpcm_ima_qt encoder is left disabled.
  */
 FFAT_ENC(aac,          AV_CODEC_ID_AAC,          aac_profiles, , .channel_layouts = aac_at_channel_layouts)

 //FFAT_ENC(adpcm_ima_qt, AV_CODEC_ID_ADPCM_IMA_QT, NULL)

 FFAT_ENC(alac,         AV_CODEC_ID_ALAC,         NULL, | AV_CODEC_CAP_VARIABLE_FRAME_SIZE | AV_CODEC_CAP_LOSSLESS)

 FFAT_ENC(ilbc,         AV_CODEC_ID_ILBC,         NULL)

 FFAT_ENC(pcm_alaw,     AV_CODEC_ID_PCM_ALAW,     NULL)

 FFAT_ENC(pcm_mulaw,    AV_CODEC_ID_PCM_MULAW,    NULL)

ff_bufqueue_get
static AVFrame * ff_bufqueue_get(struct FFBufQueue *queue)
Get the first buffer from the queue and remove it.
Definition: bufferqueue.h:98

ff_af_queue_remove
void ff_af_queue_remove(AudioFrameQueue *afq, int nb_samples, int64_t *pts, int64_t *duration)
Remove frame(s) from the queue.
Definition: audio_frame_queue.c:75

NULL
#define NULL
Definition: coverity.c:32

GetByteContext
Definition: bytestream.h:33

AV_CH_LAYOUT_7POINT1
#define AV_CH_LAYOUT_7POINT1
Definition: channel_layout.h:107

get_aac_tag
static int get_aac_tag(uint64_t in_layout)
Definition: audiotoolboxenc.c:200

FFAT_ENC
#define FFAT_ENC(NAME, ID, PROFILES,...)
Definition: audiotoolboxenc.c:617

MP4ESDescrTag
#define MP4ESDescrTag
Definition: isom.h:299

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:226

AVOption
AVOption.
Definition: opt.h:246

data
ptrdiff_t const GLvoid * data
Definition: opengl_enc.c:101

AV_CH_LAYOUT_6POINT1
#define AV_CH_LAYOUT_6POINT1
Definition: channel_layout.h:102

AV_CH_LAYOUT_6POINT0
#define AV_CH_LAYOUT_6POINT0
Definition: channel_layout.h:99

ffat_init_encoder
static av_cold int ffat_init_encoder(AVCodecContext *avctx)
Definition: audiotoolboxenc.c:234

AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182

AVCodecContext::bit_rate
int64_t bit_rate
the average bitrate
Definition: avcodec.h:1583

AV_CH_LAYOUT_SURROUND
#define AV_CH_LAYOUT_SURROUND
Definition: channel_layout.h:89

ffat_close_encoder
static av_cold int ffat_close_encoder(AVCodecContext *avctx)
Definition: audiotoolboxenc.c:575

AV_OPT_TYPE_INT
Definition: opt.h:223

isom.h

AE
#define AE
Definition: audiotoolboxenc.c:595

ATDecodeContext::used_frame_queue
struct FFBufQueue used_frame_queue
Definition: audiotoolboxenc.c:45

AVPacket::size
int size
Definition: avcodec.h:1446

ATDecodeContext::frame_queue
struct FFBufQueue frame_queue
Definition: audiotoolboxenc.c:44

AV_CH_LOW_FREQUENCY_2
#define AV_CH_LOW_FREQUENCY_2
Definition: channel_layout.h:73

bytestream2_init
static av_always_inline void bytestream2_init(GetByteContext *g, const uint8_t *buf, int buf_size)
Definition: bytestream.h:133

AV_CH_LAYOUT_4POINT0
#define AV_CH_LAYOUT_4POINT0
Definition: channel_layout.h:91

AV_CH_LAYOUT_7POINT0
#define AV_CH_LAYOUT_7POINT0
Definition: channel_layout.h:105

av_mallocz
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if available on the CPU) and zero all the bytes of the block.
Definition: mem.c:236

AV_CH_SURROUND_DIRECT_RIGHT
#define AV_CH_SURROUND_DIRECT_RIGHT
Definition: channel_layout.h:72

AVCodecContext::bits_per_raw_sample
int bits_per_raw_sample
Bits per sample/pixel of internal libavcodec pixel/sample format.
Definition: avcodec.h:2757

AV_CH_LAYOUT_STEREO
#define AV_CH_LAYOUT_STEREO
Definition: channel_layout.h:86

get_channel_label
static av_cold int get_channel_label(int channel)
Definition: audiotoolboxenc.c:154

AV_SAMPLE_FMT_FLT
float
Definition: samplefmt.h:63

FF_PROFILE_AAC_HE_V2
#define FF_PROFILE_AAC_HE_V2
Definition: avcodec.h:2868

AVCodecContext::profile
int profile
profile
Definition: avcodec.h:2859

AV_CH_LAYOUT_5POINT0
#define AV_CH_LAYOUT_5POINT0
Definition: channel_layout.h:95

AVCodecContext::block_align
int block_align
Number of bytes per packet if constant and known, or 0. Used by some WAV-based audio codecs.
Definition: avcodec.h:2226

AV_CODEC_ID_ALAC
Definition: avcodec.h:574

ffat_encode_flush
static av_cold void ffat_encode_flush(AVCodecContext *avctx)
Definition: audiotoolboxenc.c:567

FFBufQueue
Structure holding the queue.
Definition: bufferqueue.h:49

av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37

ff_alloc_packet2
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int64_t min_size)
Check AVPacket size and/or allocate data.
Definition: encode.c:32

AV_OPT_TYPE_CONST
Definition: opt.h:232

AVCodecContext::sample_fmt
enum AVSampleFormat sample_fmt
audio sample format
Definition: avcodec.h:2197

config.h

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31

AV_SAMPLE_FMT_U8
AV_SAMPLE_FMT_U8
Definition: audio_convert.c:194

av_frame_alloc
AVFrame * av_frame_alloc(void)
Allocate an AVFrame and set its fields to default values.
Definition: frame.c:189

aac_profiles
static const AVProfile aac_profiles[]
Definition: audiotoolboxenc.c:586

opt.h
AVOptions.

ATDecodeContext::frame_size
int frame_size
Definition: audiotoolboxenc.c:50

ff_af_queue_init
av_cold void ff_af_queue_init(AVCodecContext *avctx, AudioFrameQueue *afq)
Initialize AudioFrameQueue.
Definition: audio_frame_queue.c:28

AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: avcodec.h:1463

AV_CODEC_ID_AAC
Definition: avcodec.h:560

AV_CH_WIDE_RIGHT
#define AV_CH_WIDE_RIGHT
Definition: channel_layout.h:70

av_frame_ref
int av_frame_ref(AVFrame *dst, const AVFrame *src)
Set up a new reference to the data described by the source frame.
Definition: frame.c:443

ATDecodeContext::av_class
AVClass * av_class
Definition: audiotoolboxdec.c:40

AVCodecContext::extradata
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:1634

AV_CH_LOW_FREQUENCY
#define AV_CH_LOW_FREQUENCY
Definition: channel_layout.h:52

frame
static AVFrame * frame
Definition: demuxing_decoding.c:53

AV_CODEC_ID_ADPCM_IMA_QT
Definition: avcodec.h:497

AVPacket::data
uint8_t * data
Definition: avcodec.h:1445

GetByteContext::buffer
const uint8_t * buffer
Definition: bytestream.h:34

tag
uint32_t tag
Definition: movenc.c:1483

ATDecodeContext::mode
int mode
Definition: audiotoolboxenc.c:40

size
ptrdiff_t size
Definition: opengl_enc.c:101

FF_PROFILE_AAC_LD
#define FF_PROFILE_AAC_LD
Definition: avcodec.h:2869

av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28

AV_CH_LAYOUT_5POINT1
#define AV_CH_LAYOUT_5POINT1
Definition: channel_layout.h:96

AV_CODEC_ID_PCM_ALAW
Definition: avcodec.h:465

AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: avcodec.h:215

AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176

ffat_update_ctx
static void ffat_update_ctx(AVCodecContext *avctx)
Definition: audiotoolboxenc.c:88

AVERROR
#define AVERROR(e)
Definition: error.h:43

MP4DecSpecificDescrTag
#define MP4DecSpecificDescrTag
Definition: isom.h:301

bytestream2_skip
static av_always_inline void bytestream2_skip(GetByteContext *g, unsigned int size)
Definition: bytestream.h:164

av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
Definition: frame.c:202

ffat_encode_callback
static OSStatus ffat_encode_callback(AudioConverterRef converter, UInt32 *nb_packets, AudioBufferList *data, AudioStreamPacketDescription **packets, void *inctx)
Definition: audiotoolboxenc.c:454

AVCodecContext::initial_padding
int initial_padding
Audio only.
Definition: avcodec.h:3047

ATDecodeContext::quality
int quality
Definition: audiotoolboxenc.c:41

ATDecodeContext::encoding_frame
AVFrame * encoding_frame
Definition: audiotoolboxenc.c:52

bytestream2_get_bytes_left
static av_always_inline unsigned int bytestream2_get_bytes_left(GetByteContext *g)
Definition: bytestream.h:154

AVCodecContext::flags
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:1613

avassert.h
simple assert() macros that are a bit more flexible than ISO C assert().

AV_CH_LAYOUT_QUAD
#define AV_CH_LAYOUT_QUAD
Definition: channel_layout.h:94

count
GLsizei count
Definition: opengl_enc.c:109

ff_af_queue_add
int ff_af_queue_add(AudioFrameQueue *afq, const AVFrame *f)
Add a frame to the queue.
Definition: audio_frame_queue.c:44

FF_PROFILE_AAC_ELD
#define FF_PROFILE_AAC_ELD
Definition: avcodec.h:2870

AV_CODEC_CAP_VARIABLE_FRAME_SIZE
#define AV_CODEC_CAP_VARIABLE_FRAME_SIZE
Audio encoder supports receiving a different number of samples in each call.
Definition: avcodec.h:1040

bytestream.h

AVCodecContext::channel_layout
uint64_t channel_layout
Audio channel layout.
Definition: avcodec.h:2240

options
static const AVOption options[]
Definition: audiotoolboxenc.c:596

aac_at_channel_layouts
static const uint64_t aac_at_channel_layouts[]
Definition: audiotoolboxenc.c:640

GetByteContext::buffer_end
const uint8_t * buffer_end
Definition: bytestream.h:34

AV_CH_STEREO_RIGHT
#define AV_CH_STEREO_RIGHT
See AV_CH_STEREO_LEFT.
Definition: channel_layout.h:68

AV_CODEC_FLAG_QSCALE
#define AV_CODEC_FLAG_QSCALE
Use fixed qscale.
Definition: avcodec.h:842

FFMIN
#define FFMIN(a, b)
Definition: common.h:96

ff_bufqueue_is_full
static int ff_bufqueue_is_full(struct FFBufQueue *queue)
Test if a buffer queue is full.
Definition: bufferqueue.h:60

FF_PROFILE_AAC_LOW
#define FF_PROFILE_AAC_LOW
Definition: avcodec.h:2864

FF_PROFILE_UNKNOWN
#define FF_PROFILE_UNKNOWN
Definition: avcodec.h:2860

ATDecodeContext::converter
AudioConverterRef converter
Definition: audiotoolboxdec.c:42

AV_SAMPLE_FMT_DBL
double
Definition: samplefmt.h:64

ATDecodeContext::afq
AudioFrameQueue afq
Definition: audiotoolboxenc.c:48

ff_bufqueue_discard_all
static void ff_bufqueue_discard_all(struct FFBufQueue *queue)
Unref and remove all buffers from the queue.
Definition: bufferqueue.h:111

av_frame_clone
AVFrame * av_frame_clone(const AVFrame *src)
Create a new frame that references the same data as src.
Definition: frame.c:540

bufferqueue.h

AudioFrameQueue
Definition: audio_frame_queue.h:32

AVCodecContext::frame_size
int frame_size
Number of samples per channel in an audio frame.
Definition: avcodec.h:2209

avcodec.h
Libavcodec external API header.

MP4DecConfigDescrTag
#define MP4DecConfigDescrTag
Definition: isom.h:300

AVCodecContext::codec_id
enum AVCodecID codec_id
Definition: avcodec.h:1543

FFBufQueue::available
unsigned short available
number of available buffers
Definition: bufferqueue.h:52

AVCodecContext::sample_rate
int sample_rate
samples per second
Definition: avcodec.h:2189

AVCodecContext
main external API structure.
Definition: avcodec.h:1533

AV_CODEC_ID_PCM_MULAW
Definition: avcodec.h:464

AVCodecContext::extradata_size
int extradata_size
Definition: avcodec.h:1635

AVERROR_BUG
#define AVERROR_BUG
Internal bug, also see AVERROR_BUG2.
Definition: error.h:50

AV_CH_TOP_BACK_RIGHT
#define AV_CH_TOP_BACK_RIGHT
Definition: channel_layout.h:66

channel_layouts
static const uint16_t channel_layouts[7]
Definition: dca_lbr.c:113

AVClass
Describe the class of an AVClass context structure.
Definition: log.h:67

AV_CH_LAYOUT_7POINT1_WIDE_BACK
#define AV_CH_LAYOUT_7POINT1_WIDE_BACK
Definition: channel_layout.h:109

AV_WB32
#define AV_WB32(p, v)
Definition: intreadwrite.h:419

AV_CH_LAYOUT_OCTAGONAL
#define AV_CH_LAYOUT_OCTAGONAL
Definition: channel_layout.h:110

ffat_encode
static int ffat_encode(AVCodecContext *avctx, AVPacket *avpkt, const AVFrame *frame, int *got_packet_ptr)
Definition: audiotoolboxenc.c:497

map
const VDPAUPixFmtMap * map
Definition: hwcontext_vdpau.c:83

profile
mfxU16 profile
Definition: qsvenc.c:44

av_frame_unref
void av_frame_unref(AVFrame *frame)
Unreference all the buffers referenced by frame and reset the frame fields.
Definition: frame.c:553

AVCodecContext::global_quality
int global_quality
Global quality for codecs which cannot change it per frame.
Definition: avcodec.h:1599

flags
#define flags(name, subs,...)
Definition: cbs_av1.c:596

ATDecodeContext
Definition: audiotoolboxdec.c:39

AV_CH_BACK_CENTER
#define AV_CH_BACK_CENTER
Definition: channel_layout.h:57

AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:240

AV_CH_SIDE_RIGHT
#define AV_CH_SIDE_RIGHT
Definition: channel_layout.h:59

av_get_bytes_per_sample
int av_get_bytes_per_sample(enum AVSampleFormat sample_fmt)
Return number of bytes per sample.
Definition: samplefmt.c:106

audio_frame_queue.h

internal.h
Common internal API header.

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

channel
channel
Use these values when setting the channel map with ebur128_set_channel().
Definition: ebur128.h:39

AV_CODEC_CAP_LOSSLESS
#define AV_CODEC_CAP_LOSSLESS
Codec is lossless.
Definition: avcodec.h:1058

AVProfile
AVProfile.
Definition: avcodec.h:3357

AVERROR_UNKNOWN
#define AVERROR_UNKNOWN
Unknown error, typically from an external library.
Definition: error.h:71

MKBETAG
#define MKBETAG(a, b, c, d)
Definition: common.h:367

AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding.
Definition: avcodec.h:782

AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:1560

av_free
#define av_free(p)
Definition: tableprint_vlc.h:34

get_ilbc_mode
static int get_ilbc_mode(AVCodecContext *avctx)
Definition: audiotoolboxenc.c:142

ffat_get_format_id
static UInt32 ffat_get_format_id(enum AVCodecID codec, int profile)
Definition: audiotoolboxenc.c:55

len
int len
Definition: vorbis_enc_data.h:452

AVCodecContext::channels
int channels
number of audio channels
Definition: avcodec.h:2190

log.h

FF_QP2LAMBDA
#define FF_QP2LAMBDA
factor to convert from H.263 QP to lambda
Definition: avutil.h:227

layout
uint64_t layout
Definition: channel_layout.c:77

ff_af_queue_close
void ff_af_queue_close(AudioFrameQueue *afq)
Close AudioFrameQueue.
Definition: audio_frame_queue.c:36

FF_PROFILE_AAC_HE
#define FF_PROFILE_AAC_HE
Definition: avcodec.h:2867

av_get_default_channel_layout
int64_t av_get_default_channel_layout(int nb_channels)
Return default channel layout for a given number of channels.
Definition: channel_layout.c:225

read_descr
static int read_descr(GetByteContext *gb, int *tag)
Definition: audiotoolboxenc.c:128

ff_bufqueue_add
static void ff_bufqueue_add(void *log, struct FFBufQueue *queue, AVFrame *buf)
Add a buffer to the queue.
Definition: bufferqueue.h:71

ATDecodeContext::pkt_size
unsigned pkt_size
Definition: audiotoolboxenc.c:47

AV_CODEC_ID_ILBC
Definition: avcodec.h:617

AV_CH_LAYOUT_MONO
#define AV_CH_LAYOUT_MONO
Definition: channel_layout.h:85

AVPacket
This structure stores compressed data.
Definition: avcodec.h:1422

remap_layout
static int remap_layout(AudioChannelLayout *layout, uint64_t in_layout, int count)
Definition: audiotoolboxenc.c:179

mode
mode
Use these values in ebur128_init (or'ed).
Definition: ebur128.h:83

AVFrame::nb_samples
int nb_samples
number of audio samples (per channel) described by this frame
Definition: frame.h:292

AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will be presented to the user.
Definition: avcodec.h:1438

ATDecodeContext::eof
int eof
Definition: audiotoolboxdec.c:53

AV_CH_BACK_RIGHT
#define AV_CH_BACK_RIGHT
Definition: channel_layout.h:54

AVCodecContext::rc_max_rate
int64_t rc_max_rate
maximum bitrate
Definition: avcodec.h:2407