annotate ffmpeg/libavcodec/libvo-aacenc.c @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents 6840f77b83aa
children
rev   line source
yading@10 1 /*
yading@10 2 * AAC encoder wrapper
yading@10 3 * Copyright (c) 2010 Martin Storsjo
yading@10 4 *
yading@10 5 * This file is part of FFmpeg.
yading@10 6 *
yading@10 7 * FFmpeg is free software; you can redistribute it and/or
yading@10 8 * modify it under the terms of the GNU Lesser General Public
yading@10 9 * License as published by the Free Software Foundation; either
yading@10 10 * version 2.1 of the License, or (at your option) any later version.
yading@10 11 *
yading@10 12 * FFmpeg is distributed in the hope that it will be useful,
yading@10 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
yading@10 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
yading@10 15 * Lesser General Public License for more details.
yading@10 16 *
yading@10 17 * You should have received a copy of the GNU Lesser General Public
yading@10 18 * License along with FFmpeg; if not, write to the Free Software
yading@10 19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
yading@10 20 */
yading@10 21
yading@10 22 #include <vo-aacenc/voAAC.h>
yading@10 23 #include <vo-aacenc/cmnMemory.h>
yading@10 24
yading@10 25 #include "avcodec.h"
yading@10 26 #include "audio_frame_queue.h"
yading@10 27 #include "internal.h"
yading@10 28 #include "mpeg4audio.h"
yading@10 29
yading@10 30 #define FRAME_SIZE 1024
yading@10 31 #define ENC_DELAY 1600
yading@10 32
yading@10 33 typedef struct AACContext {
yading@10 34 VO_AUDIO_CODECAPI codec_api;
yading@10 35 VO_HANDLE handle;
yading@10 36 VO_MEM_OPERATOR mem_operator;
yading@10 37 VO_CODEC_INIT_USERDATA user_data;
yading@10 38 VO_PBYTE end_buffer;
yading@10 39 AudioFrameQueue afq;
yading@10 40 int last_frame;
yading@10 41 int last_samples;
yading@10 42 } AACContext;
yading@10 43
yading@10 44
yading@10 45 static int aac_encode_close(AVCodecContext *avctx)
yading@10 46 {
yading@10 47 AACContext *s = avctx->priv_data;
yading@10 48
yading@10 49 s->codec_api.Uninit(s->handle);
yading@10 50 av_freep(&avctx->extradata);
yading@10 51 ff_af_queue_close(&s->afq);
yading@10 52 av_freep(&s->end_buffer);
yading@10 53
yading@10 54 return 0;
yading@10 55 }
yading@10 56
yading@10 57 static av_cold int aac_encode_init(AVCodecContext *avctx)
yading@10 58 {
yading@10 59 AACContext *s = avctx->priv_data;
yading@10 60 AACENC_PARAM params = { 0 };
yading@10 61 int index, ret;
yading@10 62
yading@10 63 avctx->frame_size = FRAME_SIZE;
yading@10 64 avctx->delay = ENC_DELAY;
yading@10 65 s->last_frame = 2;
yading@10 66 ff_af_queue_init(avctx, &s->afq);
yading@10 67
yading@10 68 s->end_buffer = av_mallocz(avctx->frame_size * avctx->channels * 2);
yading@10 69 if (!s->end_buffer) {
yading@10 70 ret = AVERROR(ENOMEM);
yading@10 71 goto error;
yading@10 72 }
yading@10 73
yading@10 74 voGetAACEncAPI(&s->codec_api);
yading@10 75
yading@10 76 s->mem_operator.Alloc = cmnMemAlloc;
yading@10 77 s->mem_operator.Copy = cmnMemCopy;
yading@10 78 s->mem_operator.Free = cmnMemFree;
yading@10 79 s->mem_operator.Set = cmnMemSet;
yading@10 80 s->mem_operator.Check = cmnMemCheck;
yading@10 81 s->user_data.memflag = VO_IMF_USERMEMOPERATOR;
yading@10 82 s->user_data.memData = &s->mem_operator;
yading@10 83 s->codec_api.Init(&s->handle, VO_AUDIO_CodingAAC, &s->user_data);
yading@10 84
yading@10 85 params.sampleRate = avctx->sample_rate;
yading@10 86 params.bitRate = avctx->bit_rate;
yading@10 87 params.nChannels = avctx->channels;
yading@10 88 params.adtsUsed = !(avctx->flags & CODEC_FLAG_GLOBAL_HEADER);
yading@10 89 if (s->codec_api.SetParam(s->handle, VO_PID_AAC_ENCPARAM, &params)
yading@10 90 != VO_ERR_NONE) {
yading@10 91 av_log(avctx, AV_LOG_ERROR, "Unable to set encoding parameters\n");
yading@10 92 ret = AVERROR(EINVAL);
yading@10 93 goto error;
yading@10 94 }
yading@10 95
yading@10 96 for (index = 0; index < 16; index++)
yading@10 97 if (avctx->sample_rate == avpriv_mpeg4audio_sample_rates[index])
yading@10 98 break;
yading@10 99 if (index == 16) {
yading@10 100 av_log(avctx, AV_LOG_ERROR, "Unsupported sample rate %d\n",
yading@10 101 avctx->sample_rate);
yading@10 102 ret = AVERROR(ENOSYS);
yading@10 103 goto error;
yading@10 104 }
yading@10 105 if (avctx->flags & CODEC_FLAG_GLOBAL_HEADER) {
yading@10 106 avctx->extradata_size = 2;
yading@10 107 avctx->extradata = av_mallocz(avctx->extradata_size +
yading@10 108 FF_INPUT_BUFFER_PADDING_SIZE);
yading@10 109 if (!avctx->extradata) {
yading@10 110 ret = AVERROR(ENOMEM);
yading@10 111 goto error;
yading@10 112 }
yading@10 113
yading@10 114 avctx->extradata[0] = 0x02 << 3 | index >> 1;
yading@10 115 avctx->extradata[1] = (index & 0x01) << 7 | avctx->channels << 3;
yading@10 116 }
yading@10 117 return 0;
yading@10 118 error:
yading@10 119 aac_encode_close(avctx);
yading@10 120 return ret;
yading@10 121 }
yading@10 122
yading@10 123 static int aac_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
yading@10 124 const AVFrame *frame, int *got_packet_ptr)
yading@10 125 {
yading@10 126 AACContext *s = avctx->priv_data;
yading@10 127 VO_CODECBUFFER input = { 0 }, output = { 0 };
yading@10 128 VO_AUDIO_OUTPUTINFO output_info = { { 0 } };
yading@10 129 VO_PBYTE samples;
yading@10 130 int ret;
yading@10 131
yading@10 132 /* handle end-of-stream small frame and flushing */
yading@10 133 if (!frame) {
yading@10 134 if (s->last_frame <= 0)
yading@10 135 return 0;
yading@10 136 if (s->last_samples > 0 && s->last_samples < ENC_DELAY - FRAME_SIZE) {
yading@10 137 s->last_samples = 0;
yading@10 138 s->last_frame--;
yading@10 139 }
yading@10 140 s->last_frame--;
yading@10 141 memset(s->end_buffer, 0, 2 * avctx->channels * avctx->frame_size);
yading@10 142 samples = s->end_buffer;
yading@10 143 } else {
yading@10 144 if (frame->nb_samples < avctx->frame_size) {
yading@10 145 s->last_samples = frame->nb_samples;
yading@10 146 memcpy(s->end_buffer, frame->data[0], 2 * avctx->channels * frame->nb_samples);
yading@10 147 samples = s->end_buffer;
yading@10 148 } else {
yading@10 149 samples = (VO_PBYTE)frame->data[0];
yading@10 150 }
yading@10 151 /* add current frame to the queue */
yading@10 152 if ((ret = ff_af_queue_add(&s->afq, frame)) < 0)
yading@10 153 return ret;
yading@10 154 }
yading@10 155
yading@10 156 if ((ret = ff_alloc_packet2(avctx, avpkt, FFMAX(8192, 768 * avctx->channels))) < 0)
yading@10 157 return ret;
yading@10 158
yading@10 159 input.Buffer = samples;
yading@10 160 input.Length = 2 * avctx->channels * avctx->frame_size;
yading@10 161 output.Buffer = avpkt->data;
yading@10 162 output.Length = avpkt->size;
yading@10 163
yading@10 164 s->codec_api.SetInputData(s->handle, &input);
yading@10 165 if (s->codec_api.GetOutputData(s->handle, &output, &output_info)
yading@10 166 != VO_ERR_NONE) {
yading@10 167 av_log(avctx, AV_LOG_ERROR, "Unable to encode frame\n");
yading@10 168 return AVERROR(EINVAL);
yading@10 169 }
yading@10 170
yading@10 171 /* Get the next frame pts/duration */
yading@10 172 ff_af_queue_remove(&s->afq, avctx->frame_size, &avpkt->pts,
yading@10 173 &avpkt->duration);
yading@10 174
yading@10 175 avpkt->size = output.Length;
yading@10 176 *got_packet_ptr = 1;
yading@10 177 return 0;
yading@10 178 }
yading@10 179
/*
 * Local copy of avpriv_mpeg4audio_sample_rates, duplicated here to avoid
 * shared build failures. Only the first 13 of the 16 slots are listed; the
 * remaining ones are implicitly zero.
 */
static const int mpeg4audio_sample_rates[16] = {
    96000, 88200, 64000, 48000,
    44100, 32000, 24000, 22050,
    16000, 12000, 11025,  8000,
     7350,
};
yading@10 186
yading@10 187 AVCodec ff_libvo_aacenc_encoder = {
yading@10 188 .name = "libvo_aacenc",
yading@10 189 .type = AVMEDIA_TYPE_AUDIO,
yading@10 190 .id = AV_CODEC_ID_AAC,
yading@10 191 .priv_data_size = sizeof(AACContext),
yading@10 192 .init = aac_encode_init,
yading@10 193 .encode2 = aac_encode_frame,
yading@10 194 .close = aac_encode_close,
yading@10 195 .supported_samplerates = mpeg4audio_sample_rates,
yading@10 196 .capabilities = CODEC_CAP_SMALL_LAST_FRAME | CODEC_CAP_DELAY,
yading@10 197 .sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
yading@10 198 AV_SAMPLE_FMT_NONE },
yading@10 199 .long_name = NULL_IF_CONFIG_SMALL("Android VisualOn AAC (Advanced Audio Coding)"),
yading@10 200 };