SoftAACEncoder2.cpp revision f60c660f048d5f5e2458cff243c20400d73757a7
1/*
2 * Copyright (C) 2012 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 *      http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17//#define LOG_NDEBUG 0
18#define LOG_TAG "SoftAACEncoder2"
19#include <utils/Log.h>
20
21#include "SoftAACEncoder2.h"
22
23#include <media/stagefright/foundation/ADebug.h>
24#include <media/stagefright/foundation/hexdump.h>
25
26namespace android {
27
28template<class T>
29static void InitOMXParams(T *params) {
30    params->nSize = sizeof(T);
31    params->nVersion.s.nVersionMajor = 1;
32    params->nVersion.s.nVersionMinor = 0;
33    params->nVersion.s.nRevision = 0;
34    params->nVersion.s.nStep = 0;
35}
36
37SoftAACEncoder2::SoftAACEncoder2(
38        const char *name,
39        const OMX_CALLBACKTYPE *callbacks,
40        OMX_PTR appData,
41        OMX_COMPONENTTYPE **component)
42    : SimpleSoftOMXComponent(name, callbacks, appData, component),
43      mAACEncoder(NULL),
44      mNumChannels(1),
45      mSampleRate(44100),
46      mBitRate(0),
47      mAACProfile(OMX_AUDIO_AACObjectLC),
48      mSentCodecSpecificData(false),
49      mInputSize(0),
50      mInputFrame(NULL),
51      mInputTimeUs(-1ll),
52      mSawInputEOS(false),
53      mSignalledError(false) {
54    initPorts();
55    CHECK_EQ(initEncoder(), (status_t)OK);
56    setAudioParams();
57}
58
59SoftAACEncoder2::~SoftAACEncoder2() {
60    aacEncClose(&mAACEncoder);
61
62    delete[] mInputFrame;
63    mInputFrame = NULL;
64}
65
66void SoftAACEncoder2::initPorts() {
67    OMX_PARAM_PORTDEFINITIONTYPE def;
68    InitOMXParams(&def);
69
70    def.nPortIndex = 0;
71    def.eDir = OMX_DirInput;
72    def.nBufferCountMin = kNumBuffers;
73    def.nBufferCountActual = def.nBufferCountMin;
74    def.nBufferSize = kNumSamplesPerFrame * sizeof(int16_t) * 2;
75    def.bEnabled = OMX_TRUE;
76    def.bPopulated = OMX_FALSE;
77    def.eDomain = OMX_PortDomainAudio;
78    def.bBuffersContiguous = OMX_FALSE;
79    def.nBufferAlignment = 1;
80
81    def.format.audio.cMIMEType = const_cast<char *>("audio/raw");
82    def.format.audio.pNativeRender = NULL;
83    def.format.audio.bFlagErrorConcealment = OMX_FALSE;
84    def.format.audio.eEncoding = OMX_AUDIO_CodingPCM;
85
86    addPort(def);
87
88    def.nPortIndex = 1;
89    def.eDir = OMX_DirOutput;
90    def.nBufferCountMin = kNumBuffers;
91    def.nBufferCountActual = def.nBufferCountMin;
92    def.nBufferSize = 8192;
93    def.bEnabled = OMX_TRUE;
94    def.bPopulated = OMX_FALSE;
95    def.eDomain = OMX_PortDomainAudio;
96    def.bBuffersContiguous = OMX_FALSE;
97    def.nBufferAlignment = 2;
98
99    def.format.audio.cMIMEType = const_cast<char *>("audio/aac");
100    def.format.audio.pNativeRender = NULL;
101    def.format.audio.bFlagErrorConcealment = OMX_FALSE;
102    def.format.audio.eEncoding = OMX_AUDIO_CodingAAC;
103
104    addPort(def);
105}
106
107status_t SoftAACEncoder2::initEncoder() {
108    if (AACENC_OK != aacEncOpen(&mAACEncoder, 0, 0)) {
109        ALOGE("Failed to init AAC encoder");
110        return UNKNOWN_ERROR;
111    }
112    return OK;
113}
114
115OMX_ERRORTYPE SoftAACEncoder2::internalGetParameter(
116        OMX_INDEXTYPE index, OMX_PTR params) {
117    switch (index) {
118        case OMX_IndexParamAudioPortFormat:
119        {
120            OMX_AUDIO_PARAM_PORTFORMATTYPE *formatParams =
121                (OMX_AUDIO_PARAM_PORTFORMATTYPE *)params;
122
123            if (formatParams->nPortIndex > 1) {
124                return OMX_ErrorUndefined;
125            }
126
127            if (formatParams->nIndex > 0) {
128                return OMX_ErrorNoMore;
129            }
130
131            formatParams->eEncoding =
132                (formatParams->nPortIndex == 0)
133                    ? OMX_AUDIO_CodingPCM : OMX_AUDIO_CodingAAC;
134
135            return OMX_ErrorNone;
136        }
137
138        case OMX_IndexParamAudioAac:
139        {
140            OMX_AUDIO_PARAM_AACPROFILETYPE *aacParams =
141                (OMX_AUDIO_PARAM_AACPROFILETYPE *)params;
142
143            if (aacParams->nPortIndex != 1) {
144                return OMX_ErrorUndefined;
145            }
146
147            aacParams->nBitRate = mBitRate;
148            aacParams->nAudioBandWidth = 0;
149            aacParams->nAACtools = 0;
150            aacParams->nAACERtools = 0;
151            aacParams->eAACProfile = (OMX_AUDIO_AACPROFILETYPE) mAACProfile;
152            aacParams->eAACStreamFormat = OMX_AUDIO_AACStreamFormatMP4FF;
153            aacParams->eChannelMode = OMX_AUDIO_ChannelModeStereo;
154
155            aacParams->nChannels = mNumChannels;
156            aacParams->nSampleRate = mSampleRate;
157            aacParams->nFrameLength = 0;
158
159            return OMX_ErrorNone;
160        }
161
162        case OMX_IndexParamAudioPcm:
163        {
164            OMX_AUDIO_PARAM_PCMMODETYPE *pcmParams =
165                (OMX_AUDIO_PARAM_PCMMODETYPE *)params;
166
167            if (pcmParams->nPortIndex != 0) {
168                return OMX_ErrorUndefined;
169            }
170
171            pcmParams->eNumData = OMX_NumericalDataSigned;
172            pcmParams->eEndian = OMX_EndianBig;
173            pcmParams->bInterleaved = OMX_TRUE;
174            pcmParams->nBitPerSample = 16;
175            pcmParams->ePCMMode = OMX_AUDIO_PCMModeLinear;
176            pcmParams->eChannelMapping[0] = OMX_AUDIO_ChannelLF;
177            pcmParams->eChannelMapping[1] = OMX_AUDIO_ChannelRF;
178
179            pcmParams->nChannels = mNumChannels;
180            pcmParams->nSamplingRate = mSampleRate;
181
182            return OMX_ErrorNone;
183        }
184
185        default:
186            return SimpleSoftOMXComponent::internalGetParameter(index, params);
187    }
188}
189
190OMX_ERRORTYPE SoftAACEncoder2::internalSetParameter(
191        OMX_INDEXTYPE index, const OMX_PTR params) {
192    switch (index) {
193        case OMX_IndexParamStandardComponentRole:
194        {
195            const OMX_PARAM_COMPONENTROLETYPE *roleParams =
196                (const OMX_PARAM_COMPONENTROLETYPE *)params;
197
198            if (strncmp((const char *)roleParams->cRole,
199                        "audio_encoder.aac",
200                        OMX_MAX_STRINGNAME_SIZE - 1)) {
201                return OMX_ErrorUndefined;
202            }
203
204            return OMX_ErrorNone;
205        }
206
207        case OMX_IndexParamAudioPortFormat:
208        {
209            const OMX_AUDIO_PARAM_PORTFORMATTYPE *formatParams =
210                (const OMX_AUDIO_PARAM_PORTFORMATTYPE *)params;
211
212            if (formatParams->nPortIndex > 1) {
213                return OMX_ErrorUndefined;
214            }
215
216            if (formatParams->nIndex > 0) {
217                return OMX_ErrorNoMore;
218            }
219
220            if ((formatParams->nPortIndex == 0
221                        && formatParams->eEncoding != OMX_AUDIO_CodingPCM)
222                || (formatParams->nPortIndex == 1
223                        && formatParams->eEncoding != OMX_AUDIO_CodingAAC)) {
224                return OMX_ErrorUndefined;
225            }
226
227            return OMX_ErrorNone;
228        }
229
230        case OMX_IndexParamAudioAac:
231        {
232            OMX_AUDIO_PARAM_AACPROFILETYPE *aacParams =
233                (OMX_AUDIO_PARAM_AACPROFILETYPE *)params;
234
235            if (aacParams->nPortIndex != 1) {
236                return OMX_ErrorUndefined;
237            }
238
239            mBitRate = aacParams->nBitRate;
240            mNumChannels = aacParams->nChannels;
241            mSampleRate = aacParams->nSampleRate;
242            if (aacParams->eAACProfile != OMX_AUDIO_AACObjectNull) {
243                mAACProfile = aacParams->eAACProfile;
244            }
245
246            if (setAudioParams() != OK) {
247                return OMX_ErrorUndefined;
248            }
249
250            return OMX_ErrorNone;
251        }
252
253        case OMX_IndexParamAudioPcm:
254        {
255            OMX_AUDIO_PARAM_PCMMODETYPE *pcmParams =
256                (OMX_AUDIO_PARAM_PCMMODETYPE *)params;
257
258            if (pcmParams->nPortIndex != 0) {
259                return OMX_ErrorUndefined;
260            }
261
262            mNumChannels = pcmParams->nChannels;
263            mSampleRate = pcmParams->nSamplingRate;
264            if (setAudioParams() != OK) {
265                return OMX_ErrorUndefined;
266            }
267
268            return OMX_ErrorNone;
269        }
270
271        default:
272            return SimpleSoftOMXComponent::internalSetParameter(index, params);
273    }
274}
275
276static CHANNEL_MODE getChannelMode(OMX_U32 nChannels) {
277    CHANNEL_MODE chMode = MODE_INVALID;
278    switch (nChannels) {
279        case 1: chMode = MODE_1; break;
280        case 2: chMode = MODE_2; break;
281        case 3: chMode = MODE_1_2; break;
282        case 4: chMode = MODE_1_2_1; break;
283        case 5: chMode = MODE_1_2_2; break;
284        case 6: chMode = MODE_1_2_2_1; break;
285        default: chMode = MODE_INVALID;
286    }
287    return chMode;
288}
289
290static AUDIO_OBJECT_TYPE getAOTFromProfile(OMX_U32 profile) {
291    if (profile == OMX_AUDIO_AACObjectLC) {
292        return AOT_AAC_LC;
293    } else if (profile == OMX_AUDIO_AACObjectHE) {
294        return AOT_SBR;
295    } else if (profile == OMX_AUDIO_AACObjectELD) {
296        return AOT_ER_AAC_ELD;
297    } else {
298        ALOGW("Unsupported AAC profile - defaulting to AAC-LC");
299        return AOT_AAC_LC;
300    }
301}
302
303status_t SoftAACEncoder2::setAudioParams() {
304    // We call this whenever sample rate, number of channels or bitrate change
305    // in reponse to setParameter calls.
306
307    ALOGV("setAudioParams: %lu Hz, %lu channels, %lu bps",
308         mSampleRate, mNumChannels, mBitRate);
309
310    if (AACENC_OK != aacEncoder_SetParam(mAACEncoder, AACENC_AOT,
311            getAOTFromProfile(mAACProfile))) {
312        ALOGE("Failed to set AAC encoder parameters");
313        return UNKNOWN_ERROR;
314    }
315
316    if (AACENC_OK != aacEncoder_SetParam(mAACEncoder, AACENC_SAMPLERATE, mSampleRate)) {
317        ALOGE("Failed to set AAC encoder parameters");
318        return UNKNOWN_ERROR;
319    }
320    if (AACENC_OK != aacEncoder_SetParam(mAACEncoder, AACENC_BITRATE, mBitRate)) {
321        ALOGE("Failed to set AAC encoder parameters");
322        return UNKNOWN_ERROR;
323    }
324    if (AACENC_OK != aacEncoder_SetParam(mAACEncoder, AACENC_CHANNELMODE,
325            getChannelMode(mNumChannels))) {
326        ALOGE("Failed to set AAC encoder parameters");
327        return UNKNOWN_ERROR;
328    }
329    if (AACENC_OK != aacEncoder_SetParam(mAACEncoder, AACENC_TRANSMUX, TT_MP4_RAW)) {
330        ALOGE("Failed to set AAC encoder parameters");
331        return UNKNOWN_ERROR;
332    }
333
334    return OK;
335}
336
337void SoftAACEncoder2::onQueueFilled(OMX_U32 portIndex) {
338    if (mSignalledError) {
339        return;
340    }
341
342    List<BufferInfo *> &inQueue = getPortQueue(0);
343    List<BufferInfo *> &outQueue = getPortQueue(1);
344
345    if (!mSentCodecSpecificData) {
346        // The very first thing we want to output is the codec specific
347        // data. It does not require any input data but we will need an
348        // output buffer to store it in.
349
350        if (outQueue.empty()) {
351            return;
352        }
353
354        if (AACENC_OK != aacEncEncode(mAACEncoder, NULL, NULL, NULL, NULL)) {
355            ALOGE("Unable to initialize encoder for profile / sample-rate / bit-rate / channels");
356            notify(OMX_EventError, OMX_ErrorUndefined, 0, NULL);
357            mSignalledError = true;
358            return;
359        }
360
361        OMX_U32 actualBitRate  = aacEncoder_GetParam(mAACEncoder, AACENC_BITRATE);
362        if (mBitRate != actualBitRate) {
363            ALOGW("Requested bitrate %lu unsupported, using %lu", mBitRate, actualBitRate);
364        }
365
366        AACENC_InfoStruct encInfo;
367        if (AACENC_OK != aacEncInfo(mAACEncoder, &encInfo)) {
368            ALOGE("Failed to get AAC encoder info");
369            notify(OMX_EventError, OMX_ErrorUndefined, 0, NULL);
370            mSignalledError = true;
371            return;
372        }
373
374        BufferInfo *outInfo = *outQueue.begin();
375        OMX_BUFFERHEADERTYPE *outHeader = outInfo->mHeader;
376        outHeader->nFilledLen = encInfo.confSize;
377        outHeader->nFlags = OMX_BUFFERFLAG_CODECCONFIG;
378
379        uint8_t *out = outHeader->pBuffer + outHeader->nOffset;
380        memcpy(out, encInfo.confBuf, encInfo.confSize);
381
382        outQueue.erase(outQueue.begin());
383        outInfo->mOwnedByUs = false;
384        notifyFillBufferDone(outHeader);
385
386        mSentCodecSpecificData = true;
387    }
388
389    size_t numBytesPerInputFrame =
390        mNumChannels * kNumSamplesPerFrame * sizeof(int16_t);
391
392    // Limit input size so we only get one ELD frame
393    if (mAACProfile == OMX_AUDIO_AACObjectELD && numBytesPerInputFrame > 512) {
394        numBytesPerInputFrame = 512;
395    }
396
397    for (;;) {
398        // We do the following until we run out of buffers.
399
400        while (mInputSize < numBytesPerInputFrame) {
401            // As long as there's still input data to be read we
402            // will drain "kNumSamplesPerFrame * mNumChannels" samples
403            // into the "mInputFrame" buffer and then encode those
404            // as a unit into an output buffer.
405
406            if (mSawInputEOS || inQueue.empty()) {
407                return;
408            }
409
410            BufferInfo *inInfo = *inQueue.begin();
411            OMX_BUFFERHEADERTYPE *inHeader = inInfo->mHeader;
412
413            const void *inData = inHeader->pBuffer + inHeader->nOffset;
414
415            size_t copy = numBytesPerInputFrame - mInputSize;
416            if (copy > inHeader->nFilledLen) {
417                copy = inHeader->nFilledLen;
418            }
419
420            if (mInputFrame == NULL) {
421                mInputFrame = new int16_t[numBytesPerInputFrame / sizeof(int16_t)];
422            }
423
424            if (mInputSize == 0) {
425                mInputTimeUs = inHeader->nTimeStamp;
426            }
427
428            memcpy((uint8_t *)mInputFrame + mInputSize, inData, copy);
429            mInputSize += copy;
430
431            inHeader->nOffset += copy;
432            inHeader->nFilledLen -= copy;
433
434            // "Time" on the input buffer has in effect advanced by the
435            // number of audio frames we just advanced nOffset by.
436            inHeader->nTimeStamp +=
437                (copy * 1000000ll / mSampleRate)
438                    / (mNumChannels * sizeof(int16_t));
439
440            if (inHeader->nFilledLen == 0) {
441                if (inHeader->nFlags & OMX_BUFFERFLAG_EOS) {
442                    mSawInputEOS = true;
443
444                    // Pad any remaining data with zeroes.
445                    memset((uint8_t *)mInputFrame + mInputSize,
446                           0,
447                           numBytesPerInputFrame - mInputSize);
448
449                    mInputSize = numBytesPerInputFrame;
450                }
451
452                inQueue.erase(inQueue.begin());
453                inInfo->mOwnedByUs = false;
454                notifyEmptyBufferDone(inHeader);
455
456                inData = NULL;
457                inHeader = NULL;
458                inInfo = NULL;
459            }
460        }
461
462        // At this  point we have all the input data necessary to encode
463        // a single frame, all we need is an output buffer to store the result
464        // in.
465
466        if (outQueue.empty()) {
467            return;
468        }
469
470        BufferInfo *outInfo = *outQueue.begin();
471        OMX_BUFFERHEADERTYPE *outHeader = outInfo->mHeader;
472
473        uint8_t *outPtr = (uint8_t *)outHeader->pBuffer + outHeader->nOffset;
474        size_t outAvailable = outHeader->nAllocLen - outHeader->nOffset;
475
476        AACENC_InArgs inargs;
477        AACENC_OutArgs outargs;
478        memset(&inargs, 0, sizeof(inargs));
479        memset(&outargs, 0, sizeof(outargs));
480        inargs.numInSamples = numBytesPerInputFrame / sizeof(int16_t);
481
482        void* inBuffer[]        = { (unsigned char *)mInputFrame };
483        INT   inBufferIds[]     = { IN_AUDIO_DATA };
484        INT   inBufferSize[]    = { numBytesPerInputFrame };
485        INT   inBufferElSize[]  = { sizeof(int16_t) };
486
487        AACENC_BufDesc inBufDesc;
488        inBufDesc.numBufs           = sizeof(inBuffer) / sizeof(void*);
489        inBufDesc.bufs              = (void**)&inBuffer;
490        inBufDesc.bufferIdentifiers = inBufferIds;
491        inBufDesc.bufSizes          = inBufferSize;
492        inBufDesc.bufElSizes        = inBufferElSize;
493
494        void* outBuffer[]       = { outPtr };
495        INT   outBufferIds[]    = { OUT_BITSTREAM_DATA };
496        INT   outBufferSize[]   = { 0 };
497        INT   outBufferElSize[] = { sizeof(UCHAR) };
498
499        AACENC_BufDesc outBufDesc;
500        outBufDesc.numBufs           = sizeof(outBuffer) / sizeof(void*);
501        outBufDesc.bufs              = (void**)&outBuffer;
502        outBufDesc.bufferIdentifiers = outBufferIds;
503        outBufDesc.bufSizes          = outBufferSize;
504        outBufDesc.bufElSizes        = outBufferElSize;
505
506        // Encode the mInputFrame, which is treated as a modulo buffer
507        AACENC_ERROR encoderErr = AACENC_OK;
508        size_t nOutputBytes = 0;
509
510        do {
511            memset(&outargs, 0, sizeof(outargs));
512
513            outBuffer[0] = outPtr;
514            outBufferSize[0] = outAvailable - nOutputBytes;
515
516            encoderErr = aacEncEncode(mAACEncoder,
517                                      &inBufDesc,
518                                      &outBufDesc,
519                                      &inargs,
520                                      &outargs);
521
522            if (encoderErr == AACENC_OK) {
523                outPtr += outargs.numOutBytes;
524                nOutputBytes += outargs.numOutBytes;
525
526                if (outargs.numInSamples > 0) {
527                    int numRemainingSamples = inargs.numInSamples - outargs.numInSamples;
528                    if (numRemainingSamples > 0) {
529                        memmove(mInputFrame,
530                                &mInputFrame[outargs.numInSamples],
531                                sizeof(int16_t) * numRemainingSamples);
532                    }
533                    inargs.numInSamples -= outargs.numInSamples;
534                }
535            }
536        } while (encoderErr == AACENC_OK && inargs.numInSamples > 0);
537
538        outHeader->nFilledLen = nOutputBytes;
539
540        outHeader->nFlags = OMX_BUFFERFLAG_ENDOFFRAME;
541
542        if (mSawInputEOS) {
543            // We also tag this output buffer with EOS if it corresponds
544            // to the final input buffer.
545            outHeader->nFlags = OMX_BUFFERFLAG_EOS;
546        }
547
548        outHeader->nTimeStamp = mInputTimeUs;
549
550#if 0
551        ALOGI("sending %d bytes of data (time = %lld us, flags = 0x%08lx)",
552              nOutputBytes, mInputTimeUs, outHeader->nFlags);
553
554        hexdump(outHeader->pBuffer + outHeader->nOffset, outHeader->nFilledLen);
555#endif
556
557        outQueue.erase(outQueue.begin());
558        outInfo->mOwnedByUs = false;
559        notifyFillBufferDone(outHeader);
560
561        outHeader = NULL;
562        outInfo = NULL;
563
564        mInputSize = 0;
565    }
566}
567
568}  // namespace android
569
570android::SoftOMXComponent *createSoftOMXComponent(
571        const char *name, const OMX_CALLBACKTYPE *callbacks,
572        OMX_PTR appData, OMX_COMPONENTTYPE **component) {
573    return new android::SoftAACEncoder2(name, callbacks, appData, component);
574}
575