/* * Copyright (C) 2009 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ //#define LOG_NDEBUG 0 #define LOG_TAG "Utils" #include #include "include/ESDS.h" #include #include #include #include #include #include #ifdef QCOM_ENHANCED_AUDIO #include #include #include #include #include "include/avc_utils.h" #include "include/QCUtilityClass.h" #endif namespace android { uint16_t U16_AT(const uint8_t *ptr) { return ptr[0] << 8 | ptr[1]; } uint32_t U32_AT(const uint8_t *ptr) { return ptr[0] << 24 | ptr[1] << 16 | ptr[2] << 8 | ptr[3]; } uint64_t U64_AT(const uint8_t *ptr) { return ((uint64_t)U32_AT(ptr)) << 32 | U32_AT(ptr + 4); } uint16_t U16LE_AT(const uint8_t *ptr) { return ptr[0] | (ptr[1] << 8); } uint32_t U32LE_AT(const uint8_t *ptr) { return ptr[3] << 24 | ptr[2] << 16 | ptr[1] << 8 | ptr[0]; } uint64_t U64LE_AT(const uint8_t *ptr) { return ((uint64_t)U32LE_AT(ptr + 4)) << 32 | U32LE_AT(ptr); } // XXX warning: these won't work on big-endian host. uint64_t ntoh64(uint64_t x) { return ((uint64_t)ntohl(x & 0xffffffff) << 32) | ntohl(x >> 32); } uint64_t hton64(uint64_t x) { return ((uint64_t)htonl(x & 0xffffffff) << 32) | htonl(x >> 32); } status_t convertMetaDataToMessage( const sp &meta, sp *format) { format->clear(); const char *mime; CHECK(meta->findCString(kKeyMIMEType, &mime)); sp msg = new AMessage; msg->setString("mime", mime); int64_t durationUs; if (meta->findInt64(kKeyDuration, &durationUs)) { msg->setInt64("durationUs", durationUs); } if (!strncasecmp("video/", mime, 6)) { int32_t width, height; CHECK(meta->findInt32(kKeyWidth, &width)); CHECK(meta->findInt32(kKeyHeight, &height)); msg->setInt32("width", width); msg->setInt32("height", height); } else if (!strncasecmp("audio/", mime, 6)) { int32_t numChannels, sampleRate; CHECK(meta->findInt32(kKeyChannelCount, &numChannels)); CHECK(meta->findInt32(kKeySampleRate, &sampleRate)); msg->setInt32("channel-count", numChannels); msg->setInt32("sample-rate", sampleRate); int32_t channelMask; if (meta->findInt32(kKeyChannelMask, &channelMask)) { msg->setInt32("channel-mask", channelMask); } int32_t delay = 0; if (meta->findInt32(kKeyEncoderDelay, &delay)) { msg->setInt32("encoder-delay", delay); } int32_t padding = 0; if (meta->findInt32(kKeyEncoderPadding, &padding)) { msg->setInt32("encoder-padding", padding); } int32_t isADTS; if (meta->findInt32(kKeyIsADTS, &isADTS)) { msg->setInt32("is-adts", true); } #ifdef QCOM_ENHANCED_AUDIO int32_t keyWMAVersion; if (meta->findInt32(kKeyWMAVersion, &keyWMAVersion)) { msg->setInt32("WMA-Version", keyWMAVersion); } int32_t bitRate; int32_t encodeOptions; int32_t blockAlign; int32_t bitspersample; int32_t formattag; int32_t advencopt1; int32_t advencopt2; int32_t VirtualPktSize; if (meta->findInt32(kKeyWMABitspersample, &bitspersample)) { msg->setInt32("bsps", bitspersample); } if (meta->findInt32(kKeyWMAFormatTag, &formattag)) { msg->setInt32("fmtt", formattag); } if (meta->findInt32(kKeyWMAAdvEncOpt1, &advencopt1)) { msg->setInt32("ade1", advencopt1); } if (meta->findInt32(kKeyWMAAdvEncOpt2, &advencopt2)) { msg->setInt32("ade2", advencopt2); } if (meta->findInt32(kKeyWMAVirPktSize, &VirtualPktSize)) { msg->setInt32("vpks", VirtualPktSize); } if (meta->findInt32(kKeyBitRate, &bitRate)) { msg->setInt32("brte", bitRate); } if (meta->findInt32(kKeyWMAEncodeOpt, &encodeOptions)) { msg->setInt32("eopt", encodeOptions); } if (meta->findInt32(kKeyWMABlockAlign, &blockAlign)) { msg->setInt32("blka", blockAlign); } #endif } int32_t maxInputSize; if (meta->findInt32(kKeyMaxInputSize, &maxInputSize)) { msg->setInt32("max-input-size", maxInputSize); } uint32_t type; const void *data; size_t size; if (meta->findData(kKeyAVCC, &type, &data, &size)) { // Parse the AVCDecoderConfigurationRecord const uint8_t *ptr = (const uint8_t *)data; CHECK(size >= 7); CHECK_EQ((unsigned)ptr[0], 1u); // configurationVersion == 1 uint8_t profile = ptr[1]; uint8_t level = ptr[3]; // There is decodable content out there that fails the following // assertion, let's be lenient for now... // CHECK((ptr[4] >> 2) == 0x3f); // reserved size_t lengthSize = 1 + (ptr[4] & 3); // commented out check below as H264_QVGA_500_NO_AUDIO.3gp // violates it... // CHECK((ptr[5] >> 5) == 7); // reserved size_t numSeqParameterSets = ptr[5] & 31; ptr += 6; size -= 6; sp buffer = new ABuffer(1024); buffer->setRange(0, 0); for (size_t i = 0; i < numSeqParameterSets; ++i) { CHECK(size >= 2); size_t length = U16_AT(ptr); ptr += 2; size -= 2; CHECK(size >= length); memcpy(buffer->data() + buffer->size(), "\x00\x00\x00\x01", 4); memcpy(buffer->data() + buffer->size() + 4, ptr, length); buffer->setRange(0, buffer->size() + 4 + length); ptr += length; size -= length; } buffer->meta()->setInt32("csd", true); buffer->meta()->setInt64("timeUs", 0); msg->setBuffer("csd-0", buffer); buffer = new ABuffer(1024); buffer->setRange(0, 0); CHECK(size >= 1); size_t numPictureParameterSets = *ptr; ++ptr; --size; for (size_t i = 0; i < numPictureParameterSets; ++i) { CHECK(size >= 2); size_t length = U16_AT(ptr); ptr += 2; size -= 2; CHECK(size >= length); memcpy(buffer->data() + buffer->size(), "\x00\x00\x00\x01", 4); memcpy(buffer->data() + buffer->size() + 4, ptr, length); buffer->setRange(0, buffer->size() + 4 + length); ptr += length; size -= length; } buffer->meta()->setInt32("csd", true); buffer->meta()->setInt64("timeUs", 0); msg->setBuffer("csd-1", buffer); } else if (meta->findData(kKeyESDS, &type, &data, &size)) { ESDS esds((const char *)data, size); CHECK_EQ(esds.InitCheck(), (status_t)OK); const void *codec_specific_data; size_t codec_specific_data_size; esds.getCodecSpecificInfo( &codec_specific_data, &codec_specific_data_size); sp buffer = new ABuffer(codec_specific_data_size); memcpy(buffer->data(), codec_specific_data, codec_specific_data_size); buffer->meta()->setInt32("csd", true); buffer->meta()->setInt64("timeUs", 0); msg->setBuffer("csd-0", buffer); } else if (meta->findData(kKeyVorbisInfo, &type, &data, &size)) { sp buffer = new ABuffer(size); memcpy(buffer->data(), data, size); buffer->meta()->setInt32("csd", true); buffer->meta()->setInt64("timeUs", 0); msg->setBuffer("csd-0", buffer); if (!meta->findData(kKeyVorbisBooks, &type, &data, &size)) { return -EINVAL; } buffer = new ABuffer(size); memcpy(buffer->data(), data, size); buffer->meta()->setInt32("csd", true); buffer->meta()->setInt64("timeUs", 0); msg->setBuffer("csd-1", buffer); } *format = msg; return OK; } static size_t reassembleAVCC(const sp &csd0, const sp csd1, char *avcc) { avcc[0] = 1; // version avcc[1] = 0x64; // profile avcc[2] = 0; // unused (?) avcc[3] = 0xd; // level avcc[4] = 0xff; // reserved+size size_t i = 0; int numparams = 0; int lastparamoffset = 0; int avccidx = 6; do { if (i >= csd0->size() - 4 || memcmp(csd0->data() + i, "\x00\x00\x00\x01", 4) == 0) { if (i >= csd0->size() - 4) { // there can't be another param here, so use all the rest i = csd0->size(); } ALOGV("block at %d, last was %d", i, lastparamoffset); if (lastparamoffset > 0) { int size = i - lastparamoffset; avcc[avccidx++] = size >> 8; avcc[avccidx++] = size & 0xff; memcpy(avcc+avccidx, csd0->data() + lastparamoffset, size); avccidx += size; numparams++; } i += 4; lastparamoffset = i; } else { i++; } } while(i < csd0->size()); ALOGV("csd0 contains %d params", numparams); avcc[5] = 0xe0 | numparams; //and now csd-1 i = 0; numparams = 0; lastparamoffset = 0; int numpicparamsoffset = avccidx; avccidx++; do { if (i >= csd1->size() - 4 || memcmp(csd1->data() + i, "\x00\x00\x00\x01", 4) == 0) { if (i >= csd1->size() - 4) { // there can't be another param here, so use all the rest i = csd1->size(); } ALOGV("block at %d, last was %d", i, lastparamoffset); if (lastparamoffset > 0) { int size = i - lastparamoffset; avcc[avccidx++] = size >> 8; avcc[avccidx++] = size & 0xff; memcpy(avcc+avccidx, csd1->data() + lastparamoffset, size); avccidx += size; numparams++; } i += 4; lastparamoffset = i; } else { i++; } } while(i < csd1->size()); avcc[numpicparamsoffset] = numparams; return avccidx; } static void reassembleESDS(const sp &csd0, char *esds) { int csd0size = csd0->size(); esds[0] = 3; // kTag_ESDescriptor; int esdescriptorsize = 26 + csd0size; CHECK(esdescriptorsize < 268435456); // 7 bits per byte, so max is 2^28-1 esds[1] = 0x80 | (esdescriptorsize >> 21); esds[2] = 0x80 | ((esdescriptorsize >> 14) & 0x7f); esds[3] = 0x80 | ((esdescriptorsize >> 7) & 0x7f); esds[4] = (esdescriptorsize & 0x7f); esds[5] = esds[6] = 0; // es id esds[7] = 0; // flags esds[8] = 4; // kTag_DecoderConfigDescriptor int configdescriptorsize = 18 + csd0size; esds[9] = 0x80 | (configdescriptorsize >> 21); esds[10] = 0x80 | ((configdescriptorsize >> 14) & 0x7f); esds[11] = 0x80 | ((configdescriptorsize >> 7) & 0x7f); esds[12] = (configdescriptorsize & 0x7f); esds[13] = 0x40; // objectTypeIndication esds[14] = 0x15; // not sure what 14-25 mean, they are ignored by ESDS.cpp, esds[15] = 0x00; // but the actual values here were taken from a real file. esds[16] = 0x18; esds[17] = 0x00; esds[18] = 0x00; esds[19] = 0x00; esds[20] = 0xfa; esds[21] = 0x00; esds[22] = 0x00; esds[23] = 0x00; esds[24] = 0xfa; esds[25] = 0x00; esds[26] = 5; // kTag_DecoderSpecificInfo; esds[27] = 0x80 | (csd0size >> 21); esds[28] = 0x80 | ((csd0size >> 14) & 0x7f); esds[29] = 0x80 | ((csd0size >> 7) & 0x7f); esds[30] = (csd0size & 0x7f); memcpy((void*)&esds[31], csd0->data(), csd0size); // data following this is ignored, so don't bother appending it } void convertMessageToMetaData(const sp &msg, sp &meta) { AString mime; if (msg->findString("mime", &mime)) { meta->setCString(kKeyMIMEType, mime.c_str()); } else { ALOGW("did not find mime type"); } int64_t durationUs; if (msg->findInt64("durationUs", &durationUs)) { meta->setInt64(kKeyDuration, durationUs); } if (mime.startsWith("video/")) { int32_t width; int32_t height; if (msg->findInt32("width", &width) && msg->findInt32("height", &height)) { meta->setInt32(kKeyWidth, width); meta->setInt32(kKeyHeight, height); } else { ALOGW("did not find width and/or height"); } } else if (mime.startsWith("audio/")) { int32_t numChannels; if (msg->findInt32("channel-count", &numChannels)) { meta->setInt32(kKeyChannelCount, numChannels); } int32_t sampleRate; if (msg->findInt32("sample-rate", &sampleRate)) { meta->setInt32(kKeySampleRate, sampleRate); } int32_t channelMask; if (msg->findInt32("channel-mask", &channelMask)) { meta->setInt32(kKeyChannelMask, channelMask); } int32_t delay = 0; if (msg->findInt32("encoder-delay", &delay)) { meta->setInt32(kKeyEncoderDelay, delay); } int32_t padding = 0; if (msg->findInt32("encoder-padding", &padding)) { meta->setInt32(kKeyEncoderPadding, padding); } int32_t isADTS; if (msg->findInt32("is-adts", &isADTS)) { meta->setInt32(kKeyIsADTS, isADTS); } } int32_t maxInputSize; if (msg->findInt32("max-input-size", &maxInputSize)) { meta->setInt32(kKeyMaxInputSize, maxInputSize); } // reassemble the csd data into its original form sp csd0; if (msg->findBuffer("csd-0", &csd0)) { if (mime.startsWith("video/")) { // do we need to be stricter than this? sp csd1; if (msg->findBuffer("csd-1", &csd1)) { char avcc[1024]; // that oughta be enough, right? size_t outsize = reassembleAVCC(csd0, csd1, avcc); meta->setData(kKeyAVCC, kKeyAVCC, avcc, outsize); } } else if (mime.startsWith("audio/")) { int csd0size = csd0->size(); char esds[csd0size + 31]; reassembleESDS(csd0, esds); meta->setData(kKeyESDS, kKeyESDS, esds, sizeof(esds)); } } // XXX TODO add whatever other keys there are #if 0 ALOGI("converted %s to:", msg->debugString(0).c_str()); meta->dumpToLog(); #endif } } // namespace android