Chih-Chung Chang | 9969866 | 2011-06-30 14:21:38 +0800 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2011 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #define LOG_NDEBUG 1 |
| 18 | #define LOG_TAG "VideoEditorBGAudioProcessing" |
| 19 | #include <utils/Log.h> |
| 20 | #include "VideoEditorBGAudioProcessing.h" |
| 21 | |
| 22 | namespace android { |
| 23 | |
| 24 | VideoEditorBGAudioProcessing::VideoEditorBGAudioProcessing() { |
| 25 | |
| 26 | LOGV("VideoEditorBGAudioProcessing:: Construct VideoEditorBGAudioProcessing "); |
| 27 | |
| 28 | mAudVolArrIndex = 0; |
| 29 | mDoDucking = 0; |
| 30 | mDucking_enable = 0; |
| 31 | mDucking_lowVolume = 0; |
| 32 | mDucking_threshold = 0; |
| 33 | mDuckingFactor = 0; |
| 34 | |
| 35 | mBTVolLevel = 0; |
| 36 | mPTVolLevel = 0; |
| 37 | |
| 38 | mIsSSRCneeded = 0; |
| 39 | mChannelConversion = 0; |
| 40 | |
| 41 | mBTFormat = MONO_16_BIT; |
| 42 | |
| 43 | mInSampleRate = 8000; |
| 44 | mOutSampleRate = 16000; |
| 45 | mPTChannelCount = 2; |
| 46 | mBTChannelCount = 1; |
| 47 | } |
| 48 | |
| 49 | M4OSA_Int32 VideoEditorBGAudioProcessing::veProcessAudioMixNDuck( |
| 50 | void *pPTBuffer, void *pBTBuffer, void *pOutBuffer) { |
| 51 | |
| 52 | M4AM_Buffer16* pPrimaryTrack = (M4AM_Buffer16*)pPTBuffer; |
| 53 | M4AM_Buffer16* pBackgroundTrack = (M4AM_Buffer16*)pBTBuffer; |
| 54 | M4AM_Buffer16* pMixedOutBuffer = (M4AM_Buffer16*)pOutBuffer; |
| 55 | |
| 56 | LOGV("VideoEditorBGAudioProcessing::lvProcessAudioMixNDuck \ |
| 57 | pPTBuffer 0x%x pBTBuffer 0x%x pOutBuffer 0x%x", pPTBuffer, |
| 58 | pBTBuffer, pOutBuffer); |
| 59 | |
| 60 | M4OSA_ERR result = M4NO_ERROR; |
| 61 | M4OSA_Int16 *pBTMdata1; |
| 62 | M4OSA_Int16 *pPTMdata2; |
| 63 | M4OSA_UInt32 uiPCMsize; |
| 64 | |
| 65 | // Ducking variable |
| 66 | M4OSA_UInt16 loopIndex = 0; |
| 67 | M4OSA_Int16 *pPCM16Sample = M4OSA_NULL; |
| 68 | M4OSA_Int32 peakDbValue = 0; |
| 69 | M4OSA_Int32 previousDbValue = 0; |
| 70 | M4OSA_UInt32 i; |
| 71 | |
| 72 | // Output size if same as PT size |
| 73 | pMixedOutBuffer->m_bufferSize = pPrimaryTrack->m_bufferSize; |
| 74 | |
| 75 | // Before mixing, we need to have only PT as out buffer |
| 76 | memcpy((void *)pMixedOutBuffer->m_dataAddress, |
| 77 | (void *)pPrimaryTrack->m_dataAddress, pMixedOutBuffer->m_bufferSize); |
| 78 | |
| 79 | // Initially contains the input primary track |
| 80 | pPTMdata2 = (M4OSA_Int16*)pMixedOutBuffer->m_dataAddress; |
| 81 | // Contains BG track processed data(like channel conversion etc.. |
| 82 | pBTMdata1 = (M4OSA_Int16*) pBackgroundTrack->m_dataAddress; |
| 83 | |
| 84 | // Since we need to give sample count and not buffer size |
| 85 | uiPCMsize = pMixedOutBuffer->m_bufferSize/2 ; |
| 86 | |
| 87 | if ((mDucking_enable) && (mPTVolLevel != 0.0)) { |
| 88 | // LOGI("VideoEditorBGAudioProcessing:: In Ducking analysis "); |
| 89 | loopIndex = 0; |
| 90 | peakDbValue = 0; |
| 91 | previousDbValue = peakDbValue; |
| 92 | |
| 93 | pPCM16Sample = (M4OSA_Int16*)pPrimaryTrack->m_dataAddress; |
| 94 | |
| 95 | while (loopIndex < pPrimaryTrack->m_bufferSize/sizeof(M4OSA_Int16)) { |
| 96 | if (pPCM16Sample[loopIndex] >= 0) { |
| 97 | peakDbValue = previousDbValue > pPCM16Sample[loopIndex] ? |
| 98 | previousDbValue : pPCM16Sample[loopIndex]; |
| 99 | previousDbValue = peakDbValue; |
| 100 | } else { |
| 101 | peakDbValue = previousDbValue > -pPCM16Sample[loopIndex] ? |
| 102 | previousDbValue: -pPCM16Sample[loopIndex]; |
| 103 | previousDbValue = peakDbValue; |
| 104 | } |
| 105 | loopIndex++; |
| 106 | } |
| 107 | |
| 108 | mAudioVolumeArray[mAudVolArrIndex] = getDecibelSound(peakDbValue); |
| 109 | |
| 110 | LOGV("VideoEditorBGAudioProcessing:: getDecibelSound %d", |
| 111 | mAudioVolumeArray[mAudVolArrIndex]); |
| 112 | |
| 113 | // WINDOW_SIZE is 10 by default |
| 114 | // Check for threshold is done after 10 cycles |
| 115 | if (mAudVolArrIndex >= WINDOW_SIZE - 1) { |
| 116 | mDoDucking = isThresholdBreached(mAudioVolumeArray, |
| 117 | mAudVolArrIndex,mDucking_threshold ); |
| 118 | mAudVolArrIndex = 0; |
| 119 | } else { |
| 120 | mAudVolArrIndex++; |
| 121 | } |
| 122 | |
| 123 | // |
| 124 | // Below logic controls the mixing weightage |
| 125 | // for Background and Primary Tracks |
| 126 | // for the duration of window under analysis, |
| 127 | // to give fade-out for Background and fade-in for primary |
| 128 | // Current fading factor is distributed in equal range over |
| 129 | // the defined window size. |
| 130 | // For a window size = 25 |
| 131 | // (500 ms (window under analysis) / 20 ms (sample duration)) |
| 132 | // |
| 133 | |
| 134 | if (mDoDucking) { |
| 135 | if (mDuckingFactor > mDucking_lowVolume) { |
| 136 | // FADE OUT BG Track |
| 137 | // Increment ducking factor in total steps in factor |
| 138 | // of low volume steps to reach low volume level |
| 139 | mDuckingFactor -= (mDucking_lowVolume); |
| 140 | } else { |
| 141 | mDuckingFactor = mDucking_lowVolume; |
| 142 | } |
| 143 | } else { |
| 144 | if (mDuckingFactor < 1.0 ) { |
| 145 | // FADE IN BG Track |
| 146 | // Increment ducking factor in total steps of |
| 147 | // low volume factor to reach orig.volume level |
| 148 | mDuckingFactor += (mDucking_lowVolume); |
| 149 | } else { |
| 150 | mDuckingFactor = 1.0; |
| 151 | } |
| 152 | } |
| 153 | } // end if - mDucking_enable |
| 154 | |
| 155 | |
| 156 | // Mixing Logic |
| 157 | |
| 158 | LOGV("VideoEditorBGAudioProcessing:: Out of Ducking analysis uiPCMsize\ |
| 159 | %d %f %f", mDoDucking, mDuckingFactor,mBTVolLevel); |
| 160 | |
| 161 | while (uiPCMsize-- > 0) { |
| 162 | |
| 163 | M4OSA_Int32 temp; |
| 164 | // Set vol factor for BT and PT |
| 165 | *pBTMdata1 = (M4OSA_Int16)(*pBTMdata1*mBTVolLevel); |
| 166 | *pPTMdata2 = (M4OSA_Int16)(*pPTMdata2*mPTVolLevel); |
| 167 | |
| 168 | // Mix the two samples |
| 169 | if (mDoDucking) { |
| 170 | |
| 171 | // Duck the BG track to ducking factor value before mixing |
| 172 | *pBTMdata1 = (M4OSA_Int16)((*pBTMdata1)*(mDuckingFactor)); |
| 173 | |
| 174 | // mix as normal case |
| 175 | *pBTMdata1 = (M4OSA_Int16)(*pBTMdata1 /2 + *pPTMdata2 /2); |
| 176 | } else { |
| 177 | |
| 178 | *pBTMdata1 = (M4OSA_Int16)((*pBTMdata1)*(mDuckingFactor)); |
| 179 | *pBTMdata1 = (M4OSA_Int16)(*pBTMdata1 /2 + *pPTMdata2 /2); |
| 180 | } |
| 181 | |
| 182 | if (*pBTMdata1 < 0) { |
| 183 | temp = -(*pBTMdata1) * 2; // bring to original Amplitude level |
| 184 | |
| 185 | if (temp > 32767) { |
| 186 | *pBTMdata1 = -32766; // less then max allowed value |
| 187 | } else { |
| 188 | *pBTMdata1 = (M4OSA_Int16)(-temp); |
| 189 | } |
| 190 | } else { |
| 191 | temp = (*pBTMdata1) * 2; // bring to original Amplitude level |
| 192 | if ( temp > 32768) { |
| 193 | *pBTMdata1 = 32767; // less than max allowed value |
| 194 | } else { |
| 195 | *pBTMdata1 = (M4OSA_Int16)temp; |
| 196 | } |
| 197 | } |
| 198 | |
| 199 | pBTMdata1++; |
| 200 | pPTMdata2++; |
| 201 | } |
| 202 | //LOGV("VideoEditorBGAudioProcessing:: Copy final out "); |
| 203 | memcpy((void *)pMixedOutBuffer->m_dataAddress, |
| 204 | (void *)pBackgroundTrack->m_dataAddress, |
| 205 | pBackgroundTrack->m_bufferSize); |
| 206 | |
| 207 | LOGV("VideoEditorBGAudioProcessing::lvProcessAudioMixNDuck EXIT"); |
| 208 | return result; |
| 209 | } |
| 210 | |
| 211 | VideoEditorBGAudioProcessing::~VideoEditorBGAudioProcessing() { |
| 212 | |
| 213 | } |
| 214 | |
| 215 | M4OSA_Int32 VideoEditorBGAudioProcessing::calculateOutResampleBufSize() { |
| 216 | |
| 217 | // This already takes care of channel count in mBTBuffer.m_bufferSize |
| 218 | return (mOutSampleRate / mInSampleRate) * mBTBuffer.m_bufferSize; |
| 219 | } |
| 220 | |
| 221 | void VideoEditorBGAudioProcessing ::veSetAudioProcessingParams( |
| 222 | const veAudMixSettings& gInputParams) { |
| 223 | |
| 224 | LOGV("VideoEditorBGAudioProcessing:: ENTER lvSetAudioProcessingParams "); |
| 225 | mDucking_enable = gInputParams.lvInDucking_enable; |
| 226 | mDucking_lowVolume = gInputParams.lvInDucking_lowVolume; |
| 227 | mDucking_threshold = gInputParams.lvInDucking_threshold; |
| 228 | |
| 229 | mPTVolLevel = gInputParams.lvPTVolLevel; |
| 230 | mBTVolLevel = gInputParams.lvBTVolLevel ; |
| 231 | |
| 232 | mBTChannelCount = gInputParams.lvBTChannelCount; |
| 233 | mPTChannelCount = gInputParams.lvPTChannelCount; |
| 234 | |
| 235 | mBTFormat = gInputParams.lvBTFormat; |
| 236 | |
| 237 | mInSampleRate = gInputParams.lvInSampleRate; |
| 238 | mOutSampleRate = gInputParams.lvOutSampleRate; |
| 239 | |
| 240 | mAudVolArrIndex = 0; |
| 241 | mDoDucking = 0; |
| 242 | mDuckingFactor = 1.0; // default |
| 243 | |
| 244 | LOGV("VideoEditorBGAudioProcessing:: ducking_enable 0x%x \ |
| 245 | ducking_lowVolume %f ducking_threshold %d fPTVolLevel %f BTVolLevel %f", |
| 246 | mDucking_enable, mDucking_lowVolume, mDucking_threshold, |
| 247 | mPTVolLevel, mPTVolLevel); |
| 248 | |
| 249 | // Following logc decides if SSRC support is needed for this mixing |
| 250 | mIsSSRCneeded = (gInputParams.lvInSampleRate != gInputParams.lvOutSampleRate); |
| 251 | if (gInputParams.lvBTChannelCount != gInputParams.lvPTChannelCount){ |
| 252 | if (gInputParams.lvBTChannelCount == 2){ |
| 253 | mChannelConversion = 1; // convert to MONO |
| 254 | } else { |
| 255 | mChannelConversion = 2; // Convert to STEREO |
| 256 | } |
| 257 | } else { |
| 258 | mChannelConversion = 0; |
| 259 | } |
| 260 | LOGV("VideoEditorBGAudioProcessing:: EXIT veSetAudioProcessingParams "); |
| 261 | } |
| 262 | |
| 263 | |
| 264 | // Fast way to compute 10 * log(value) |
| 265 | M4OSA_Int32 VideoEditorBGAudioProcessing::getDecibelSound(M4OSA_UInt32 value) { |
| 266 | if (value <= 0 || value > 0x8000) { |
| 267 | return 0; |
| 268 | } else if (value > 0x4000) { // 32768 |
| 269 | return 90; |
| 270 | } else if (value > 0x2000) { // 16384 |
| 271 | return 84; |
| 272 | } else if (value > 0x1000) { // 8192 |
| 273 | return 78; |
| 274 | } else if (value > 0x0800) { // 4028 |
| 275 | return 72; |
| 276 | } else if (value > 0x0400) { // 2048 |
| 277 | return 66; |
| 278 | } else if (value > 0x0200) { // 1024 |
| 279 | return 60; |
| 280 | } else if (value > 0x0100) { // 512 |
| 281 | return 54; |
| 282 | } else if (value > 0x0080) { // 256 |
| 283 | return 48; |
| 284 | } else if (value > 0x0040) { // 128 |
| 285 | return 42; |
| 286 | } else if (value > 0x0020) { // 64 |
| 287 | return 36; |
| 288 | } else if (value > 0x0010) { // 32 |
| 289 | return 30; |
| 290 | } else if (value > 0x0008) { // 16 |
| 291 | return 24; |
| 292 | } else if (value > 0x0007) { // 8 |
| 293 | return 24; |
| 294 | } else if (value > 0x0003) { // 4 |
| 295 | return 18; |
| 296 | } else if (value > 0x0001) { // 2 |
| 297 | return 12; |
| 298 | } else { // 1 |
| 299 | return 6; |
| 300 | } |
| 301 | } |
| 302 | |
| 303 | M4OSA_Bool VideoEditorBGAudioProcessing::isThresholdBreached( |
| 304 | M4OSA_Int32* averageValue, |
| 305 | M4OSA_Int32 storeCount, |
| 306 | M4OSA_Int32 thresholdValue) { |
| 307 | |
| 308 | int totalValue = 0; |
| 309 | for (int i = 0; i < storeCount; ++i) { |
| 310 | totalValue += averageValue[i]; |
| 311 | } |
| 312 | return (totalValue / storeCount > thresholdValue); |
| 313 | } |
| 314 | |
| 315 | }//namespace android |