Home | History | Annotate | Download | only in webaudio
      1 /*
      2  * Copyright (C) 2010, Google Inc. All rights reserved.
      3  *
      4  * Redistribution and use in source and binary forms, with or without
      5  * modification, are permitted provided that the following conditions
      6  * are met:
      7  * 1.  Redistributions of source code must retain the above copyright
      8  *    notice, this list of conditions and the following disclaimer.
      9  * 2.  Redistributions in binary form must reproduce the above copyright
     10  *    notice, this list of conditions and the following disclaimer in the
     11  *    documentation and/or other materials provided with the distribution.
     12  *
     13  * THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS'' AND ANY
     14  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
     15  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
     16  * DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS BE LIABLE FOR ANY
     17  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
     18  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
     19  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
     20  * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     21  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
     22  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     23  */
     24 
     25 #include "config.h"
     26 
     27 #if ENABLE(WEB_AUDIO)
     28 
     29 #include "RealtimeAnalyser.h"
     30 
     31 #include "AudioBus.h"
     32 #include "AudioUtilities.h"
     33 #include "FFTFrame.h"
     34 
     35 #if ENABLE(WEBGL)
     36 #include "Float32Array.h"
     37 #include "Uint8Array.h"
     38 #endif
     39 
     40 #include <algorithm>
     41 #include <limits.h>
     42 #include <wtf/Complex.h>
     43 #include <wtf/MathExtras.h>
     44 #include <wtf/Threading.h>
     45 
     46 using namespace std;
     47 
     48 namespace WebCore {
     49 
     50 const double RealtimeAnalyser::DefaultSmoothingTimeConstant  = 0.8;
     51 const double RealtimeAnalyser::DefaultMinDecibels = -100.0;
     52 const double RealtimeAnalyser::DefaultMaxDecibels = -30.0;
     53 
     54 const unsigned RealtimeAnalyser::DefaultFFTSize = 2048;
     55 const unsigned RealtimeAnalyser::MaxFFTSize = 2048;
     56 const unsigned RealtimeAnalyser::InputBufferSize = RealtimeAnalyser::MaxFFTSize * 2;
     57 
     58 RealtimeAnalyser::RealtimeAnalyser()
     59     : m_inputBuffer(InputBufferSize)
     60     , m_writeIndex(0)
     61     , m_fftSize(DefaultFFTSize)
     62     , m_magnitudeBuffer(DefaultFFTSize / 2)
     63     , m_smoothingTimeConstant(DefaultSmoothingTimeConstant)
     64     , m_minDecibels(DefaultMinDecibels)
     65     , m_maxDecibels(DefaultMaxDecibels)
     66 {
     67     m_analysisFrame = adoptPtr(new FFTFrame(DefaultFFTSize));
     68 }
     69 
     70 RealtimeAnalyser::~RealtimeAnalyser()
     71 {
     72 }
     73 
     74 void RealtimeAnalyser::reset()
     75 {
     76     m_writeIndex = 0;
     77     m_inputBuffer.zero();
     78     m_magnitudeBuffer.zero();
     79 }
     80 
     81 void RealtimeAnalyser::setFftSize(size_t size)
     82 {
     83     ASSERT(isMainThread());
     84 
     85     // Only allow powers of two.
     86     unsigned log2size = static_cast<unsigned>(log2(size));
     87     bool isPOT(1UL << log2size == size);
     88 
     89     if (!isPOT || size > MaxFFTSize) {
     90         // FIXME: It would be good to also set an exception.
     91         return;
     92     }
     93 
     94     if (m_fftSize != size) {
     95         m_analysisFrame = adoptPtr(new FFTFrame(m_fftSize));
     96         m_magnitudeBuffer.resize(size);
     97         m_fftSize = size;
     98     }
     99 }
    100 
    101 void RealtimeAnalyser::writeInput(AudioBus* bus, size_t framesToProcess)
    102 {
    103     bool isBusGood = bus && bus->numberOfChannels() > 0 && bus->channel(0)->length() >= framesToProcess;
    104     ASSERT(isBusGood);
    105     if (!isBusGood)
    106         return;
    107 
    108     // FIXME : allow to work with non-FFTSize divisible chunking
    109     bool isDestinationGood = m_writeIndex < m_inputBuffer.size() && m_writeIndex + framesToProcess <= m_inputBuffer.size();
    110     ASSERT(isDestinationGood);
    111     if (!isDestinationGood)
    112         return;
    113 
    114     // Perform real-time analysis
    115     // FIXME : for now just use left channel (must mix if stereo source)
    116     float* source = bus->channel(0)->data();
    117 
    118     // The source has already been sanity checked with isBusGood above.
    119 
    120     memcpy(m_inputBuffer.data() + m_writeIndex, source, sizeof(float) * framesToProcess);
    121 
    122     m_writeIndex += framesToProcess;
    123     if (m_writeIndex >= InputBufferSize)
    124         m_writeIndex = 0;
    125 }
    126 
    127 namespace {
    128 
    129 void applyWindow(float* p, size_t n)
    130 {
    131     ASSERT(isMainThread());
    132 
    133     // Blackman window
    134     double alpha = 0.16;
    135     double a0 = 0.5 * (1.0 - alpha);
    136     double a1 = 0.5;
    137     double a2 = 0.5 * alpha;
    138 
    139     for (unsigned i = 0; i < n; ++i) {
    140         double x = static_cast<double>(i) / static_cast<double>(n);
    141         double window = a0 - a1 * cos(2.0 * piDouble * x) + a2 * cos(4.0 * piDouble * x);
    142         p[i] *= float(window);
    143     }
    144 }
    145 
    146 } // namespace
    147 
    148 void RealtimeAnalyser::doFFTAnalysis()
    149 {
    150     ASSERT(isMainThread());
    151 
    152     // Unroll the input buffer into a temporary buffer, where we'll apply an analysis window followed by an FFT.
    153     size_t fftSize = this->fftSize();
    154 
    155     AudioFloatArray temporaryBuffer(fftSize);
    156     float* inputBuffer = m_inputBuffer.data();
    157     float* tempP = temporaryBuffer.data();
    158 
    159     // Take the previous fftSize values from the input buffer and copy into the temporary buffer.
    160     // FIXME : optimize with memcpy().
    161     unsigned writeIndex = m_writeIndex;
    162     for (unsigned i = 0; i < fftSize; ++i)
    163         tempP[i] = inputBuffer[(i + writeIndex - fftSize + InputBufferSize) % InputBufferSize];
    164 
    165     // Window the input samples.
    166     applyWindow(tempP, fftSize);
    167 
    168     // Do the analysis.
    169     m_analysisFrame->doFFT(tempP);
    170 
    171     size_t n = DefaultFFTSize / 2;
    172 
    173     float* realP = m_analysisFrame->realData();
    174     float* imagP = m_analysisFrame->imagData();
    175 
    176     // Blow away the packed nyquist component.
    177     imagP[0] = 0.0f;
    178 
    179     // Normalize so than an input sine wave at 0dBfs registers as 0dBfs (undo FFT scaling factor).
    180     const double MagnitudeScale = 1.0 / DefaultFFTSize;
    181 
    182     // A value of 0 does no averaging with the previous result.  Larger values produce slower, but smoother changes.
    183     double k = m_smoothingTimeConstant;
    184     k = max(0.0, k);
    185     k = min(1.0, k);
    186 
    187     // Convert the analysis data from complex to magnitude and average with the previous result.
    188     float* destination = magnitudeBuffer().data();
    189     for (unsigned i = 0; i < n; ++i) {
    190         Complex c(realP[i], imagP[i]);
    191         double scalarMagnitude = abs(c) * MagnitudeScale;
    192         destination[i] = float(k * destination[i] + (1.0 - k) * scalarMagnitude);
    193     }
    194 }
    195 
    196 #if ENABLE(WEBGL)
    197 
    198 void RealtimeAnalyser::getFloatFrequencyData(Float32Array* destinationArray)
    199 {
    200     ASSERT(isMainThread());
    201 
    202     if (!destinationArray)
    203         return;
    204 
    205     doFFTAnalysis();
    206 
    207     // Convert from linear magnitude to floating-point decibels.
    208     const double MinDecibels = m_minDecibels;
    209     unsigned sourceLength = magnitudeBuffer().size();
    210     size_t len = min(sourceLength, destinationArray->length());
    211     if (len > 0) {
    212         const float* source = magnitudeBuffer().data();
    213         float* destination = destinationArray->data();
    214 
    215         for (unsigned i = 0; i < len; ++i) {
    216             float linearValue = source[i];
    217             double dbMag = !linearValue ? MinDecibels : AudioUtilities::linearToDecibels(linearValue);
    218             destination[i] = float(dbMag);
    219         }
    220     }
    221 }
    222 
    223 void RealtimeAnalyser::getByteFrequencyData(Uint8Array* destinationArray)
    224 {
    225     ASSERT(isMainThread());
    226 
    227     if (!destinationArray)
    228         return;
    229 
    230     doFFTAnalysis();
    231 
    232     // Convert from linear magnitude to unsigned-byte decibels.
    233     unsigned sourceLength = magnitudeBuffer().size();
    234     size_t len = min(sourceLength, destinationArray->length());
    235     if (len > 0) {
    236         const double RangeScaleFactor = m_maxDecibels == m_minDecibels ? 1.0 : 1.0 / (m_maxDecibels - m_minDecibels);
    237 
    238         const float* source = magnitudeBuffer().data();
    239         unsigned char* destination = destinationArray->data();
    240 
    241         for (unsigned i = 0; i < len; ++i) {
    242             float linearValue = source[i];
    243             double dbMag = !linearValue ? m_minDecibels : AudioUtilities::linearToDecibels(linearValue);
    244 
    245             // The range m_minDecibels to m_maxDecibels will be scaled to byte values from 0 to UCHAR_MAX.
    246             double scaledValue = UCHAR_MAX * (dbMag - m_minDecibels) * RangeScaleFactor;
    247 
    248             // Clip to valid range.
    249             if (scaledValue < 0.0)
    250                 scaledValue = 0.0;
    251             if (scaledValue > UCHAR_MAX)
    252                 scaledValue = UCHAR_MAX;
    253 
    254             destination[i] = static_cast<unsigned char>(scaledValue);
    255         }
    256     }
    257 }
    258 
    259 void RealtimeAnalyser::getByteTimeDomainData(Uint8Array* destinationArray)
    260 {
    261     ASSERT(isMainThread());
    262 
    263     if (!destinationArray)
    264         return;
    265 
    266     unsigned fftSize = this->fftSize();
    267     size_t len = min(fftSize, destinationArray->length());
    268     if (len > 0) {
    269         bool isInputBufferGood = m_inputBuffer.size() == InputBufferSize && m_inputBuffer.size() > fftSize;
    270         ASSERT(isInputBufferGood);
    271         if (!isInputBufferGood)
    272             return;
    273 
    274         float* inputBuffer = m_inputBuffer.data();
    275         unsigned char* destination = destinationArray->data();
    276 
    277         unsigned writeIndex = m_writeIndex;
    278 
    279         for (unsigned i = 0; i < len; ++i) {
    280             // Buffer access is protected due to modulo operation.
    281             float value = inputBuffer[(i + writeIndex - fftSize + InputBufferSize) % InputBufferSize];
    282 
    283             // Scale from nominal -1.0 -> +1.0 to unsigned byte.
    284             double scaledValue = 128.0 * (value + 1.0);
    285 
    286             // Clip to valid range.
    287             if (scaledValue < 0.0)
    288                 scaledValue = 0.0;
    289             if (scaledValue > UCHAR_MAX)
    290                 scaledValue = UCHAR_MAX;
    291 
    292             destination[i] = static_cast<unsigned char>(scaledValue);
    293         }
    294     }
    295 }
    296 
    297 #endif // WEBGL
    298 
    299 } // namespace WebCore
    300 
    301 #endif // ENABLE(WEB_AUDIO)
    302