Source/WebCore/webaudio/RealtimeAnalyser.cpp - WebKit - Git at Google

 /*
  * Copyright (C) 2010, Google Inc. All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1.  Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2.  Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS'' AND ANY
  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
  * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
  * DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS BE LIABLE FOR ANY
  * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
  * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
  * ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */

 #include "config.h"

 #if ENABLE(WEB_AUDIO)

 #include "RealtimeAnalyser.h"

 #include "AudioBus.h"
 #include "AudioUtilities.h"
 #include "FFTFrame.h"

 #include <algorithm>
 #include <limits.h>
 #include <wtf/Complex.h>
 #include <wtf/Float32Array.h>
 #include <wtf/MainThread.h>
 #include <wtf/MathExtras.h>
 #include <wtf/Uint8Array.h>

 using namespace std;

 namespace WebCore {

 const double RealtimeAnalyser::DefaultSmoothingTimeConstant  = 0.8;
 const double RealtimeAnalyser::DefaultMinDecibels = -100.0;
 const double RealtimeAnalyser::DefaultMaxDecibels = -30.0;

 const unsigned RealtimeAnalyser::DefaultFFTSize = 2048;
 // All FFT implementations are expected to handle power-of-two sizes MinFFTSize <= size <= MaxFFTSize.
 const unsigned RealtimeAnalyser::MinFFTSize = 128;
 const unsigned RealtimeAnalyser::MaxFFTSize = 2048;
 const unsigned RealtimeAnalyser::InputBufferSize = RealtimeAnalyser::MaxFFTSize * 2;

 RealtimeAnalyser::RealtimeAnalyser()
     : m_inputBuffer(InputBufferSize)
     , m_writeIndex(0)
     , m_fftSize(DefaultFFTSize)
     , m_magnitudeBuffer(DefaultFFTSize / 2)
     , m_smoothingTimeConstant(DefaultSmoothingTimeConstant)
     , m_minDecibels(DefaultMinDecibels)
     , m_maxDecibels(DefaultMaxDecibels)
 {
     m_analysisFrame = adoptPtr(new FFTFrame(DefaultFFTSize));
 }

 RealtimeAnalyser::~RealtimeAnalyser()
 {
 }

 void RealtimeAnalyser::reset()
 {
     m_writeIndex = 0;
     m_inputBuffer.zero();
     m_magnitudeBuffer.zero();
 }

 void RealtimeAnalyser::setFftSize(size_t size)
 {
     ASSERT(isMainThread());

     // Only allow powers of two.
     unsigned log2size = static_cast<unsigned>(log2(size));
     bool isPOT(1UL << log2size == size);

     if (!isPOT || size > MaxFFTSize || size < MinFFTSize) {
         // FIXME: It would be good to also set an exception.
         return;
     }

     if (m_fftSize != size) {
         m_analysisFrame = adoptPtr(new FFTFrame(size));
         // m_magnitudeBuffer has size = fftSize / 2 because it contains floats reduced from complex values in m_analysisFrame.
         m_magnitudeBuffer.allocate(size / 2);
         m_fftSize = size;
     }
 }

 void RealtimeAnalyser::writeInput(AudioBus* bus, size_t framesToProcess)
 {
     bool isBusGood = bus && bus->numberOfChannels() > 0 && bus->channel(0)->length() >= framesToProcess;
     ASSERT(isBusGood);
     if (!isBusGood)
         return;

     // FIXME : allow to work with non-FFTSize divisible chunking
     bool isDestinationGood = m_writeIndex < m_inputBuffer.size() && m_writeIndex + framesToProcess <= m_inputBuffer.size();
     ASSERT(isDestinationGood);
     if (!isDestinationGood)
         return;

     // Perform real-time analysis
     // FIXME : for now just use left channel (must mix if stereo source)
     float* source = bus->channel(0)->data();

     // The source has already been sanity checked with isBusGood above.

     memcpy(m_inputBuffer.data() + m_writeIndex, source, sizeof(float) * framesToProcess);

     m_writeIndex += framesToProcess;
     if (m_writeIndex >= InputBufferSize)
         m_writeIndex = 0;
 }

 namespace {

 void applyWindow(float* p, size_t n)
 {
     ASSERT(isMainThread());

     // Blackman window
     double alpha = 0.16;
     double a0 = 0.5 * (1.0 - alpha);
     double a1 = 0.5;
     double a2 = 0.5 * alpha;

     for (unsigned i = 0; i < n; ++i) {
         double x = static_cast<double>(i) / static_cast<double>(n);
         double window = a0 - a1 * cos(2.0 * piDouble * x) + a2 * cos(4.0 * piDouble * x);
         p[i] *= float(window);
     }
 }

 } // namespace

 void RealtimeAnalyser::doFFTAnalysis()
 {
     ASSERT(isMainThread());

     // Unroll the input buffer into a temporary buffer, where we'll apply an analysis window followed by an FFT.
     size_t fftSize = this->fftSize();

     AudioFloatArray temporaryBuffer(fftSize);
     float* inputBuffer = m_inputBuffer.data();
     float* tempP = temporaryBuffer.data();

     // Take the previous fftSize values from the input buffer and copy into the temporary buffer.
     // FIXME : optimize with memcpy().
     unsigned writeIndex = m_writeIndex;
     for (unsigned i = 0; i < fftSize; ++i)
         tempP[i] = inputBuffer[(i + writeIndex - fftSize + InputBufferSize) % InputBufferSize];

     // Window the input samples.
     applyWindow(tempP, fftSize);

     // Do the analysis.
     m_analysisFrame->doFFT(tempP);

     float* realP = m_analysisFrame->realData();
     float* imagP = m_analysisFrame->imagData();

     // Blow away the packed nyquist component.
     imagP[0] = 0.0f;

     // Normalize so than an input sine wave at 0dBfs registers as 0dBfs (undo FFT scaling factor).
     const double MagnitudeScale = 1.0 / DefaultFFTSize;

     // A value of 0 does no averaging with the previous result.  Larger values produce slower, but smoother changes.
     double k = m_smoothingTimeConstant;
     k = max(0.0, k);
     k = min(1.0, k);

     // Convert the analysis data from complex to magnitude and average with the previous result.
     float* destination = magnitudeBuffer().data();
     size_t n = magnitudeBuffer().size();
     for (size_t i = 0; i < n; ++i) {
         Complex c(realP[i], imagP[i]);
         double scalarMagnitude = abs(c) * MagnitudeScale;
         destination[i] = float(k * destination[i] + (1.0 - k) * scalarMagnitude);
     }
 }

 void RealtimeAnalyser::getFloatFrequencyData(Float32Array* destinationArray)
 {
     ASSERT(isMainThread());

     if (!destinationArray)
         return;

     doFFTAnalysis();

     // Convert from linear magnitude to floating-point decibels.
     const double MinDecibels = m_minDecibels;
     unsigned sourceLength = magnitudeBuffer().size();
     size_t len = min(sourceLength, destinationArray->length());
     if (len > 0) {
         const float* source = magnitudeBuffer().data();
         float* destination = destinationArray->data();

         for (unsigned i = 0; i < len; ++i) {
             float linearValue = source[i];
             double dbMag = !linearValue ? MinDecibels : AudioUtilities::linearToDecibels(linearValue);
             destination[i] = float(dbMag);
         }
     }
 }

 void RealtimeAnalyser::getByteFrequencyData(Uint8Array* destinationArray)
 {
     ASSERT(isMainThread());

     if (!destinationArray)
         return;

     doFFTAnalysis();

     // Convert from linear magnitude to unsigned-byte decibels.
     unsigned sourceLength = magnitudeBuffer().size();
     size_t len = min(sourceLength, destinationArray->length());
     if (len > 0) {
         const double RangeScaleFactor = m_maxDecibels == m_minDecibels ? 1.0 : 1.0 / (m_maxDecibels - m_minDecibels);

         const float* source = magnitudeBuffer().data();
         unsigned char* destination = destinationArray->data();

         for (unsigned i = 0; i < len; ++i) {
             float linearValue = source[i];
             double dbMag = !linearValue ? m_minDecibels : AudioUtilities::linearToDecibels(linearValue);

             // The range m_minDecibels to m_maxDecibels will be scaled to byte values from 0 to UCHAR_MAX.
             double scaledValue = UCHAR_MAX * (dbMag - m_minDecibels) * RangeScaleFactor;

             // Clip to valid range.
             if (scaledValue < 0.0)
                 scaledValue = 0.0;
             if (scaledValue > UCHAR_MAX)
                 scaledValue = UCHAR_MAX;

             destination[i] = static_cast<unsigned char>(scaledValue);
         }
     }
 }

 void RealtimeAnalyser::getByteTimeDomainData(Uint8Array* destinationArray)
 {
     ASSERT(isMainThread());

     if (!destinationArray)
         return;

     unsigned fftSize = this->fftSize();
     size_t len = min(fftSize, destinationArray->length());
     if (len > 0) {
         bool isInputBufferGood = m_inputBuffer.size() == InputBufferSize && m_inputBuffer.size() > fftSize;
         ASSERT(isInputBufferGood);
         if (!isInputBufferGood)
             return;

         float* inputBuffer = m_inputBuffer.data();
         unsigned char* destination = destinationArray->data();

         unsigned writeIndex = m_writeIndex;

         for (unsigned i = 0; i < len; ++i) {
             // Buffer access is protected due to modulo operation.
             float value = inputBuffer[(i + writeIndex - fftSize + InputBufferSize) % InputBufferSize];

             // Scale from nominal -1.0 -> +1.0 to unsigned byte.
             double scaledValue = 128.0 * (value + 1.0);

             // Clip to valid range.
             if (scaledValue < 0.0)
                 scaledValue = 0.0;
             if (scaledValue > UCHAR_MAX)
                 scaledValue = UCHAR_MAX;

             destination[i] = static_cast<unsigned char>(scaledValue);
         }
     }
 }

 } // namespace WebCore

 #endif // ENABLE(WEB_AUDIO)
	/*
	* Copyright (C) 2010, Google Inc. All rights reserved.
	*
	* Redistribution and use in source and binary forms, with or without
	* modification, are permitted provided that the following conditions
	* are met:
	* 1. Redistributions of source code must retain the above copyright
	* notice, this list of conditions and the following disclaimer.
	* 2. Redistributions in binary form must reproduce the above copyright
	* notice, this list of conditions and the following disclaimer in the
	* documentation and/or other materials provided with the distribution.
	*
	* THIS SOFTWARE IS PROVIDED BY APPLE INC. AND ITS CONTRIBUTORS ``AS IS'' AND ANY
	* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
	* WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
	* DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR ITS CONTRIBUTORS BE LIABLE FOR ANY
	* DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
	* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
	* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
	* ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
	* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
	*/

	#include "config.h"

	#if ENABLE(WEB_AUDIO)

	#include "RealtimeAnalyser.h"

	#include "AudioBus.h"
	#include "AudioUtilities.h"
	#include "FFTFrame.h"

	#include <algorithm>
	#include <limits.h>
	#include <wtf/Complex.h>
	#include <wtf/Float32Array.h>
	#include <wtf/MainThread.h>
	#include <wtf/MathExtras.h>
	#include <wtf/Uint8Array.h>

	using namespace std;

	namespace WebCore {

	const double RealtimeAnalyser::DefaultSmoothingTimeConstant = 0.8;
	const double RealtimeAnalyser::DefaultMinDecibels = -100.0;
	const double RealtimeAnalyser::DefaultMaxDecibels = -30.0;

	const unsigned RealtimeAnalyser::DefaultFFTSize = 2048;
	// All FFT implementations are expected to handle power-of-two sizes MinFFTSize <= size <= MaxFFTSize.
	const unsigned RealtimeAnalyser::MinFFTSize = 128;
	const unsigned RealtimeAnalyser::MaxFFTSize = 2048;
	const unsigned RealtimeAnalyser::InputBufferSize = RealtimeAnalyser::MaxFFTSize * 2;

	RealtimeAnalyser::RealtimeAnalyser()
	: m_inputBuffer(InputBufferSize)
	, m_writeIndex(0)
	, m_fftSize(DefaultFFTSize)
	, m_magnitudeBuffer(DefaultFFTSize / 2)
	, m_smoothingTimeConstant(DefaultSmoothingTimeConstant)
	, m_minDecibels(DefaultMinDecibels)
	, m_maxDecibels(DefaultMaxDecibels)
	{
	m_analysisFrame = adoptPtr(new FFTFrame(DefaultFFTSize));
	}

	RealtimeAnalyser::~RealtimeAnalyser()
	{
	}

	void RealtimeAnalyser::reset()
	{
	m_writeIndex = 0;
	m_inputBuffer.zero();
	m_magnitudeBuffer.zero();
	}

	void RealtimeAnalyser::setFftSize(size_t size)
	{
	ASSERT(isMainThread());

	// Only allow powers of two.
	unsigned log2size = static_cast<unsigned>(log2(size));
	bool isPOT(1UL << log2size == size);

	if (!isPOT \|\| size > MaxFFTSize \|\| size < MinFFTSize) {
	// FIXME: It would be good to also set an exception.
	return;
	}

	if (m_fftSize != size) {
	m_analysisFrame = adoptPtr(new FFTFrame(size));
	// m_magnitudeBuffer has size = fftSize / 2 because it contains floats reduced from complex values in m_analysisFrame.
	m_magnitudeBuffer.allocate(size / 2);
	m_fftSize = size;
	}
	}

	void RealtimeAnalyser::writeInput(AudioBus* bus, size_t framesToProcess)
	{
	bool isBusGood = bus && bus->numberOfChannels() > 0 && bus->channel(0)->length() >= framesToProcess;
	ASSERT(isBusGood);
	if (!isBusGood)
	return;

	// FIXME : allow to work with non-FFTSize divisible chunking
	bool isDestinationGood = m_writeIndex < m_inputBuffer.size() && m_writeIndex + framesToProcess <= m_inputBuffer.size();
	ASSERT(isDestinationGood);
	if (!isDestinationGood)
	return;

	// Perform real-time analysis
	// FIXME : for now just use left channel (must mix if stereo source)
	float* source = bus->channel(0)->data();

	// The source has already been sanity checked with isBusGood above.

	memcpy(m_inputBuffer.data() + m_writeIndex, source, sizeof(float) * framesToProcess);

	m_writeIndex += framesToProcess;
	if (m_writeIndex >= InputBufferSize)
	m_writeIndex = 0;
	}

	namespace {

	void applyWindow(float* p, size_t n)
	{
	ASSERT(isMainThread());

	// Blackman window
	double alpha = 0.16;
	double a0 = 0.5 * (1.0 - alpha);
	double a1 = 0.5;
	double a2 = 0.5 * alpha;

	for (unsigned i = 0; i < n; ++i) {
	double x = static_cast<double>(i) / static_cast<double>(n);
	double window = a0 - a1 * cos(2.0 * piDouble * x) + a2 * cos(4.0 * piDouble * x);
	p[i] *= float(window);
	}
	}

	} // namespace

	void RealtimeAnalyser::doFFTAnalysis()
	{
	ASSERT(isMainThread());

	// Unroll the input buffer into a temporary buffer, where we'll apply an analysis window followed by an FFT.
	size_t fftSize = this->fftSize();

	AudioFloatArray temporaryBuffer(fftSize);
	float* inputBuffer = m_inputBuffer.data();
	float* tempP = temporaryBuffer.data();

	// Take the previous fftSize values from the input buffer and copy into the temporary buffer.
	// FIXME : optimize with memcpy().
	unsigned writeIndex = m_writeIndex;
	for (unsigned i = 0; i < fftSize; ++i)
	tempP[i] = inputBuffer[(i + writeIndex - fftSize + InputBufferSize) % InputBufferSize];

	// Window the input samples.
	applyWindow(tempP, fftSize);

	// Do the analysis.
	m_analysisFrame->doFFT(tempP);

	float* realP = m_analysisFrame->realData();
	float* imagP = m_analysisFrame->imagData();

	// Blow away the packed nyquist component.
	imagP[0] = 0.0f;

	// Normalize so than an input sine wave at 0dBfs registers as 0dBfs (undo FFT scaling factor).
	const double MagnitudeScale = 1.0 / DefaultFFTSize;

	// A value of 0 does no averaging with the previous result. Larger values produce slower, but smoother changes.
	double k = m_smoothingTimeConstant;
	k = max(0.0, k);
	k = min(1.0, k);

	// Convert the analysis data from complex to magnitude and average with the previous result.
	float* destination = magnitudeBuffer().data();
	size_t n = magnitudeBuffer().size();
	for (size_t i = 0; i < n; ++i) {
	Complex c(realP[i], imagP[i]);
	double scalarMagnitude = abs(c) * MagnitudeScale;
	destination[i] = float(k * destination[i] + (1.0 - k) * scalarMagnitude);
	}
	}

	void RealtimeAnalyser::getFloatFrequencyData(Float32Array* destinationArray)
	{
	ASSERT(isMainThread());

	if (!destinationArray)
	return;

	doFFTAnalysis();

	// Convert from linear magnitude to floating-point decibels.
	const double MinDecibels = m_minDecibels;
	unsigned sourceLength = magnitudeBuffer().size();
	size_t len = min(sourceLength, destinationArray->length());
	if (len > 0) {
	const float* source = magnitudeBuffer().data();
	float* destination = destinationArray->data();

	for (unsigned i = 0; i < len; ++i) {
	float linearValue = source[i];
	double dbMag = !linearValue ? MinDecibels : AudioUtilities::linearToDecibels(linearValue);
	destination[i] = float(dbMag);
	}
	}
	}

	void RealtimeAnalyser::getByteFrequencyData(Uint8Array* destinationArray)
	{
	ASSERT(isMainThread());

	if (!destinationArray)
	return;

	doFFTAnalysis();

	// Convert from linear magnitude to unsigned-byte decibels.
	unsigned sourceLength = magnitudeBuffer().size();
	size_t len = min(sourceLength, destinationArray->length());
	if (len > 0) {
	const double RangeScaleFactor = m_maxDecibels == m_minDecibels ? 1.0 : 1.0 / (m_maxDecibels - m_minDecibels);

	const float* source = magnitudeBuffer().data();
	unsigned char* destination = destinationArray->data();

	for (unsigned i = 0; i < len; ++i) {
	float linearValue = source[i];
	double dbMag = !linearValue ? m_minDecibels : AudioUtilities::linearToDecibels(linearValue);

	// The range m_minDecibels to m_maxDecibels will be scaled to byte values from 0 to UCHAR_MAX.
	double scaledValue = UCHAR_MAX * (dbMag - m_minDecibels) * RangeScaleFactor;

	// Clip to valid range.
	if (scaledValue < 0.0)
	scaledValue = 0.0;
	if (scaledValue > UCHAR_MAX)
	scaledValue = UCHAR_MAX;

	destination[i] = static_cast<unsigned char>(scaledValue);
	}
	}
	}

	void RealtimeAnalyser::getByteTimeDomainData(Uint8Array* destinationArray)
	{
	ASSERT(isMainThread());

	if (!destinationArray)
	return;

	unsigned fftSize = this->fftSize();
	size_t len = min(fftSize, destinationArray->length());
	if (len > 0) {
	bool isInputBufferGood = m_inputBuffer.size() == InputBufferSize && m_inputBuffer.size() > fftSize;
	ASSERT(isInputBufferGood);
	if (!isInputBufferGood)
	return;

	float* inputBuffer = m_inputBuffer.data();
	unsigned char* destination = destinationArray->data();

	unsigned writeIndex = m_writeIndex;

	for (unsigned i = 0; i < len; ++i) {
	// Buffer access is protected due to modulo operation.
	float value = inputBuffer[(i + writeIndex - fftSize + InputBufferSize) % InputBufferSize];

	// Scale from nominal -1.0 -> +1.0 to unsigned byte.
	double scaledValue = 128.0 * (value + 1.0);

	// Clip to valid range.
	if (scaledValue < 0.0)
	scaledValue = 0.0;
	if (scaledValue > UCHAR_MAX)
	scaledValue = UCHAR_MAX;

	destination[i] = static_cast<unsigned char>(scaledValue);
	}
	}
	}

	} // namespace WebCore

	#endif // ENABLE(WEB_AUDIO)