mirror of
https://github.com/RetroDECK/Duckstation.git
synced 2024-11-22 22:05:38 +00:00
539 lines
16 KiB
C++
539 lines
16 KiB
C++
//////////////////////////////////////////////////////////////////////////////
|
|
///
|
|
/// SoundTouch - main class for tempo/pitch/rate adjusting routines.
|
|
///
|
|
/// Notes:
|
|
/// - Initialize the SoundTouch object instance by setting up the sound stream
|
|
/// parameters with functions 'setSampleRate' and 'setChannels', then set
|
|
/// desired tempo/pitch/rate settings with the corresponding functions.
|
|
///
|
|
/// - The SoundTouch class behaves like a first-in-first-out pipeline: The
|
|
/// samples that are to be processed are fed into one of the pipe by calling
|
|
/// function 'putSamples', while the ready processed samples can be read
|
|
/// from the other end of the pipeline with function 'receiveSamples'.
|
|
///
|
|
/// - The SoundTouch processing classes require certain sized 'batches' of
|
|
/// samples in order to process the sound. For this reason the classes buffer
|
|
/// incoming samples until there are enough of samples available for
|
|
/// processing, then they carry out the processing step and consequently
|
|
/// make the processed samples available for outputting.
|
|
///
|
|
/// - For the above reason, the processing routines introduce a certain
|
|
/// 'latency' between the input and output, so that the samples input to
|
|
/// SoundTouch may not be immediately available in the output, and neither
|
|
/// the amount of outputtable samples may not immediately be in direct
|
|
/// relationship with the amount of previously input samples.
|
|
///
|
|
/// - The tempo/pitch/rate control parameters can be altered during processing.
|
|
/// Please notice though that they aren't currently protected by semaphores,
|
|
/// so in multi-thread application external semaphore protection may be
|
|
/// required.
|
|
///
|
|
/// - This class utilizes classes 'TDStretch' for tempo change (without modifying
|
|
/// pitch) and 'RateTransposer' for changing the playback rate (that is, both
|
|
/// tempo and pitch in the same ratio) of the sound. The third available control
|
|
/// 'pitch' (change pitch but maintain tempo) is produced by a combination of
|
|
/// combining the two other controls.
|
|
///
|
|
/// Author : Copyright (c) Olli Parviainen
|
|
/// Author e-mail : oparviai 'at' iki.fi
|
|
/// SoundTouch WWW: http://www.surina.net/soundtouch
|
|
///
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
//
|
|
// License :
|
|
//
|
|
// SoundTouch audio processing library
|
|
// Copyright (c) Olli Parviainen
|
|
//
|
|
// This library is free software; you can redistribute it and/or
|
|
// modify it under the terms of the GNU Lesser General Public
|
|
// License as published by the Free Software Foundation; either
|
|
// version 2.1 of the License, or (at your option) any later version.
|
|
//
|
|
// This library is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
// Lesser General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Lesser General Public
|
|
// License along with this library; if not, write to the Free Software
|
|
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
//
|
|
////////////////////////////////////////////////////////////////////////////////
|
|
|
|
#include <assert.h>
|
|
#include <stdlib.h>
|
|
#include <memory.h>
|
|
#include <math.h>
|
|
#include <stdio.h>
|
|
|
|
#include "SoundTouch.h"
|
|
#include "TDStretch.h"
|
|
#include "RateTransposer.h"
|
|
#include "cpu_detect.h"
|
|
|
|
using namespace soundtouch;
|
|
|
|
/// test if two floating point numbers are equal
|
|
#define TEST_FLOAT_EQUAL(a, b) (fabs(a - b) < 1e-10)
|
|
|
|
|
|
/// Print library version string for autoconf
|
|
extern "C" void soundtouch_ac_test()
|
|
{
|
|
printf("SoundTouch Version: %s\n",SOUNDTOUCH_VERSION);
|
|
}
|
|
|
|
|
|
SoundTouch::SoundTouch()
|
|
{
|
|
// Initialize rate transposer and tempo changer instances
|
|
|
|
pRateTransposer = new RateTransposer();
|
|
pTDStretch = TDStretch::newInstance();
|
|
|
|
setOutPipe(pTDStretch);
|
|
|
|
rate = tempo = 0;
|
|
|
|
virtualPitch =
|
|
virtualRate =
|
|
virtualTempo = 1.0;
|
|
|
|
calcEffectiveRateAndTempo();
|
|
|
|
samplesExpectedOut = 0;
|
|
samplesOutput = 0;
|
|
|
|
channels = 0;
|
|
bSrateSet = false;
|
|
}
|
|
|
|
|
|
SoundTouch::~SoundTouch()
|
|
{
|
|
delete pRateTransposer;
|
|
delete pTDStretch;
|
|
}
|
|
|
|
|
|
/// Get SoundTouch library version string
|
|
const char *SoundTouch::getVersionString()
|
|
{
|
|
static const char *_version = SOUNDTOUCH_VERSION;
|
|
|
|
return _version;
|
|
}
|
|
|
|
|
|
/// Get SoundTouch library version Id
|
|
uint SoundTouch::getVersionId()
|
|
{
|
|
return SOUNDTOUCH_VERSION_ID;
|
|
}
|
|
|
|
|
|
// Sets the number of channels, 1 = mono, 2 = stereo
|
|
void SoundTouch::setChannels(uint numChannels)
|
|
{
|
|
if (!verifyNumberOfChannels(numChannels)) return;
|
|
|
|
channels = numChannels;
|
|
pRateTransposer->setChannels((int)numChannels);
|
|
pTDStretch->setChannels((int)numChannels);
|
|
}
|
|
|
|
|
|
// Sets new rate control value. Normal rate = 1.0, smaller values
|
|
// represent slower rate, larger faster rates.
|
|
void SoundTouch::setRate(double newRate)
|
|
{
|
|
virtualRate = newRate;
|
|
calcEffectiveRateAndTempo();
|
|
}
|
|
|
|
|
|
// Sets new rate control value as a difference in percents compared
|
|
// to the original rate (-50 .. +100 %)
|
|
void SoundTouch::setRateChange(double newRate)
|
|
{
|
|
virtualRate = 1.0 + 0.01 * newRate;
|
|
calcEffectiveRateAndTempo();
|
|
}
|
|
|
|
|
|
// Sets new tempo control value. Normal tempo = 1.0, smaller values
|
|
// represent slower tempo, larger faster tempo.
|
|
void SoundTouch::setTempo(double newTempo)
|
|
{
|
|
virtualTempo = newTempo;
|
|
calcEffectiveRateAndTempo();
|
|
}
|
|
|
|
|
|
// Sets new tempo control value as a difference in percents compared
|
|
// to the original tempo (-50 .. +100 %)
|
|
void SoundTouch::setTempoChange(double newTempo)
|
|
{
|
|
virtualTempo = 1.0 + 0.01 * newTempo;
|
|
calcEffectiveRateAndTempo();
|
|
}
|
|
|
|
|
|
// Sets new pitch control value. Original pitch = 1.0, smaller values
|
|
// represent lower pitches, larger values higher pitch.
|
|
void SoundTouch::setPitch(double newPitch)
|
|
{
|
|
virtualPitch = newPitch;
|
|
calcEffectiveRateAndTempo();
|
|
}
|
|
|
|
|
|
// Sets pitch change in octaves compared to the original pitch
|
|
// (-1.00 .. +1.00)
|
|
void SoundTouch::setPitchOctaves(double newPitch)
|
|
{
|
|
virtualPitch = exp(0.69314718056 * newPitch);
|
|
calcEffectiveRateAndTempo();
|
|
}
|
|
|
|
|
|
// Sets pitch change in semi-tones compared to the original pitch
|
|
// (-12 .. +12)
|
|
void SoundTouch::setPitchSemiTones(int newPitch)
|
|
{
|
|
setPitchOctaves((double)newPitch / 12.0);
|
|
}
|
|
|
|
|
|
void SoundTouch::setPitchSemiTones(double newPitch)
|
|
{
|
|
setPitchOctaves(newPitch / 12.0);
|
|
}
|
|
|
|
|
|
// Calculates 'effective' rate and tempo values from the
|
|
// nominal control values.
|
|
void SoundTouch::calcEffectiveRateAndTempo()
|
|
{
|
|
double oldTempo = tempo;
|
|
double oldRate = rate;
|
|
|
|
tempo = virtualTempo / virtualPitch;
|
|
rate = virtualPitch * virtualRate;
|
|
|
|
if (!TEST_FLOAT_EQUAL(rate,oldRate)) pRateTransposer->setRate(rate);
|
|
if (!TEST_FLOAT_EQUAL(tempo, oldTempo)) pTDStretch->setTempo(tempo);
|
|
|
|
#ifndef SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER
|
|
if (rate <= 1.0f)
|
|
{
|
|
if (output != pTDStretch)
|
|
{
|
|
FIFOSamplePipe *tempoOut;
|
|
|
|
assert(output == pRateTransposer);
|
|
// move samples in the current output buffer to the output of pTDStretch
|
|
tempoOut = pTDStretch->getOutput();
|
|
tempoOut->moveSamples(*output);
|
|
// move samples in pitch transposer's store buffer to tempo changer's input
|
|
// deprecated : pTDStretch->moveSamples(*pRateTransposer->getStore());
|
|
|
|
output = pTDStretch;
|
|
}
|
|
}
|
|
else
|
|
#endif
|
|
{
|
|
if (output != pRateTransposer)
|
|
{
|
|
FIFOSamplePipe *transOut;
|
|
|
|
assert(output == pTDStretch);
|
|
// move samples in the current output buffer to the output of pRateTransposer
|
|
transOut = pRateTransposer->getOutput();
|
|
transOut->moveSamples(*output);
|
|
// move samples in tempo changer's input to pitch transposer's input
|
|
pRateTransposer->moveSamples(*pTDStretch->getInput());
|
|
|
|
output = pRateTransposer;
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
// Sets sample rate.
|
|
void SoundTouch::setSampleRate(uint srate)
|
|
{
|
|
// set sample rate, leave other tempo changer parameters as they are.
|
|
pTDStretch->setParameters((int)srate);
|
|
bSrateSet = true;
|
|
}
|
|
|
|
|
|
// Adds 'numSamples' pcs of samples from the 'samples' memory position into
|
|
// the input of the object.
|
|
void SoundTouch::putSamples(const SAMPLETYPE *samples, uint nSamples)
|
|
{
|
|
if (bSrateSet == false)
|
|
{
|
|
ST_THROW_RT_ERROR("SoundTouch : Sample rate not defined");
|
|
}
|
|
else if (channels == 0)
|
|
{
|
|
ST_THROW_RT_ERROR("SoundTouch : Number of channels not defined");
|
|
}
|
|
|
|
// accumulate how many samples are expected out from processing, given the current
|
|
// processing setting
|
|
samplesExpectedOut += (double)nSamples / ((double)rate * (double)tempo);
|
|
|
|
#ifndef SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER
|
|
if (rate <= 1.0f)
|
|
{
|
|
// transpose the rate down, output the transposed sound to tempo changer buffer
|
|
assert(output == pTDStretch);
|
|
pRateTransposer->putSamples(samples, nSamples);
|
|
pTDStretch->moveSamples(*pRateTransposer);
|
|
}
|
|
else
|
|
#endif
|
|
{
|
|
// evaluate the tempo changer, then transpose the rate up,
|
|
assert(output == pRateTransposer);
|
|
pTDStretch->putSamples(samples, nSamples);
|
|
pRateTransposer->moveSamples(*pTDStretch);
|
|
}
|
|
}
|
|
|
|
|
|
// Flushes the last samples from the processing pipeline to the output.
|
|
// Clears also the internal processing buffers.
|
|
//
|
|
// Note: This function is meant for extracting the last samples of a sound
|
|
// stream. This function may introduce additional blank samples in the end
|
|
// of the sound stream, and thus it's not recommended to call this function
|
|
// in the middle of a sound stream.
|
|
void SoundTouch::flush()
|
|
{
|
|
int i;
|
|
int numStillExpected;
|
|
SAMPLETYPE *buff = new SAMPLETYPE[128 * channels];
|
|
|
|
// how many samples are still expected to output
|
|
numStillExpected = (int)((long)(samplesExpectedOut + 0.5) - samplesOutput);
|
|
if (numStillExpected < 0) numStillExpected = 0;
|
|
|
|
memset(buff, 0, 128 * channels * sizeof(SAMPLETYPE));
|
|
// "Push" the last active samples out from the processing pipeline by
|
|
// feeding blank samples into the processing pipeline until new,
|
|
// processed samples appear in the output (not however, more than
|
|
// 24ksamples in any case)
|
|
for (i = 0; (numStillExpected > (int)numSamples()) && (i < 200); i ++)
|
|
{
|
|
putSamples(buff, 128);
|
|
}
|
|
|
|
adjustAmountOfSamples(numStillExpected);
|
|
|
|
delete[] buff;
|
|
|
|
// Clear input buffers
|
|
pTDStretch->clearInput();
|
|
// yet leave the output intouched as that's where the
|
|
// flushed samples are!
|
|
}
|
|
|
|
|
|
// Changes a setting controlling the processing system behaviour. See the
|
|
// 'SETTING_...' defines for available setting ID's.
|
|
bool SoundTouch::setSetting(int settingId, int value)
|
|
{
|
|
int sampleRate, sequenceMs, seekWindowMs, overlapMs;
|
|
|
|
// read current tdstretch routine parameters
|
|
pTDStretch->getParameters(&sampleRate, &sequenceMs, &seekWindowMs, &overlapMs);
|
|
|
|
switch (settingId)
|
|
{
|
|
case SETTING_USE_AA_FILTER :
|
|
// enables / disabless anti-alias filter
|
|
pRateTransposer->enableAAFilter((value != 0) ? true : false);
|
|
return true;
|
|
|
|
case SETTING_AA_FILTER_LENGTH :
|
|
// sets anti-alias filter length
|
|
pRateTransposer->getAAFilter()->setLength(value);
|
|
return true;
|
|
|
|
case SETTING_USE_QUICKSEEK :
|
|
// enables / disables tempo routine quick seeking algorithm
|
|
pTDStretch->enableQuickSeek((value != 0) ? true : false);
|
|
return true;
|
|
|
|
case SETTING_SEQUENCE_MS:
|
|
// change time-stretch sequence duration parameter
|
|
pTDStretch->setParameters(sampleRate, value, seekWindowMs, overlapMs);
|
|
return true;
|
|
|
|
case SETTING_SEEKWINDOW_MS:
|
|
// change time-stretch seek window length parameter
|
|
pTDStretch->setParameters(sampleRate, sequenceMs, value, overlapMs);
|
|
return true;
|
|
|
|
case SETTING_OVERLAP_MS:
|
|
// change time-stretch overlap length parameter
|
|
pTDStretch->setParameters(sampleRate, sequenceMs, seekWindowMs, value);
|
|
return true;
|
|
|
|
default :
|
|
return false;
|
|
}
|
|
}
|
|
|
|
|
|
// Reads a setting controlling the processing system behaviour. See the
|
|
// 'SETTING_...' defines for available setting ID's.
|
|
//
|
|
// Returns the setting value.
|
|
int SoundTouch::getSetting(int settingId) const
|
|
{
|
|
int temp;
|
|
|
|
switch (settingId)
|
|
{
|
|
case SETTING_USE_AA_FILTER :
|
|
return (uint)pRateTransposer->isAAFilterEnabled();
|
|
|
|
case SETTING_AA_FILTER_LENGTH :
|
|
return pRateTransposer->getAAFilter()->getLength();
|
|
|
|
case SETTING_USE_QUICKSEEK :
|
|
return (uint)pTDStretch->isQuickSeekEnabled();
|
|
|
|
case SETTING_SEQUENCE_MS:
|
|
pTDStretch->getParameters(NULL, &temp, NULL, NULL);
|
|
return temp;
|
|
|
|
case SETTING_SEEKWINDOW_MS:
|
|
pTDStretch->getParameters(NULL, NULL, &temp, NULL);
|
|
return temp;
|
|
|
|
case SETTING_OVERLAP_MS:
|
|
pTDStretch->getParameters(NULL, NULL, NULL, &temp);
|
|
return temp;
|
|
|
|
case SETTING_NOMINAL_INPUT_SEQUENCE :
|
|
{
|
|
int size = pTDStretch->getInputSampleReq();
|
|
|
|
#ifndef SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER
|
|
if (rate <= 1.0)
|
|
{
|
|
// transposing done before timestretch, which impacts latency
|
|
return (int)(size * rate + 0.5);
|
|
}
|
|
#endif
|
|
return size;
|
|
}
|
|
|
|
case SETTING_NOMINAL_OUTPUT_SEQUENCE :
|
|
{
|
|
int size = pTDStretch->getOutputBatchSize();
|
|
|
|
if (rate > 1.0)
|
|
{
|
|
// transposing done after timestretch, which impacts latency
|
|
return (int)(size / rate + 0.5);
|
|
}
|
|
return size;
|
|
}
|
|
|
|
case SETTING_INITIAL_LATENCY:
|
|
{
|
|
double latency = pTDStretch->getLatency();
|
|
int latency_tr = pRateTransposer->getLatency();
|
|
|
|
#ifndef SOUNDTOUCH_PREVENT_CLICK_AT_RATE_CROSSOVER
|
|
if (rate <= 1.0)
|
|
{
|
|
// transposing done before timestretch, which impacts latency
|
|
latency = (latency + latency_tr) * rate;
|
|
}
|
|
else
|
|
#endif
|
|
{
|
|
latency += (double)latency_tr / rate;
|
|
}
|
|
|
|
return (int)(latency + 0.5);
|
|
}
|
|
|
|
default :
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
|
|
// Clears all the samples in the object's output and internal processing
|
|
// buffers.
|
|
void SoundTouch::clear()
|
|
{
|
|
samplesExpectedOut = 0;
|
|
samplesOutput = 0;
|
|
pRateTransposer->clear();
|
|
pTDStretch->clear();
|
|
}
|
|
|
|
|
|
/// Returns number of samples currently unprocessed.
|
|
uint SoundTouch::numUnprocessedSamples() const
|
|
{
|
|
FIFOSamplePipe * psp;
|
|
if (pTDStretch)
|
|
{
|
|
psp = pTDStretch->getInput();
|
|
if (psp)
|
|
{
|
|
return psp->numSamples();
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
|
|
/// Output samples from beginning of the sample buffer. Copies requested samples to
|
|
/// output buffer and removes them from the sample buffer. If there are less than
|
|
/// 'numsample' samples in the buffer, returns all that available.
|
|
///
|
|
/// \return Number of samples returned.
|
|
uint SoundTouch::receiveSamples(SAMPLETYPE *output, uint maxSamples)
|
|
{
|
|
uint ret = FIFOProcessor::receiveSamples(output, maxSamples);
|
|
samplesOutput += (long)ret;
|
|
return ret;
|
|
}
|
|
|
|
|
|
/// Adjusts book-keeping so that given number of samples are removed from beginning of the
|
|
/// sample buffer without copying them anywhere.
|
|
///
|
|
/// Used to reduce the number of samples in the buffer when accessing the sample buffer directly
|
|
/// with 'ptrBegin' function.
|
|
uint SoundTouch::receiveSamples(uint maxSamples)
|
|
{
|
|
uint ret = FIFOProcessor::receiveSamples(maxSamples);
|
|
samplesOutput += (long)ret;
|
|
return ret;
|
|
}
|
|
|
|
|
|
/// Get ratio between input and output audio durations, useful for calculating
|
|
/// processed output duration: if you'll process a stream of N samples, then
|
|
/// you can expect to get out N * getInputOutputSampleRatio() samples.
|
|
double SoundTouch::getInputOutputSampleRatio()
|
|
{
|
|
return 1.0 / (tempo * rate);
|
|
}
|