mirror of
				https://github.com/RetroDECK/Duckstation.git
				synced 2025-04-10 19:15:14 +00:00 
			
		
		
		
	
		
			
	
	
		
			206 lines
		
	
	
		
			7.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			206 lines
		
	
	
		
			7.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
|   | ////////////////////////////////////////////////////////////////////////////////
 | ||
|  | ///
 | ||
|  | /// Beats-per-minute (BPM) detection routine.
 | ||
|  | ///
 | ||
|  | /// The beat detection algorithm works as follows:
 | ||
|  | /// - Use function 'inputSamples' to input chunks of samples to the class for
 | ||
|  | ///   analysis. It's a good idea to enter a large sound file or stream in smallish
 | ||
|  | ///   chunks of around a few kilosamples in order not to exhaust too much RAM.
 | ||
|  | /// - Input sound data is decimated to approx 500 Hz to reduce calculation burden,
 | ||
|  | ///   which is basically ok as low (bass) frequencies mostly determine the beat rate.
 | ||
|  | ///   Simple averaging is used for anti-alias filtering because the resulting signal
 | ||
|  | ///   quality isn't of that high importance.
 | ||
|  | /// - Decimated sound data is enveloped, i.e. the amplitude shape is detected by
 | ||
|  | ///   taking absolute value that's smoothed by sliding average. Signal levels that
 | ||
|  | ///   are below a couple of times the general RMS amplitude level are cut away to
 | ||
|  | ///   leave only notable peaks there.
 | ||
|  | /// - Repeating sound patterns (e.g. beats) are detected by calculating short-term 
 | ||
|  | ///   autocorrelation function of the enveloped signal.
 | ||
|  | /// - After whole sound data file has been analyzed as above, the bpm level is 
 | ||
|  | ///   detected by function 'getBpm' that finds the highest peak of the autocorrelation 
 | ||
|  | ///   function, calculates its precise location and converts this reading to BPM.
 | ||
|  | ///
 | ||
|  | /// Author        : Copyright (c) Olli Parviainen
 | ||
|  | /// Author e-mail : oparviai 'at' iki.fi
 | ||
|  | /// SoundTouch WWW: http://www.surina.net/soundtouch
 | ||
|  | ///
 | ||
|  | ////////////////////////////////////////////////////////////////////////////////
 | ||
|  | //
 | ||
|  | // License :
 | ||
|  | //
 | ||
|  | //  SoundTouch audio processing library
 | ||
|  | //  Copyright (c) Olli Parviainen
 | ||
|  | //
 | ||
|  | //  This library is free software; you can redistribute it and/or
 | ||
|  | //  modify it under the terms of the GNU Lesser General Public
 | ||
|  | //  License as published by the Free Software Foundation; either
 | ||
|  | //  version 2.1 of the License, or (at your option) any later version.
 | ||
|  | //
 | ||
|  | //  This library is distributed in the hope that it will be useful,
 | ||
|  | //  but WITHOUT ANY WARRANTY; without even the implied warranty of
 | ||
|  | //  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 | ||
|  | //  Lesser General Public License for more details.
 | ||
|  | //
 | ||
|  | //  You should have received a copy of the GNU Lesser General Public
 | ||
|  | //  License along with this library; if not, write to the Free Software
 | ||
|  | //  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
 | ||
|  | //
 | ||
|  | ////////////////////////////////////////////////////////////////////////////////
 | ||
|  | 
 | ||
|  | #ifndef _BPMDetect_H_
 | ||
|  | #define _BPMDetect_H_
 | ||
|  | 
 | ||
|  | #include <vector>
 | ||
|  | #include "STTypes.h"
 | ||
|  | #include "FIFOSampleBuffer.h"
 | ||
|  | 
 | ||
|  | namespace soundtouch | ||
|  | { | ||
|  | 
 | ||
|  |     /// Minimum allowed BPM rate. Used to restrict the accepted result above a reasonable limit.
 | ||
|  |     #define MIN_BPM 45
 | ||
|  | 
 | ||
|  |     /// Maximum allowed BPM rate range. Used for calculating algorithm parameters.
 | ||
|  |     #define MAX_BPM_RANGE 200
 | ||
|  | 
 | ||
|  |     /// Maximum valid BPM rate. Used to restrict the accepted result below a reasonable limit.
 | ||
|  |     #define MAX_BPM_VALID 190
 | ||
|  | 
 | ||
|  | ////////////////////////////////////////////////////////////////////////////////
 | ||
|  | 
 | ||
|  |     typedef struct | ||
|  |     { | ||
             /// One detected beat; BPMDetect stores these in its 'beats' vector.
             /// Beat position (reported through the "pos" array of BPMDetect::getBeats).
             /// NOTE(review): the unit of the position is not stated in this header -- confirm.
|  |         float pos; | ||
             /// Beat detection strength (reported through the "strength" array of BPMDetect::getBeats).
|  |         float strength; | ||
|  |     } BEAT; | ||
|  | 
 | ||
|  | 
 | ||
|  |     class IIR2_filter | ||
|  |     { | ||
             // Filter helper class; BPMDetect holds one instance ('beat_lpf') as its
             // 2nd order low-pass filter.
             // Storage for five filter coefficients.
|  |         double coeffs[5]; | ||
             // Storage for five state values.
             // NOTE(review): presumably previous input/output samples -- confirm in the implementation.
|  |         double prev[5]; | ||
|  | 
 | ||
|  |     public: | ||
             /// Constructs the filter from the coefficient array 'lpf_coeffs'.
             /// NOTE(review): presumably must point to 5 values, matching 'coeffs' -- confirm.
|  |         IIR2_filter(const double *lpf_coeffs); | ||
             /// Feeds the input sample 'x' to the filter.
             /// NOTE(review): presumably returns the filtered output sample -- confirm.
|  |         float update(float x); | ||
|  |     }; | ||
|  | 
 | ||
|  | 
 | ||
|  |     /// Class for calculating the BPM (beats-per-minute) rate of audio data: feed the samples with 'inputSamples', then read the result with 'getBpm'.
 | ||
|  |     class BPMDetect | ||
|  |     { | ||
         // NOTE(review): this class holds several raw pointers and declares a destructor but
         // no copy operations. If the destructor releases these buffers, copying an instance
         // would be unsafe -- confirm in the implementation.
|  |     protected: | ||
|  |         /// Auto-correlation accumulator bins.
 | ||
|  |         float *xcorr; | ||
|  | 
 | ||
|  |         /// Sample average counter.
 | ||
|  |         int decimateCount; | ||
|  | 
 | ||
|  |         /// Sample average accumulator for FIFO-like decimation.
 | ||
|  |         soundtouch::LONG_SAMPLETYPE decimateSum; | ||
|  | 
 | ||
|  |         /// Decimate sound by this coefficient to reach approx. 500 Hz.
 | ||
|  |         int decimateBy; | ||
|  | 
 | ||
|  |         /// Auto-correlation window length.
 | ||
|  |         int windowLen; | ||
|  | 
 | ||
|  |         /// Number of channels (1 = mono, 2 = stereo).
 | ||
|  |         int channels; | ||
|  | 
 | ||
|  |         /// Sample rate in Hz.
 | ||
|  |         int sampleRate; | ||
|  | 
 | ||
|  |         /// Beginning of the auto-correlation window: the autocorrelation isn't updated
 | ||
|  |         /// for this many of the first correlation bins.
 | ||
|  |         int windowStart; | ||
|  | 
 | ||
|  |         /// Window functions for data preconditioning.
 | ||
|  |         float *hamw; | ||
|  |         float *hamw2; | ||
|  | 
 | ||
|  |         // Beat detection variables.
 | ||
|  |         int pos; | ||
|  |         int peakPos; | ||
|  |         int beatcorr_ringbuffpos; | ||
|  |         int init_scaler; | ||
|  |         float peakVal; | ||
|  |         float *beatcorr_ringbuff; | ||
|  | 
 | ||
|  |         /// FIFO-buffer for decimated processing samples.
 | ||
|  |         soundtouch::FIFOSampleBuffer *buffer; | ||
|  | 
 | ||
|  |         /// Collection of detected beats (position and strength pairs).
 | ||
|  |         //BeatCollection beats;
 | ||
|  |         std::vector<BEAT> beats; | ||
|  | 
 | ||
|  |         // 2nd order low-pass filter.
 | ||
|  |         IIR2_filter beat_lpf; | ||
|  | 
 | ||
|  |         /// Updates the auto-correlation function for the given number of decimated samples
 | ||
|  |         /// that are read from the internal 'buffer' pipe (the samples aren't removed from
 | ||
|  |         /// the pipe though).
 | ||
|  |         void updateXCorr(int process_samples      ///< How many samples are processed.
 | ||
|  |         ); | ||
|  | 
 | ||
|  |         /// Decimates samples to approx. 500 Hz.
 | ||
|  |         ///
 | ||
|  |         /// \return Number of output samples.
 | ||
|  |         int decimate(soundtouch::SAMPLETYPE *dest,      ///< Destination buffer.
 | ||
|  |             const soundtouch::SAMPLETYPE *src, ///< Source sample buffer.
 | ||
|  |             int numsamples                     ///< Number of source samples.
 | ||
|  |         ); | ||
|  | 
 | ||
|  |         /// Calculates the amplitude envelope for the buffer of samples.
 | ||
|  |         /// The result is written back to 'samples'.
 | ||
|  |         void calcEnvelope(soundtouch::SAMPLETYPE *samples,  ///< Pointer to input/output data buffer.
 | ||
|  |             int numsamples                    ///< Number of samples in buffer.
 | ||
|  |         ); | ||
|  | 
 | ||
|  |         /// Removes constant bias from the xcorr data.
 | ||
|  |         void removeBias(); | ||
|  | 
 | ||
|  |         /// Detects individual beat positions.
 | ||
|  |         void updateBeatPos(int process_samples); | ||
|  | 
 | ||
|  | 
 | ||
|  |     public: | ||
|  |         /// Constructor.
 | ||
|  |         BPMDetect(int numChannels,  ///< Number of channels in sample data.
 | ||
|  |             int sampleRate    ///< Sample rate in Hz.
 | ||
|  |         ); | ||
|  | 
 | ||
|  |         /// Destructor.
 | ||
|  |         virtual ~BPMDetect(); | ||
|  | 
 | ||
|  |         /// Inputs a block of samples for analyzing: envelopes the samples and then
 | ||
|  |         /// updates the autocorrelation estimation. When the whole song data has been input
 | ||
|  |         /// in smaller blocks using this function, read the resulting bpm with the 'getBpm'
 | ||
|  |         /// function.
 | ||
|  |         ///
 | ||
|  |         /// NOTE(review): 'samples' is const-qualified here, so the older remark that data in the 'samples' array can be disrupted in processing looks stale -- confirm against the implementation.
 | ||
|  |         void inputSamples(const soundtouch::SAMPLETYPE *samples,    ///< Pointer to input/working data buffer
 | ||
|  |             int numSamples                            ///< Number of samples in buffer
 | ||
|  |         ); | ||
|  | 
 | ||
|  |         /// Analyzes the results and returns the BPM rate. Use this function to read the result
 | ||
|  |         /// after the whole song data has been input to the class by consecutive calls of
 | ||
|  |         /// the 'inputSamples' function.
 | ||
|  |         ///
 | ||
|  |         /// \return Beats-per-minute rate, or zero if detection failed.
 | ||
|  |         float getBpm(); | ||
|  | 
 | ||
|  |         /// Get beat position arrays. Note: the arrays also include really low beat detection
 | ||
|  |         /// values in the absence of clear strong beats. The consumer may wish to filter low values away.
 | ||
|  |         /// - "pos" receives the array of beat positions
 | ||
|  |         /// - "strength" receives the array of beat detection strengths
 | ||
|  |         /// - "max_num" indicates the max. size of the "pos" and "strength" arrays.
 | ||
|  |         ///
 | ||
|  |         /// You can query a suitable array size by calling this with NULL in "pos" & "strength".
 | ||
|  |         ///
 | ||
|  |         /// \return number of beats in the arrays.
 | ||
|  |         int getBeats(float *pos, float *strength, int max_num); | ||
|  |     }; | ||
|  | } | ||
|  | #endif // _BPMDetect_H_
 |