Thu, 22 Jan 2015 13:21:57 +0100
Incorporate requested changes from Mozilla in review:
https://bugzilla.mozilla.org/show_bug.cgi?id=1123480#c6
1 ////////////////////////////////////////////////////////////////////////////////
2 ///
3 /// Sampled sound tempo changer/time stretch algorithm. Changes the sound tempo
4 /// while maintaining the original pitch by using a time domain WSOLA-like method
5 /// with several performance-increasing tweaks.
6 ///
7 /// Note : MMX/SSE optimized functions reside in separate, platform-specific files
8 /// 'mmx_optimized.cpp' and 'sse_optimized.cpp'
9 ///
10 /// Author : Copyright (c) Olli Parviainen
11 /// Author e-mail : oparviai 'at' iki.fi
12 /// SoundTouch WWW: http://www.surina.net/soundtouch
13 ///
14 ////////////////////////////////////////////////////////////////////////////////
15 //
16 // Last changed : $Date: 2014-04-06 10:57:21 -0500 (Sun, 06 Apr 2014) $
17 // File revision : $Revision: 4 $
18 //
19 // $Id: TDStretch.h 195 2014-04-06 15:57:21Z oparviai $
20 //
21 ////////////////////////////////////////////////////////////////////////////////
22 //
23 // License :
24 //
25 // SoundTouch audio processing library
26 // Copyright (c) Olli Parviainen
27 //
28 // This library is free software; you can redistribute it and/or
29 // modify it under the terms of the GNU Lesser General Public
30 // License as published by the Free Software Foundation; either
31 // version 2.1 of the License, or (at your option) any later version.
32 //
33 // This library is distributed in the hope that it will be useful,
34 // but WITHOUT ANY WARRANTY; without even the implied warranty of
35 // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
36 // Lesser General Public License for more details.
37 //
38 // You should have received a copy of the GNU Lesser General Public
39 // License along with this library; if not, write to the Free Software
40 // Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
41 //
42 ////////////////////////////////////////////////////////////////////////////////
44 #ifndef TDStretch_H
45 #define TDStretch_H
47 #include <stddef.h>
48 #include "STTypes.h"
49 #include "RateTransposer.h"
50 #include "FIFOSamplePipe.h"
52 namespace soundtouch
53 {
55 /// Default values for sound processing parameters:
56 /// Notice that the default parameters are tuned for contemporary popular music
57 /// processing. For speech processing applications these parameters are a better fit:
58 /// #define DEFAULT_SEQUENCE_MS 40
59 /// #define DEFAULT_SEEKWINDOW_MS 15
60 /// #define DEFAULT_OVERLAP_MS 8
61 ///
63 /// Default length of a single processing sequence, in milliseconds. This determines how
64 /// long the sequences are into which the original sound is chopped by the time-stretch algorithm.
65 ///
66 /// The larger this value is, the fewer sequences are used in processing. In principle
67 /// a bigger value sounds better when slowing down tempo, but worse when increasing tempo
68 /// and vice versa.
69 ///
70 /// Increasing this value reduces computational burden & vice versa.
71 //#define DEFAULT_SEQUENCE_MS 40
72 #define DEFAULT_SEQUENCE_MS USE_AUTO_SEQUENCE_LEN
74 /// Passing this value as the sequence length selects an automatic parameter value
75 /// according to tempo setting (recommended). DEFAULT_SEQUENCE_MS above expands to this macro; macros are expanded at the point of use, so defining it afterwards is fine.
76 #define USE_AUTO_SEQUENCE_LEN 0
78 /// Seeking window default length in milliseconds for the algorithm that finds the best possible
79 /// overlapping location. This determines how wide a window the algorithm may search for an
80 /// optimal joining location when mixing the sound sequences back together.
81 ///
82 /// The bigger this window setting is, the higher the possibility of finding a better mixing
83 /// position becomes, but at the same time large values may cause a "drifting" artifact
84 /// because consecutive sequences will be taken at more uneven intervals.
85 ///
86 /// If there's a disturbing artifact that sounds as if a constant frequency was drifting
87 /// around, try reducing this setting.
88 ///
89 /// Increasing this value increases computational burden & vice versa.
90 //#define DEFAULT_SEEKWINDOW_MS 15
91 #define DEFAULT_SEEKWINDOW_MS USE_AUTO_SEEKWINDOW_LEN
93 /// Passing this value as the seek window length selects an automatic parameter value
94 /// according to tempo setting (recommended). DEFAULT_SEEKWINDOW_MS above expands to this macro; macros are expanded at the point of use, so defining it afterwards is fine.
95 #define USE_AUTO_SEEKWINDOW_LEN 0
97 /// Overlap length in milliseconds. When the chopped sound sequences are mixed back together
98 /// to form a continuous sound stream, this parameter defines for how long a period the two
99 /// consecutive sequences are allowed to overlap each other.
100 ///
101 /// This shouldn't be a very critical parameter. If you reduce the DEFAULT_SEQUENCE_MS setting
102 /// by a large amount, you might wish to try a smaller value for this.
103 ///
104 /// Increasing this value increases computational burden & vice versa.
105 #define DEFAULT_OVERLAP_MS 8
108 /// Class that performs the time-stretch (tempo change) effect on the processed
109 /// sound. Derives from FIFOProcessor; samples are fed in with putSamples() and the internal buffers are exposed through getInput()/getOutput().
110 class TDStretch : public FIFOProcessor
111 {
112 protected:
113 int channels; ///< Channel count; presumably the value passed to setChannels() -- TODO confirm
114 int sampleReq;
115 float tempo; ///< Presumably the value passed to setTempo() -- TODO confirm
117 SAMPLETYPE *pMidBuffer;
118 SAMPLETYPE *pMidBufferUnaligned; ///< NOTE(review): the name suggests pMidBuffer is an aligned pointer into this allocation -- confirm
119 int overlapLength; ///< Subtracted from seekWindowLength in getOutputBatchSize()
120 int seekLength;
121 int seekWindowLength; ///< getOutputBatchSize() returns this minus overlapLength
122 int overlapDividerBits;
123 int slopingDivider;
124 float nominalSkip; ///< Rounded to int by getInputSampleReq()
125 float skipFract;
126 FIFOSampleBuffer outputBuffer; ///< Buffer whose address getOutput() returns
127 FIFOSampleBuffer inputBuffer; ///< Buffer whose address getInput() returns
128 bool bQuickSeek; ///< Presumably the flag behind enableQuickSeek()/isQuickSeekEnabled() -- TODO confirm
130 int sampleRate; ///< This and the next three members presumably mirror the setParameters()/getParameters() values -- TODO confirm
131 int sequenceMs;
132 int seekWindowMs;
133 int overlapMs;
134 bool bAutoSeqSetting;
135 bool bAutoSeekSetting;
137 void acceptNewOverlapLength(int newOverlapLength);
139 virtual void clearCrossCorrState();
140 void calculateOverlapLength(int overlapMs);
142 virtual double calcCrossCorr(const SAMPLETYPE *mixingPos, const SAMPLETYPE *compare, double &norm) const;
143 virtual double calcCrossCorrAccumulate(const SAMPLETYPE *mixingPos, const SAMPLETYPE *compare, double &norm) const;
145 virtual int seekBestOverlapPositionFull(const SAMPLETYPE *refPos);
146 virtual int seekBestOverlapPositionQuick(const SAMPLETYPE *refPos);
147 int seekBestOverlapPosition(const SAMPLETYPE *refPos);
149 virtual void overlapStereo(SAMPLETYPE *output, const SAMPLETYPE *input) const;
150 virtual void overlapMono(SAMPLETYPE *output, const SAMPLETYPE *input) const;
151 virtual void overlapMulti(SAMPLETYPE *output, const SAMPLETYPE *input) const;
153 void clearMidBuffer();
154 void overlap(SAMPLETYPE *output, const SAMPLETYPE *input, uint ovlPos) const;
156 void calcSeqParameters();
158 /// Changes the tempo of the given sound samples.
159 /// Declared void, so nothing is returned to the caller. NOTE(review): the earlier comment
160 /// described a returned sample count and a 'set_returnBuffer_size' function; neither appears
161 /// in this declaration. Presumably results are written to outputBuffer -- confirm in the implementation.
162 void processSamples();
164 public:
165 TDStretch();
166 virtual ~TDStretch();
168 /// Class-specific operator 'new'. The original note says it automatically creates a suitable instance
169 /// depending on if we've a MMX/SSE/etc-capable CPU available or not. NOTE(review): newInstance() is documented as the function to use instead of 'new' -- confirm what this operator really does.
170 static void *operator new(size_t s);
172 /// Use this function instead of "new" operator to create a new instance of this class.
173 /// This function automatically chooses a correct feature set depending on if the CPU
174 /// supports MMX/SSE/etc extensions.
175 static TDStretch *newInstance();
177 /// Returns a pointer to the output buffer object (the outputBuffer member).
178 FIFOSamplePipe *getOutput() { return &outputBuffer; };
180 /// Returns a pointer to the input buffer object (the inputBuffer member).
181 FIFOSamplePipe *getInput() { return &inputBuffer; };
183 /// Sets new target tempo. Smaller values represent slower tempo, larger values faster tempo.
184 /// NOTE(review): the earlier text named 'SCALE' as normal tempo, but no such symbol is defined in this header; presumably 1.0 is normal -- confirm.
185 void setTempo(float newTempo);
187 /// Clears the object; returns nothing. NOTE(review): the earlier comment ("returns nonzero if there aren't any samples") did not match this void function; presumably this clears the sample buffers -- confirm.
188 virtual void clear();
190 /// Clears the input buffer
191 void clearInput();
193 /// Sets the number of channels, 1 = mono, 2 = stereo
194 void setChannels(int numChannels);
196 /// Enables/disables the quick position seeking algorithm. Pass false to disable,
197 /// true to enable.
198 void enableQuickSeek(bool enable);
200 /// Returns true if the quick seeking algorithm is enabled.
201 bool isQuickSeekEnabled() const;
203 /// Sets routine control parameters. These controls are certain time constants
204 /// defining how the sound is stretched to the desired duration. The three millisecond
205 /// arguments default to -1 (NOTE(review): presumably meaning "keep the current value" -- confirm).
206 /// 'sampleRate' = sample rate of the sound
207 /// 'sequenceMS' = one processing sequence length in milliseconds
208 /// 'seekwindowMS' = seeking window length for scanning the best overlapping
209 /// position
210 /// 'overlapMS' = overlapping length
211 void setParameters(int sampleRate, ///< Samplerate of sound being processed (Hz)
212 int sequenceMS = -1, ///< Single processing sequence length (ms)
213 int seekwindowMS = -1, ///< Offset seeking window length (ms)
214 int overlapMS = -1 ///< Sequence overlapping length (ms)
215 );
217 /// Get routine control parameters, see setParameters() function.
218 /// Any of the parameters to this function can be NULL; in that case the corresponding parameter
219 /// value isn't returned.
220 void getParameters(int *pSampleRate, int *pSequenceMs, int *pSeekWindowMs, int *pOverlapMs) const;
222 /// Adds 'numSamples' samples from the 'samples' memory position into
223 /// the input of the object.
224 virtual void putSamples(
225 const SAMPLETYPE *samples, ///< Input sample data
226 uint numSamples ///< Number of samples in 'samples' so that one sample
227 ///< contains both channels if stereo
228 );
230 /// Returns the nominal input sample requirement for triggering a processing batch: nominalSkip + 0.5 truncated to int, i.e. rounded to nearest for non-negative values.
231 int getInputSampleReq() const
232 {
233 return (int)(nominalSkip + 0.5);
234 }
236 /// Returns the nominal output sample amount when running a processing batch: seekWindowLength - overlapLength.
237 int getOutputBatchSize() const
238 {
239 return seekWindowLength - overlapLength;
240 }
241 };
245 // Implementation-specific class declarations:
247 #ifdef SOUNDTOUCH_ALLOW_MMX
248 /// TDStretch subclass that implements MMX optimized routines for the 16-bit integer sample type; only declared when SOUNDTOUCH_ALLOW_MMX is defined.
249 class TDStretchMMX : public TDStretch
250 {
251 protected:
252 double calcCrossCorr(const short *mixingPos, const short *compare, double &norm) const; ///< NOTE(review): the 'short' signatures here match the base-class virtuals only if SAMPLETYPE is short -- confirm in STTypes.h
253 double calcCrossCorrAccumulate(const short *mixingPos, const short *compare, double &norm) const;
254 virtual void overlapStereo(short *output, const short *input) const;
255 virtual void clearCrossCorrState();
256 };
257 #endif /// SOUNDTOUCH_ALLOW_MMX
260 #ifdef SOUNDTOUCH_ALLOW_SSE
261 /// TDStretch subclass that implements SSE optimized routines for the floating point sample type; only declared when SOUNDTOUCH_ALLOW_SSE is defined.
262 class TDStretchSSE : public TDStretch
263 {
264 protected:
265 double calcCrossCorr(const float *mixingPos, const float *compare, double &norm) const; ///< NOTE(review): the 'float' signatures here match the base-class virtuals only if SAMPLETYPE is float -- confirm in STTypes.h
266 double calcCrossCorrAccumulate(const float *mixingPos, const float *compare, double &norm) const;
267 };
269 #endif /// SOUNDTOUCH_ALLOW_SSE
271 }
272 #endif /// TDStretch_H