media/libsoundtouch/src/TDStretch.h

Thu, 22 Jan 2015 13:21:57 +0100

author
Michael Schloh von Bennewitz <michael@schloh.com>
date
Thu, 22 Jan 2015 13:21:57 +0100
branch
TOR_BUG_9701
changeset 15
b8a032363ba2
permissions
-rw-r--r--

Incorporate requested changes from Mozilla in review:
https://bugzilla.mozilla.org/show_bug.cgi?id=1123480#c6

     1 ////////////////////////////////////////////////////////////////////////////////
     2 /// 
     3 /// Sampled sound tempo changer/time stretch algorithm. Changes the sound tempo 
     4 /// while maintaining the original pitch by using a time domain WSOLA-like method 
     5 /// with several performance-increasing tweaks.
     6 ///
     7 /// Note : MMX/SSE optimized functions reside in separate, platform-specific files 
     8 /// 'mmx_optimized.cpp' and 'sse_optimized.cpp'
     9 ///
    10 /// Author        : Copyright (c) Olli Parviainen
    11 /// Author e-mail : oparviai 'at' iki.fi
    12 /// SoundTouch WWW: http://www.surina.net/soundtouch
    13 ///
    14 ////////////////////////////////////////////////////////////////////////////////
    15 //
    16 // Last changed  : $Date: 2014-04-06 10:57:21 -0500 (Sun, 06 Apr 2014) $
    17 // File revision : $Revision: 4 $
    18 //
    19 // $Id: TDStretch.h 195 2014-04-06 15:57:21Z oparviai $
    20 //
    21 ////////////////////////////////////////////////////////////////////////////////
    22 //
    23 // License :
    24 //
    25 //  SoundTouch audio processing library
    26 //  Copyright (c) Olli Parviainen
    27 //
    28 //  This library is free software; you can redistribute it and/or
    29 //  modify it under the terms of the GNU Lesser General Public
    30 //  License as published by the Free Software Foundation; either
    31 //  version 2.1 of the License, or (at your option) any later version.
    32 //
    33 //  This library is distributed in the hope that it will be useful,
    34 //  but WITHOUT ANY WARRANTY; without even the implied warranty of
    35 //  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
    36 //  Lesser General Public License for more details.
    37 //
    38 //  You should have received a copy of the GNU Lesser General Public
    39 //  License along with this library; if not, write to the Free Software
    40 //  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
    41 //
    42 ////////////////////////////////////////////////////////////////////////////////
    44 #ifndef TDStretch_H
    45 #define TDStretch_H
    47 #include <stddef.h>
    48 #include "STTypes.h"
    49 #include "RateTransposer.h"
    50 #include "FIFOSamplePipe.h"
    52 namespace soundtouch
    53 {
    55 /// Default values for sound processing parameters:
    56 /// Note that the default parameters are tuned for processing contemporary popular 
    57 /// music. For speech processing applications these parameters are better suited:
    58 ///     #define DEFAULT_SEQUENCE_MS     40
    59 ///     #define DEFAULT_SEEKWINDOW_MS   15
    60 ///     #define DEFAULT_OVERLAP_MS      8
    61 ///
    63 /// Default length of a single processing sequence, in milliseconds. This determines the
    64 /// length of the sequences into which the time-stretch algorithm chops the original sound.
    65 ///
    66 /// The larger this value is, the fewer sequences are used in processing. In principle
    67 /// a bigger value sounds better when slowing down tempo, but worse when increasing tempo
    68 /// and vice versa.
    69 ///
    70 /// Increasing this value reduces computational burden & vice versa.
    71 //#define DEFAULT_SEQUENCE_MS         40
    72 #define DEFAULT_SEQUENCE_MS         USE_AUTO_SEQUENCE_LEN
    74 /// Passing this value as the sequence length selects an automatic parameter value
    75 /// according to the tempo setting (recommended). It is defined after its use in DEFAULT_SEQUENCE_MS; that is fine because macros are expanded where they are used.
    76 #define USE_AUTO_SEQUENCE_LEN       0
    78 /// Default seeking window length, in milliseconds, for the algorithm that finds the best 
    79 /// possible overlapping location. This determines how wide a window the algorithm may search 
    80 /// for an optimal joining location when mixing the sound sequences back together. 
    81 ///
    82 /// The bigger this window setting is, the higher the chance of finding a better mixing
    83 /// position, but at the same time large values may cause a "drifting" artifact
    84 /// because consecutive sequences will be taken at more uneven intervals.
    85 ///
    86 /// If there's a disturbing artifact that sounds as if a constant frequency was drifting 
    87 /// around, try reducing this setting.
    88 ///
    89 /// Increasing this value increases computational burden & vice versa.
    90 //#define DEFAULT_SEEKWINDOW_MS       15
    91 #define DEFAULT_SEEKWINDOW_MS       USE_AUTO_SEEKWINDOW_LEN
    93 /// Passing this value as the seek window length selects an automatic parameter value
    94 /// according to the tempo setting (recommended). It is defined after its use in DEFAULT_SEEKWINDOW_MS; that is fine because macros are expanded where they are used.
    95 #define USE_AUTO_SEEKWINDOW_LEN     0
    97 /// Overlap length in milliseconds. When the chopped sound sequences are mixed back together 
    98 /// to form a continuous sound stream, this parameter defines over how long a period the two 
    99 /// consecutive sequences are allowed to overlap each other. 
   100 ///
   101 /// This parameter should not be that critical. If you reduce the DEFAULT_SEQUENCE_MS setting 
   102 /// by a large amount, you might wish to try a smaller value for this one.
   103 ///
   104 /// Increasing this value increases computational burden & vice versa.
   105 #define DEFAULT_OVERLAP_MS      8
   108 /// Class that does the time-stretch (tempo change) effect for the processed
   109 /// sound. Derives from FIFOProcessor and holds separate input and output FIFOSampleBuffer members.
   110 class TDStretch : public FIFOProcessor
   111 {
   112 protected:
   113     int channels;
   114     int sampleReq;
   115     float tempo;
   117     SAMPLETYPE *pMidBuffer;
   118     SAMPLETYPE *pMidBufferUnaligned; // NOTE(review): presumably the raw allocation that pMidBuffer is aligned within - confirm in TDStretch.cpp
   119     int overlapLength;
   120     int seekLength;
   121     int seekWindowLength;
   122     int overlapDividerBits;
   123     int slopingDivider;
   124     float nominalSkip;
   125     float skipFract;
   126     FIFOSampleBuffer outputBuffer;
   127     FIFOSampleBuffer inputBuffer;
   128     bool bQuickSeek;
   130     int sampleRate;
   131     int sequenceMs;
   132     int seekWindowMs;
   133     int overlapMs;
   134     bool bAutoSeqSetting; // NOTE(review): presumably set when sequenceMs equals USE_AUTO_SEQUENCE_LEN - confirm
   135     bool bAutoSeekSetting; // NOTE(review): presumably set when seekWindowMs equals USE_AUTO_SEEKWINDOW_LEN - confirm
   137     void acceptNewOverlapLength(int newOverlapLength);
   139     virtual void clearCrossCorrState();
   140     void calculateOverlapLength(int overlapMs);
   142     virtual double calcCrossCorr(const SAMPLETYPE *mixingPos, const SAMPLETYPE *compare, double &norm) const;
   143     virtual double calcCrossCorrAccumulate(const SAMPLETYPE *mixingPos, const SAMPLETYPE *compare, double &norm) const;
   145     virtual int seekBestOverlapPositionFull(const SAMPLETYPE *refPos);
   146     virtual int seekBestOverlapPositionQuick(const SAMPLETYPE *refPos);
   147     int seekBestOverlapPosition(const SAMPLETYPE *refPos);
   149     virtual void overlapStereo(SAMPLETYPE *output, const SAMPLETYPE *input) const;
   150     virtual void overlapMono(SAMPLETYPE *output, const SAMPLETYPE *input) const;
   151     virtual void overlapMulti(SAMPLETYPE *output, const SAMPLETYPE *input) const;
   153     void clearMidBuffer();
   154     void overlap(SAMPLETYPE *output, const SAMPLETYPE *input, uint ovlPos) const;
   156     void calcSeqParameters();
   158     /// Changes the tempo of the buffered sound samples.
   159     /// NOTE(review): this function is declared void and takes no arguments, so it returns nothing
   160     /// to the caller; presumably it consumes inputBuffer and fills outputBuffer - confirm in the
   161     /// implementation. (An older comment mentioned 'set_returnBuffer_size', which is not declared in this header.)
   162     void processSamples();
   164 public:
   165     TDStretch();
   166     virtual ~TDStretch();
   168     /// Class-specific overload of operator 'new'. 
   169     /// NOTE(review): the comment on newInstance() says to use that function instead of 'new'; confirm in the implementation what this overload does.
   170     static void *operator new(size_t s);
   172     /// Use this function instead of "new" operator to create a new instance of this class. 
   173     /// This function automatically chooses a correct feature set depending on if the CPU
   174     /// supports MMX/SSE/etc extensions.
   175     static TDStretch *newInstance();
   177     /// Returns a pointer to the output buffer object (the 'outputBuffer' member)
   178     FIFOSamplePipe *getOutput() { return &outputBuffer; };
   180     /// Returns a pointer to the input buffer object (the 'inputBuffer' member)
   181     FIFOSamplePipe *getInput() { return &inputBuffer; };
   183     /// Sets new target tempo. Smaller values represent slower tempo, larger values faster tempo. 
   184     /// NOTE(review): the older comment called normal tempo 'SCALE', which is not defined in this header - confirm the neutral value.
   185     void setTempo(float newTempo);
   187     /// Presumably clears the buffered samples; returns nothing (declared void) - confirm exact scope in the implementation.
   188     virtual void clear();
   190     /// Clears the input buffer
   191     void clearInput();
   193     /// Sets the number of channels, 1 = mono, 2 = stereo
   194     void setChannels(int numChannels);
   196     /// Enables/disables the quick position seeking algorithm. Pass false to disable, 
   197     /// true to enable
   198     void enableQuickSeek(bool enable);
   200     /// Returns true if the quick seeking algorithm is enabled.
   201     bool isQuickSeekEnabled() const;
   203     /// Sets routine control parameters. These are time constants
   204     /// defining how the sound is stretched to the desired duration.
   205     // All three millisecond arguments default to -1. NOTE(review): presumably -1 means "keep the current value" - confirm.
   206     /// 'sampleRate' = sample rate of the sound
   207     /// 'sequenceMS' = one processing sequence length in milliseconds
   208     /// 'seekwindowMS' = seeking window length for scanning the best overlapping 
   209     ///      position
   210     /// 'overlapMS' = overlapping length
   211     void setParameters(int sampleRate,          ///< Samplerate of sound being processed (Hz)
   212                        int sequenceMS = -1,     ///< Single processing sequence length (ms)
   213                        int seekwindowMS = -1,   ///< Offset seeking window length (ms)
   214                        int overlapMS = -1       ///< Sequence overlapping length (ms)
   215                        );
   217     /// Get routine control parameters, see setParameters() function.
   218     /// Any of the parameters to this function can be NULL; in that case the corresponding parameter
   219     /// value isn't returned.
   220     void getParameters(int *pSampleRate, int *pSequenceMs, int *pSeekWindowMs, int *pOverlapMs) const;
   222     /// Adds 'numSamples' samples from the 'samples' memory position into
   223     /// the input of the object.
   224     virtual void putSamples(
   225             const SAMPLETYPE *samples,  ///< Input sample data
   226             uint numSamples                         ///< Number of samples in 'samples' so that one sample
   227                                                     ///< contains both channels if stereo
   228             );
   230     /// Returns the nominal input sample requirement for triggering a processing batch: 'nominalSkip' rounded by adding 0.5 and truncating to int
   231     int getInputSampleReq() const
   232     {
   233         return (int)(nominalSkip + 0.5);
   234     }
   236     /// Returns the nominal output sample amount when running a processing batch: 'seekWindowLength' minus 'overlapLength'
   237     int getOutputBatchSize() const
   238     {
   239         return seekWindowLength - overlapLength;
   240     }
   241 };
   245 // Implementation-specific class declarations:
   247 #ifdef SOUNDTOUCH_ALLOW_MMX
   248     /// Class that implements MMX optimized routines for the 16bit integer sample type. Only declared when SOUNDTOUCH_ALLOW_MMX is defined.
   249     class TDStretchMMX : public TDStretch
   250     {
   251     protected:
   252         double calcCrossCorr(const short *mixingPos, const short *compare, double &norm) const; // overrides the TDStretch virtual only when SAMPLETYPE is short
   253         double calcCrossCorrAccumulate(const short *mixingPos, const short *compare, double &norm) const; // same condition as calcCrossCorr
   254         virtual void overlapStereo(short *output, const short *input) const; // same condition: signature matches the base only when SAMPLETYPE is short
   255         virtual void clearCrossCorrState();
   256     };
   257 #endif /// SOUNDTOUCH_ALLOW_MMX
   260 #ifdef SOUNDTOUCH_ALLOW_SSE
   261     /// Class that implements SSE optimized routines for the floating point sample type. Only declared when SOUNDTOUCH_ALLOW_SSE is defined.
   262     class TDStretchSSE : public TDStretch
   263     {
   264     protected:
   265         double calcCrossCorr(const float *mixingPos, const float *compare, double &norm) const; // overrides the TDStretch virtual only when SAMPLETYPE is float
   266         double calcCrossCorrAccumulate(const float *mixingPos, const float *compare, double &norm) const; // same condition as calcCrossCorr
   267     };
   269 #endif /// SOUNDTOUCH_ALLOW_SSE
   271 }
   272 #endif  /// TDStretch_H

mercurial