1.1 --- /dev/null Thu Jan 01 00:00:00 1970 +0000 1.2 +++ b/media/libopus/silk/float/find_pitch_lags_FLP.c Wed Dec 31 06:09:35 2014 +0100 1.3 @@ -0,0 +1,132 @@ 1.4 +/*********************************************************************** 1.5 +Copyright (c) 2006-2011, Skype Limited. All rights reserved. 1.6 +Redistribution and use in source and binary forms, with or without 1.7 +modification, are permitted provided that the following conditions 1.8 +are met: 1.9 +- Redistributions of source code must retain the above copyright notice, 1.10 +this list of conditions and the following disclaimer. 1.11 +- Redistributions in binary form must reproduce the above copyright 1.12 +notice, this list of conditions and the following disclaimer in the 1.13 +documentation and/or other materials provided with the distribution. 1.14 +- Neither the name of Internet Society, IETF or IETF Trust, nor the 1.15 +names of specific contributors, may be used to endorse or promote 1.16 +products derived from this software without specific prior written 1.17 +permission. 1.18 +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 1.19 +AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 1.20 +IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 1.21 +ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE 1.22 +LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 1.23 +CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 1.24 +SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 1.25 +INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 1.26 +CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 1.27 +ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 1.28 +POSSIBILITY OF SUCH DAMAGE. 1.29 +***********************************************************************/ 1.30 + 1.31 +#ifdef HAVE_CONFIG_H 1.32 +#include "config.h" 1.33 +#endif 1.34 + 1.35 +#include <stdlib.h> 1.36 +#include "main_FLP.h" 1.37 +#include "tuning_parameters.h" 1.38 + 1.39 +void silk_find_pitch_lags_FLP( 1.40 + silk_encoder_state_FLP *psEnc, /* I/O Encoder state FLP */ 1.41 + silk_encoder_control_FLP *psEncCtrl, /* I/O Encoder control FLP */ 1.42 + silk_float res[], /* O Residual */ 1.43 + const silk_float x[], /* I Speech signal */ 1.44 + int arch /* I Run-time architecture */ 1.45 +) 1.46 +{ 1.47 + opus_int buf_len; 1.48 + silk_float thrhld, res_nrg; 1.49 + const silk_float *x_buf_ptr, *x_buf; 1.50 + silk_float auto_corr[ MAX_FIND_PITCH_LPC_ORDER + 1 ]; 1.51 + silk_float A[ MAX_FIND_PITCH_LPC_ORDER ]; 1.52 + silk_float refl_coef[ MAX_FIND_PITCH_LPC_ORDER ]; 1.53 + silk_float Wsig[ FIND_PITCH_LPC_WIN_MAX ]; 1.54 + silk_float *Wsig_ptr; 1.55 + 1.56 + /******************************************/ 1.57 + /* Set up buffer lengths etc based on Fs */ 1.58 + /******************************************/ 1.59 + buf_len = psEnc->sCmn.la_pitch + psEnc->sCmn.frame_length + psEnc->sCmn.ltp_mem_length; 1.60 + 1.61 + /* Safety check */ 1.62 + silk_assert( buf_len >= psEnc->sCmn.pitch_LPC_win_length ); 1.63 + 1.64 + x_buf = x - psEnc->sCmn.ltp_mem_length; 1.65 + 1.66 + /******************************************/ 1.67 + /* Estimate LPC AR coeficients */ 1.68 + /******************************************/ 1.69 + 1.70 + /* Calculate windowed signal */ 1.71 + 1.72 + /* First LA_LTP samples */ 1.73 + x_buf_ptr = x_buf + buf_len - psEnc->sCmn.pitch_LPC_win_length; 1.74 + Wsig_ptr = Wsig; 1.75 + silk_apply_sine_window_FLP( Wsig_ptr, x_buf_ptr, 1, psEnc->sCmn.la_pitch ); 1.76 + 1.77 + /* Middle non-windowed samples */ 1.78 + Wsig_ptr += psEnc->sCmn.la_pitch; 1.79 + x_buf_ptr += psEnc->sCmn.la_pitch; 1.80 + silk_memcpy( Wsig_ptr, x_buf_ptr, ( psEnc->sCmn.pitch_LPC_win_length - ( psEnc->sCmn.la_pitch << 1 ) ) * sizeof( silk_float ) ); 1.81 + 1.82 + /* Last LA_LTP samples */ 1.83 + Wsig_ptr += psEnc->sCmn.pitch_LPC_win_length - ( psEnc->sCmn.la_pitch << 1 ); 1.84 + x_buf_ptr += psEnc->sCmn.pitch_LPC_win_length - ( psEnc->sCmn.la_pitch << 1 ); 1.85 + silk_apply_sine_window_FLP( Wsig_ptr, x_buf_ptr, 2, psEnc->sCmn.la_pitch ); 1.86 + 1.87 + /* Calculate autocorrelation sequence */ 1.88 + silk_autocorrelation_FLP( auto_corr, Wsig, psEnc->sCmn.pitch_LPC_win_length, psEnc->sCmn.pitchEstimationLPCOrder + 1 ); 1.89 + 1.90 + /* Add white noise, as a fraction of the energy */ 1.91 + auto_corr[ 0 ] += auto_corr[ 0 ] * FIND_PITCH_WHITE_NOISE_FRACTION + 1; 1.92 + 1.93 + /* Calculate the reflection coefficients using Schur */ 1.94 + res_nrg = silk_schur_FLP( refl_coef, auto_corr, psEnc->sCmn.pitchEstimationLPCOrder ); 1.95 + 1.96 + /* Prediction gain */ 1.97 + psEncCtrl->predGain = auto_corr[ 0 ] / silk_max_float( res_nrg, 1.0f ); 1.98 + 1.99 + /* Convert reflection coefficients to prediction coefficients */ 1.100 + silk_k2a_FLP( A, refl_coef, psEnc->sCmn.pitchEstimationLPCOrder ); 1.101 + 1.102 + /* Bandwidth expansion */ 1.103 + silk_bwexpander_FLP( A, psEnc->sCmn.pitchEstimationLPCOrder, FIND_PITCH_BANDWIDTH_EXPANSION ); 1.104 + 1.105 + /*****************************************/ 1.106 + /* LPC analysis filtering */ 1.107 + /*****************************************/ 1.108 + silk_LPC_analysis_filter_FLP( res, A, x_buf, buf_len, psEnc->sCmn.pitchEstimationLPCOrder ); 1.109 + 1.110 + if( psEnc->sCmn.indices.signalType != TYPE_NO_VOICE_ACTIVITY && psEnc->sCmn.first_frame_after_reset == 0 ) { 1.111 + /* Threshold for pitch estimator */ 1.112 + thrhld = 0.6f; 1.113 + thrhld -= 0.004f * psEnc->sCmn.pitchEstimationLPCOrder; 1.114 + thrhld -= 0.1f * psEnc->sCmn.speech_activity_Q8 * ( 1.0f / 256.0f ); 1.115 + thrhld -= 0.15f * (psEnc->sCmn.prevSignalType >> 1); 1.116 + thrhld -= 0.1f * psEnc->sCmn.input_tilt_Q15 * ( 1.0f / 32768.0f ); 1.117 + 1.118 + /*****************************************/ 1.119 + /* Call Pitch estimator */ 1.120 + /*****************************************/ 1.121 + if( silk_pitch_analysis_core_FLP( res, psEncCtrl->pitchL, &psEnc->sCmn.indices.lagIndex, 1.122 + &psEnc->sCmn.indices.contourIndex, &psEnc->LTPCorr, psEnc->sCmn.prevLag, psEnc->sCmn.pitchEstimationThreshold_Q16 / 65536.0f, 1.123 + thrhld, psEnc->sCmn.fs_kHz, psEnc->sCmn.pitchEstimationComplexity, psEnc->sCmn.nb_subfr, arch ) == 0 ) 1.124 + { 1.125 + psEnc->sCmn.indices.signalType = TYPE_VOICED; 1.126 + } else { 1.127 + psEnc->sCmn.indices.signalType = TYPE_UNVOICED; 1.128 + } 1.129 + } else { 1.130 + silk_memset( psEncCtrl->pitchL, 0, sizeof( psEncCtrl->pitchL ) ); 1.131 + psEnc->sCmn.indices.lagIndex = 0; 1.132 + psEnc->sCmn.indices.contourIndex = 0; 1.133 + psEnc->LTPCorr = 0; 1.134 + } 1.135 +}