|
1 /*********************************************************************** |
|
2 Copyright (c) 2006-2011, Skype Limited. All rights reserved. |
|
3 Redistribution and use in source and binary forms, with or without |
|
4 modification, are permitted provided that the following conditions |
|
5 are met: |
|
6 - Redistributions of source code must retain the above copyright notice, |
|
7 this list of conditions and the following disclaimer. |
|
8 - Redistributions in binary form must reproduce the above copyright |
|
9 notice, this list of conditions and the following disclaimer in the |
|
10 documentation and/or other materials provided with the distribution. |
|
11 - Neither the name of Internet Society, IETF or IETF Trust, nor the |
|
12 names of specific contributors, may be used to endorse or promote |
|
13 products derived from this software without specific prior written |
|
14 permission. |
|
15 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" |
|
16 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
|
17 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
|
18 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE |
|
19 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR |
|
20 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF |
|
21 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS |
|
22 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN |
|
23 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
|
24 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE |
|
25 POSSIBILITY OF SUCH DAMAGE. |
|
26 ***********************************************************************/ |
|
27 |
|
28 #ifndef SILK_DEFINE_H |
|
29 #define SILK_DEFINE_H |
|
30 |
|
31 #include "errors.h" |
|
32 #include "typedef.h" |
|
33 |
|
34 #ifdef __cplusplus |
|
35 extern "C" |
|
36 { |
|
37 #endif |
|
38 |
|
39 /* Max number of encoder channels (1/2) */ |
|
40 #define ENCODER_NUM_CHANNELS 2 |
|
41 /* Number of decoder channels (1/2) */ |
|
42 #define DECODER_NUM_CHANNELS 2 |
|
43 |
|
44 #define MAX_FRAMES_PER_PACKET 3 |
|
45 |
|
46 /* Limits on bitrate */ |
|
47 #define MIN_TARGET_RATE_BPS 5000 |
|
48 #define MAX_TARGET_RATE_BPS 80000 |
|
49 #define TARGET_RATE_TAB_SZ 8 |
|
50 |
|
51 /* LBRR thresholds */ |
|
52 #define LBRR_NB_MIN_RATE_BPS 12000 |
|
53 #define LBRR_MB_MIN_RATE_BPS 14000 |
|
54 #define LBRR_WB_MIN_RATE_BPS 16000 |
|
55 |
|
56 /* DTX settings */ |
|
57 #define NB_SPEECH_FRAMES_BEFORE_DTX 10 /* eq 200 ms */ |
|
58 #define MAX_CONSECUTIVE_DTX 20 /* eq 400 ms */ |
|
59 |
|
60 /* Maximum sampling frequency */ |
|
61 #define MAX_FS_KHZ 16 |
|
62 #define MAX_API_FS_KHZ 48 |
|
63 |
|
64 /* Signal types */ |
|
65 #define TYPE_NO_VOICE_ACTIVITY 0 |
|
66 #define TYPE_UNVOICED 1 |
|
67 #define TYPE_VOICED 2 |
|
68 |
|
69 /* Conditional coding types */ |
|
70 #define CODE_INDEPENDENTLY 0 |
|
71 #define CODE_INDEPENDENTLY_NO_LTP_SCALING 1 |
|
72 #define CODE_CONDITIONALLY 2 |
|
73 |
|
74 /* Settings for stereo processing */ |
|
75 #define STEREO_QUANT_TAB_SIZE 16 |
|
76 #define STEREO_QUANT_SUB_STEPS 5 |
|
77 #define STEREO_INTERP_LEN_MS 8 /* must be even */ |
|
78 #define STEREO_RATIO_SMOOTH_COEF 0.01 /* smoothing coef for signal norms and stereo width */ |
|
79 |
|
80 /* Range of pitch lag estimates */ |
|
81 #define PITCH_EST_MIN_LAG_MS 2 /* 2 ms -> 500 Hz */ |
|
82 #define PITCH_EST_MAX_LAG_MS 18 /* 18 ms -> 56 Hz */ |
|
83 |
|
84 /* Maximum number of subframes */ |
|
85 #define MAX_NB_SUBFR 4 |
|
86 |
|
87 /* Number of samples per frame */ |
|
88 #define LTP_MEM_LENGTH_MS 20 |
|
89 #define SUB_FRAME_LENGTH_MS 5 |
|
90 #define MAX_SUB_FRAME_LENGTH ( SUB_FRAME_LENGTH_MS * MAX_FS_KHZ ) |
|
91 #define MAX_FRAME_LENGTH_MS ( SUB_FRAME_LENGTH_MS * MAX_NB_SUBFR ) |
|
92 #define MAX_FRAME_LENGTH ( MAX_FRAME_LENGTH_MS * MAX_FS_KHZ ) |
|
93 |
|
94 /* Milliseconds of lookahead for pitch analysis */ |
|
95 #define LA_PITCH_MS 2 |
|
96 #define LA_PITCH_MAX ( LA_PITCH_MS * MAX_FS_KHZ ) |
|
97 |
|
98 /* Order of LPC used in find pitch */ |
|
99 #define MAX_FIND_PITCH_LPC_ORDER 16 |
|
100 |
|
101 /* Length of LPC window used in find pitch */ |
|
102 #define FIND_PITCH_LPC_WIN_MS ( 20 + (LA_PITCH_MS << 1) ) |
|
103 #define FIND_PITCH_LPC_WIN_MS_2_SF ( 10 + (LA_PITCH_MS << 1) ) |
|
104 #define FIND_PITCH_LPC_WIN_MAX ( FIND_PITCH_LPC_WIN_MS * MAX_FS_KHZ ) |
|
105 |
|
106 /* Milliseconds of lookahead for noise shape analysis */ |
|
107 #define LA_SHAPE_MS 5 |
|
108 #define LA_SHAPE_MAX ( LA_SHAPE_MS * MAX_FS_KHZ ) |
|
109 |
|
110 /* Maximum length of LPC window used in noise shape analysis */ |
|
111 #define SHAPE_LPC_WIN_MAX ( 15 * MAX_FS_KHZ ) |
|
112 |
|
113 /* dB level of lowest gain quantization level */ |
|
114 #define MIN_QGAIN_DB 2 |
|
115 /* dB level of highest gain quantization level */ |
|
116 #define MAX_QGAIN_DB 88 |
|
117 /* Number of gain quantization levels */ |
|
118 #define N_LEVELS_QGAIN 64 |
|
119 /* Max increase in gain quantization index */ |
|
120 #define MAX_DELTA_GAIN_QUANT 36 |
|
121 /* Max decrease in gain quantization index */ |
|
122 #define MIN_DELTA_GAIN_QUANT -4 |
|
123 |
|
124 /* Quantization offsets (multiples of 4) */ |
|
125 #define OFFSET_VL_Q10 32 |
|
126 #define OFFSET_VH_Q10 100 |
|
127 #define OFFSET_UVL_Q10 100 |
|
128 #define OFFSET_UVH_Q10 240 |
|
129 |
|
130 #define QUANT_LEVEL_ADJUST_Q10 80 |
|
131 |
|
132 /* Maximum numbers of iterations used to stabilize an LPC vector */ |
|
133 #define MAX_LPC_STABILIZE_ITERATIONS 16 |
|
134 #define MAX_PREDICTION_POWER_GAIN 1e4f |
|
135 #define MAX_PREDICTION_POWER_GAIN_AFTER_RESET 1e2f |
|
136 |
|
137 #define MAX_LPC_ORDER 16 |
|
138 #define MIN_LPC_ORDER 10 |
|
139 |
|
140 /* Find Pred Coef defines */ |
|
141 #define LTP_ORDER 5 |
|
142 |
|
143 /* LTP quantization settings */ |
|
144 #define NB_LTP_CBKS 3 |
|
145 |
|
146 /* Flag to use harmonic noise shaping */ |
|
147 #define USE_HARM_SHAPING 1 |
|
148 |
|
149 /* Max LPC order of noise shaping filters */ |
|
150 #define MAX_SHAPE_LPC_ORDER 16 |
|
151 |
|
152 #define HARM_SHAPE_FIR_TAPS 3 |
|
153 |
|
154 /* Maximum number of delayed decision states */ |
|
155 #define MAX_DEL_DEC_STATES 4 |
|
156 |
|
157 #define LTP_BUF_LENGTH 512 |
|
158 #define LTP_MASK ( LTP_BUF_LENGTH - 1 ) |
|
159 |
|
160 #define DECISION_DELAY 32 |
|
161 #define DECISION_DELAY_MASK ( DECISION_DELAY - 1 ) |
|
162 |
|
163 /* Number of subframes for excitation entropy coding */ |
|
164 #define SHELL_CODEC_FRAME_LENGTH 16 |
|
165 #define LOG2_SHELL_CODEC_FRAME_LENGTH 4 |
|
166 #define MAX_NB_SHELL_BLOCKS ( MAX_FRAME_LENGTH / SHELL_CODEC_FRAME_LENGTH ) |
|
167 |
|
168 /* Number of rate levels, for entropy coding of excitation */ |
|
169 #define N_RATE_LEVELS 10 |
|
170 |
|
171 /* Maximum sum of pulses per shell coding frame */ |
|
172 #define MAX_PULSES 16 |
|
173 |
|
174 #define MAX_MATRIX_SIZE MAX_LPC_ORDER /* Max of LPC Order and LTP order */ |
|
175 |
|
176 #if( MAX_LPC_ORDER > DECISION_DELAY ) |
|
177 # define NSQ_LPC_BUF_LENGTH MAX_LPC_ORDER |
|
178 #else |
|
179 # define NSQ_LPC_BUF_LENGTH DECISION_DELAY |
|
180 #endif |
|
181 |
|
182 /***************************/ |
|
183 /* Voice activity detector */ |
|
184 /***************************/ |
|
185 #define VAD_N_BANDS 4 |
|
186 |
|
187 #define VAD_INTERNAL_SUBFRAMES_LOG2 2 |
|
188 #define VAD_INTERNAL_SUBFRAMES ( 1 << VAD_INTERNAL_SUBFRAMES_LOG2 ) |
|
189 |
|
190 #define VAD_NOISE_LEVEL_SMOOTH_COEF_Q16 1024 /* Must be < 4096 */ |
|
191 #define VAD_NOISE_LEVELS_BIAS 50 |
|
192 |
|
193 /* Sigmoid settings */ |
|
194 #define VAD_NEGATIVE_OFFSET_Q5 128 /* sigmoid is 0 at -128 */ |
|
195 #define VAD_SNR_FACTOR_Q16 45000 |
|
196 |
|
197 /* smoothing for SNR measurement */ |
|
198 #define VAD_SNR_SMOOTH_COEF_Q18 4096 |
|
199 |
|
200 /* Size of the piecewise linear cosine approximation table for the LSFs */ |
|
201 #define LSF_COS_TAB_SZ_FIX 128 |
|
202 |
|
203 /******************/ |
|
204 /* NLSF quantizer */ |
|
205 /******************/ |
|
206 #define NLSF_W_Q 2 |
|
207 #define NLSF_VQ_MAX_VECTORS 32 |
|
208 #define NLSF_VQ_MAX_SURVIVORS 32 |
|
209 #define NLSF_QUANT_MAX_AMPLITUDE 4 |
|
210 #define NLSF_QUANT_MAX_AMPLITUDE_EXT 10 |
|
211 #define NLSF_QUANT_LEVEL_ADJ 0.1 |
|
212 #define NLSF_QUANT_DEL_DEC_STATES_LOG2 2 |
|
213 #define NLSF_QUANT_DEL_DEC_STATES ( 1 << NLSF_QUANT_DEL_DEC_STATES_LOG2 ) |
|
214 |
|
215 /* Transition filtering for mode switching */ |
|
216 #define TRANSITION_TIME_MS 5120 /* 5120 = 64 * FRAME_LENGTH_MS * ( TRANSITION_INT_NUM - 1 ) = 64*(20*4)*/ |
|
217 #define TRANSITION_NB 3 /* Hardcoded in tables */ |
|
218 #define TRANSITION_NA 2 /* Hardcoded in tables */ |
|
219 #define TRANSITION_INT_NUM 5 /* Hardcoded in tables */ |
|
220 #define TRANSITION_FRAMES ( TRANSITION_TIME_MS / MAX_FRAME_LENGTH_MS ) |
|
221 #define TRANSITION_INT_STEPS ( TRANSITION_FRAMES / ( TRANSITION_INT_NUM - 1 ) ) |
|
222 |
|
223 /* BWE factors to apply after packet loss */ |
|
224 #define BWE_AFTER_LOSS_Q16 63570 |
|
225 |
|
226 /* Defines for CN generation */ |
|
227 #define CNG_BUF_MASK_MAX 255 /* 2^floor(log2(MAX_FRAME_LENGTH))-1 */ |
|
228 #define CNG_GAIN_SMTH_Q16 4634 /* 0.25^(1/4) */ |
|
229 #define CNG_NLSF_SMTH_Q16 16348 /* 0.25 */ |
|
230 |
|
231 #ifdef __cplusplus |
|
232 } |
|
233 #endif |
|
234 |
|
235 #endif |