1*a58d3d2aSXin Li /*********************************************************************** 2*a58d3d2aSXin Li Copyright (c) 2006-2011, Skype Limited. All rights reserved. 3*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without 4*a58d3d2aSXin Li modification, are permitted provided that the following conditions 5*a58d3d2aSXin Li are met: 6*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright notice, 7*a58d3d2aSXin Li this list of conditions and the following disclaimer. 8*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright 9*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the 10*a58d3d2aSXin Li documentation and/or other materials provided with the distribution. 11*a58d3d2aSXin Li - Neither the name of Internet Society, IETF or IETF Trust, nor the 12*a58d3d2aSXin Li names of specific contributors, may be used to endorse or promote 13*a58d3d2aSXin Li products derived from this software without specific prior written 14*a58d3d2aSXin Li permission. 15*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 16*a58d3d2aSXin Li AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 17*a58d3d2aSXin Li IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 18*a58d3d2aSXin Li ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE 19*a58d3d2aSXin Li LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 20*a58d3d2aSXin Li CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 21*a58d3d2aSXin Li SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 22*a58d3d2aSXin Li INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 23*a58d3d2aSXin Li CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 24*a58d3d2aSXin Li ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 25*a58d3d2aSXin Li POSSIBILITY OF SUCH DAMAGE. 26*a58d3d2aSXin Li ***********************************************************************/ 27*a58d3d2aSXin Li 28*a58d3d2aSXin Li #ifndef SILK_DEFINE_H 29*a58d3d2aSXin Li #define SILK_DEFINE_H 30*a58d3d2aSXin Li 31*a58d3d2aSXin Li #include "errors.h" 32*a58d3d2aSXin Li #include "typedef.h" 33*a58d3d2aSXin Li 34*a58d3d2aSXin Li #ifdef __cplusplus 35*a58d3d2aSXin Li extern "C" 36*a58d3d2aSXin Li { 37*a58d3d2aSXin Li #endif 38*a58d3d2aSXin Li 39*a58d3d2aSXin Li /* Max number of encoder channels (1/2) */ 40*a58d3d2aSXin Li #define ENCODER_NUM_CHANNELS 2 41*a58d3d2aSXin Li /* Number of decoder channels (1/2) */ 42*a58d3d2aSXin Li #define DECODER_NUM_CHANNELS 2 43*a58d3d2aSXin Li 44*a58d3d2aSXin Li #define MAX_FRAMES_PER_PACKET 3 45*a58d3d2aSXin Li 46*a58d3d2aSXin Li /* Limits on bitrate */ 47*a58d3d2aSXin Li #define MIN_TARGET_RATE_BPS 5000 48*a58d3d2aSXin Li #define MAX_TARGET_RATE_BPS 80000 49*a58d3d2aSXin Li 50*a58d3d2aSXin Li /* LBRR thresholds */ 51*a58d3d2aSXin Li #define LBRR_NB_MIN_RATE_BPS 12000 52*a58d3d2aSXin Li #define LBRR_MB_MIN_RATE_BPS 14000 53*a58d3d2aSXin Li #define LBRR_WB_MIN_RATE_BPS 16000 54*a58d3d2aSXin Li 55*a58d3d2aSXin Li /* DTX settings */ 56*a58d3d2aSXin Li #define NB_SPEECH_FRAMES_BEFORE_DTX 10 /* eq 200 ms */ 57*a58d3d2aSXin Li #define MAX_CONSECUTIVE_DTX 20 /* eq 400 ms */ 58*a58d3d2aSXin Li #define DTX_ACTIVITY_THRESHOLD 0.1f 59*a58d3d2aSXin Li 60*a58d3d2aSXin Li /* VAD decision */ 61*a58d3d2aSXin Li #define VAD_NO_DECISION -1 62*a58d3d2aSXin Li #define VAD_NO_ACTIVITY 0 63*a58d3d2aSXin Li #define VAD_ACTIVITY 1 64*a58d3d2aSXin Li 65*a58d3d2aSXin Li /* Maximum sampling frequency */ 66*a58d3d2aSXin Li #define MAX_FS_KHZ 16 67*a58d3d2aSXin Li #define MAX_API_FS_KHZ 48 68*a58d3d2aSXin Li 69*a58d3d2aSXin Li /* Signal types */ 70*a58d3d2aSXin Li #define TYPE_NO_VOICE_ACTIVITY 0 71*a58d3d2aSXin Li #define TYPE_UNVOICED 1 72*a58d3d2aSXin Li #define TYPE_VOICED 2 73*a58d3d2aSXin Li 74*a58d3d2aSXin Li /* Conditional coding types */ 75*a58d3d2aSXin Li #define CODE_INDEPENDENTLY 0 76*a58d3d2aSXin Li #define CODE_INDEPENDENTLY_NO_LTP_SCALING 1 77*a58d3d2aSXin Li #define CODE_CONDITIONALLY 2 78*a58d3d2aSXin Li 79*a58d3d2aSXin Li /* Settings for stereo processing */ 80*a58d3d2aSXin Li #define STEREO_QUANT_TAB_SIZE 16 81*a58d3d2aSXin Li #define STEREO_QUANT_SUB_STEPS 5 82*a58d3d2aSXin Li #define STEREO_INTERP_LEN_MS 8 /* must be even */ 83*a58d3d2aSXin Li #define STEREO_RATIO_SMOOTH_COEF 0.01 /* smoothing coef for signal norms and stereo width */ 84*a58d3d2aSXin Li 85*a58d3d2aSXin Li /* Range of pitch lag estimates */ 86*a58d3d2aSXin Li #define PITCH_EST_MIN_LAG_MS 2 /* 2 ms -> 500 Hz */ 87*a58d3d2aSXin Li #define PITCH_EST_MAX_LAG_MS 18 /* 18 ms -> 56 Hz */ 88*a58d3d2aSXin Li 89*a58d3d2aSXin Li /* Maximum number of subframes */ 90*a58d3d2aSXin Li #define MAX_NB_SUBFR 4 91*a58d3d2aSXin Li 92*a58d3d2aSXin Li /* Number of samples per frame */ 93*a58d3d2aSXin Li #define LTP_MEM_LENGTH_MS 20 94*a58d3d2aSXin Li #define SUB_FRAME_LENGTH_MS 5 95*a58d3d2aSXin Li #define MAX_SUB_FRAME_LENGTH ( SUB_FRAME_LENGTH_MS * MAX_FS_KHZ ) 96*a58d3d2aSXin Li #define MAX_FRAME_LENGTH_MS ( SUB_FRAME_LENGTH_MS * MAX_NB_SUBFR ) 97*a58d3d2aSXin Li #define MAX_FRAME_LENGTH ( MAX_FRAME_LENGTH_MS * MAX_FS_KHZ ) 98*a58d3d2aSXin Li 99*a58d3d2aSXin Li /* Milliseconds of lookahead for pitch analysis */ 100*a58d3d2aSXin Li #define LA_PITCH_MS 2 101*a58d3d2aSXin Li #define LA_PITCH_MAX ( LA_PITCH_MS * MAX_FS_KHZ ) 102*a58d3d2aSXin Li 103*a58d3d2aSXin Li /* Order of LPC used in find pitch */ 104*a58d3d2aSXin Li #define MAX_FIND_PITCH_LPC_ORDER 16 105*a58d3d2aSXin Li 106*a58d3d2aSXin Li /* Length of LPC window used in find pitch */ 107*a58d3d2aSXin Li #define FIND_PITCH_LPC_WIN_MS ( 20 + (LA_PITCH_MS << 1) ) 108*a58d3d2aSXin Li #define FIND_PITCH_LPC_WIN_MS_2_SF ( 10 + (LA_PITCH_MS << 1) ) 109*a58d3d2aSXin Li #define FIND_PITCH_LPC_WIN_MAX ( FIND_PITCH_LPC_WIN_MS * MAX_FS_KHZ ) 110*a58d3d2aSXin Li 111*a58d3d2aSXin Li /* Milliseconds of lookahead for noise shape analysis */ 112*a58d3d2aSXin Li #define LA_SHAPE_MS 5 113*a58d3d2aSXin Li #define LA_SHAPE_MAX ( LA_SHAPE_MS * MAX_FS_KHZ ) 114*a58d3d2aSXin Li 115*a58d3d2aSXin Li /* Maximum length of LPC window used in noise shape analysis */ 116*a58d3d2aSXin Li #define SHAPE_LPC_WIN_MAX ( 15 * MAX_FS_KHZ ) 117*a58d3d2aSXin Li 118*a58d3d2aSXin Li /* dB level of lowest gain quantization level */ 119*a58d3d2aSXin Li #define MIN_QGAIN_DB 2 120*a58d3d2aSXin Li /* dB level of highest gain quantization level */ 121*a58d3d2aSXin Li #define MAX_QGAIN_DB 88 122*a58d3d2aSXin Li /* Number of gain quantization levels */ 123*a58d3d2aSXin Li #define N_LEVELS_QGAIN 64 124*a58d3d2aSXin Li /* Max increase in gain quantization index */ 125*a58d3d2aSXin Li #define MAX_DELTA_GAIN_QUANT 36 126*a58d3d2aSXin Li /* Max decrease in gain quantization index */ 127*a58d3d2aSXin Li #define MIN_DELTA_GAIN_QUANT -4 128*a58d3d2aSXin Li 129*a58d3d2aSXin Li /* Quantization offsets (multiples of 4) */ 130*a58d3d2aSXin Li #define OFFSET_VL_Q10 32 131*a58d3d2aSXin Li #define OFFSET_VH_Q10 100 132*a58d3d2aSXin Li #define OFFSET_UVL_Q10 100 133*a58d3d2aSXin Li #define OFFSET_UVH_Q10 240 134*a58d3d2aSXin Li 135*a58d3d2aSXin Li #define QUANT_LEVEL_ADJUST_Q10 80 136*a58d3d2aSXin Li 137*a58d3d2aSXin Li /* Maximum numbers of iterations used to stabilize an LPC vector */ 138*a58d3d2aSXin Li #define MAX_LPC_STABILIZE_ITERATIONS 16 139*a58d3d2aSXin Li #define MAX_PREDICTION_POWER_GAIN 1e4f 140*a58d3d2aSXin Li #define MAX_PREDICTION_POWER_GAIN_AFTER_RESET 1e2f 141*a58d3d2aSXin Li 142*a58d3d2aSXin Li #define MAX_LPC_ORDER 16 143*a58d3d2aSXin Li #define MIN_LPC_ORDER 10 144*a58d3d2aSXin Li 145*a58d3d2aSXin Li /* Find Pred Coef defines */ 146*a58d3d2aSXin Li #define LTP_ORDER 5 147*a58d3d2aSXin Li 148*a58d3d2aSXin Li /* LTP quantization settings */ 149*a58d3d2aSXin Li #define NB_LTP_CBKS 3 150*a58d3d2aSXin Li 151*a58d3d2aSXin Li /* Flag to use harmonic noise shaping */ 152*a58d3d2aSXin Li #define USE_HARM_SHAPING 1 153*a58d3d2aSXin Li 154*a58d3d2aSXin Li /* Max LPC order of noise shaping filters */ 155*a58d3d2aSXin Li #define MAX_SHAPE_LPC_ORDER 24 156*a58d3d2aSXin Li 157*a58d3d2aSXin Li #define HARM_SHAPE_FIR_TAPS 3 158*a58d3d2aSXin Li 159*a58d3d2aSXin Li /* Maximum number of delayed decision states */ 160*a58d3d2aSXin Li #define MAX_DEL_DEC_STATES 4 161*a58d3d2aSXin Li 162*a58d3d2aSXin Li #define LTP_BUF_LENGTH 512 163*a58d3d2aSXin Li #define LTP_MASK ( LTP_BUF_LENGTH - 1 ) 164*a58d3d2aSXin Li 165*a58d3d2aSXin Li #define DECISION_DELAY 40 166*a58d3d2aSXin Li 167*a58d3d2aSXin Li /* Number of subframes for excitation entropy coding */ 168*a58d3d2aSXin Li #define SHELL_CODEC_FRAME_LENGTH 16 169*a58d3d2aSXin Li #define LOG2_SHELL_CODEC_FRAME_LENGTH 4 170*a58d3d2aSXin Li #define MAX_NB_SHELL_BLOCKS ( MAX_FRAME_LENGTH / SHELL_CODEC_FRAME_LENGTH ) 171*a58d3d2aSXin Li 172*a58d3d2aSXin Li /* Number of rate levels, for entropy coding of excitation */ 173*a58d3d2aSXin Li #define N_RATE_LEVELS 10 174*a58d3d2aSXin Li 175*a58d3d2aSXin Li /* Maximum sum of pulses per shell coding frame */ 176*a58d3d2aSXin Li #define SILK_MAX_PULSES 16 177*a58d3d2aSXin Li 178*a58d3d2aSXin Li #define MAX_MATRIX_SIZE MAX_LPC_ORDER /* Max of LPC Order and LTP order */ 179*a58d3d2aSXin Li 180*a58d3d2aSXin Li # define NSQ_LPC_BUF_LENGTH MAX_LPC_ORDER 181*a58d3d2aSXin Li 182*a58d3d2aSXin Li /***************************/ 183*a58d3d2aSXin Li /* Voice activity detector */ 184*a58d3d2aSXin Li /***************************/ 185*a58d3d2aSXin Li #define VAD_N_BANDS 4 186*a58d3d2aSXin Li 187*a58d3d2aSXin Li #define VAD_INTERNAL_SUBFRAMES_LOG2 2 188*a58d3d2aSXin Li #define VAD_INTERNAL_SUBFRAMES ( 1 << VAD_INTERNAL_SUBFRAMES_LOG2 ) 189*a58d3d2aSXin Li 190*a58d3d2aSXin Li #define VAD_NOISE_LEVEL_SMOOTH_COEF_Q16 1024 /* Must be < 4096 */ 191*a58d3d2aSXin Li #define VAD_NOISE_LEVELS_BIAS 50 192*a58d3d2aSXin Li 193*a58d3d2aSXin Li /* Sigmoid settings */ 194*a58d3d2aSXin Li #define VAD_NEGATIVE_OFFSET_Q5 128 /* sigmoid is 0 at -128 */ 195*a58d3d2aSXin Li #define VAD_SNR_FACTOR_Q16 45000 196*a58d3d2aSXin Li 197*a58d3d2aSXin Li /* smoothing for SNR measurement */ 198*a58d3d2aSXin Li #define VAD_SNR_SMOOTH_COEF_Q18 4096 199*a58d3d2aSXin Li 200*a58d3d2aSXin Li /* Size of the piecewise linear cosine approximation table for the LSFs */ 201*a58d3d2aSXin Li #define LSF_COS_TAB_SZ_FIX 128 202*a58d3d2aSXin Li 203*a58d3d2aSXin Li /******************/ 204*a58d3d2aSXin Li /* NLSF quantizer */ 205*a58d3d2aSXin Li /******************/ 206*a58d3d2aSXin Li #define NLSF_W_Q 2 207*a58d3d2aSXin Li #define NLSF_VQ_MAX_VECTORS 32 208*a58d3d2aSXin Li #define NLSF_QUANT_MAX_AMPLITUDE 4 209*a58d3d2aSXin Li #define NLSF_QUANT_MAX_AMPLITUDE_EXT 10 210*a58d3d2aSXin Li #define NLSF_QUANT_LEVEL_ADJ 0.1 211*a58d3d2aSXin Li #define NLSF_QUANT_DEL_DEC_STATES_LOG2 2 212*a58d3d2aSXin Li #define NLSF_QUANT_DEL_DEC_STATES ( 1 << NLSF_QUANT_DEL_DEC_STATES_LOG2 ) 213*a58d3d2aSXin Li 214*a58d3d2aSXin Li /* Transition filtering for mode switching */ 215*a58d3d2aSXin Li #define TRANSITION_TIME_MS 5120 /* 5120 = 64 * FRAME_LENGTH_MS * ( TRANSITION_INT_NUM - 1 ) = 64*(20*4)*/ 216*a58d3d2aSXin Li #define TRANSITION_NB 3 /* Hardcoded in tables */ 217*a58d3d2aSXin Li #define TRANSITION_NA 2 /* Hardcoded in tables */ 218*a58d3d2aSXin Li #define TRANSITION_INT_NUM 5 /* Hardcoded in tables */ 219*a58d3d2aSXin Li #define TRANSITION_FRAMES ( TRANSITION_TIME_MS / MAX_FRAME_LENGTH_MS ) 220*a58d3d2aSXin Li #define TRANSITION_INT_STEPS ( TRANSITION_FRAMES / ( TRANSITION_INT_NUM - 1 ) ) 221*a58d3d2aSXin Li 222*a58d3d2aSXin Li /* BWE factors to apply after packet loss */ 223*a58d3d2aSXin Li #define BWE_AFTER_LOSS_Q16 63570 224*a58d3d2aSXin Li 225*a58d3d2aSXin Li /* Defines for CN generation */ 226*a58d3d2aSXin Li #define CNG_BUF_MASK_MAX 255 /* 2^floor(log2(MAX_FRAME_LENGTH))-1 */ 227*a58d3d2aSXin Li #define CNG_GAIN_SMTH_Q16 4634 /* 0.25^(1/4) */ 228*a58d3d2aSXin Li #define CNG_GAIN_SMTH_THRESHOLD_Q16 46396 /* -3 dB */ 229*a58d3d2aSXin Li #define CNG_NLSF_SMTH_Q16 16348 /* 0.25 */ 230*a58d3d2aSXin Li 231*a58d3d2aSXin Li #ifdef __cplusplus 232*a58d3d2aSXin Li } 233*a58d3d2aSXin Li #endif 234*a58d3d2aSXin Li 235*a58d3d2aSXin Li #endif 236