xref: /aosp_15_r20/external/libopus/silk/define.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /***********************************************************************
2*a58d3d2aSXin Li Copyright (c) 2006-2011, Skype Limited. All rights reserved.
3*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without
4*a58d3d2aSXin Li modification, are permitted provided that the following conditions
5*a58d3d2aSXin Li are met:
6*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright notice,
7*a58d3d2aSXin Li this list of conditions and the following disclaimer.
8*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright
9*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the
10*a58d3d2aSXin Li documentation and/or other materials provided with the distribution.
11*a58d3d2aSXin Li - Neither the name of Internet Society, IETF or IETF Trust, nor the
12*a58d3d2aSXin Li names of specific contributors, may be used to endorse or promote
13*a58d3d2aSXin Li products derived from this software without specific prior written
14*a58d3d2aSXin Li permission.
15*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16*a58d3d2aSXin Li AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17*a58d3d2aSXin Li IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18*a58d3d2aSXin Li ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
19*a58d3d2aSXin Li LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
20*a58d3d2aSXin Li CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
21*a58d3d2aSXin Li SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
22*a58d3d2aSXin Li INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23*a58d3d2aSXin Li CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
24*a58d3d2aSXin Li ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25*a58d3d2aSXin Li POSSIBILITY OF SUCH DAMAGE.
26*a58d3d2aSXin Li ***********************************************************************/
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li #ifndef SILK_DEFINE_H
29*a58d3d2aSXin Li #define SILK_DEFINE_H
30*a58d3d2aSXin Li 
31*a58d3d2aSXin Li #include "errors.h"
32*a58d3d2aSXin Li #include "typedef.h"
33*a58d3d2aSXin Li 
34*a58d3d2aSXin Li #ifdef __cplusplus
35*a58d3d2aSXin Li extern "C"
36*a58d3d2aSXin Li {
37*a58d3d2aSXin Li #endif
38*a58d3d2aSXin Li 
39*a58d3d2aSXin Li /* Max number of encoder channels (1/2) */
40*a58d3d2aSXin Li #define ENCODER_NUM_CHANNELS                    2
41*a58d3d2aSXin Li /* Number of decoder channels (1/2) */
42*a58d3d2aSXin Li #define DECODER_NUM_CHANNELS                    2
43*a58d3d2aSXin Li 
44*a58d3d2aSXin Li #define MAX_FRAMES_PER_PACKET                   3
45*a58d3d2aSXin Li 
46*a58d3d2aSXin Li /* Limits on bitrate */
47*a58d3d2aSXin Li #define MIN_TARGET_RATE_BPS                     5000
48*a58d3d2aSXin Li #define MAX_TARGET_RATE_BPS                     80000
49*a58d3d2aSXin Li 
50*a58d3d2aSXin Li /* LBRR thresholds */
51*a58d3d2aSXin Li #define LBRR_NB_MIN_RATE_BPS                    12000
52*a58d3d2aSXin Li #define LBRR_MB_MIN_RATE_BPS                    14000
53*a58d3d2aSXin Li #define LBRR_WB_MIN_RATE_BPS                    16000
54*a58d3d2aSXin Li 
55*a58d3d2aSXin Li /* DTX settings */
56*a58d3d2aSXin Li #define NB_SPEECH_FRAMES_BEFORE_DTX             10      /* eq 200 ms */
57*a58d3d2aSXin Li #define MAX_CONSECUTIVE_DTX                     20      /* eq 400 ms */
58*a58d3d2aSXin Li #define DTX_ACTIVITY_THRESHOLD                  0.1f
59*a58d3d2aSXin Li 
60*a58d3d2aSXin Li /* VAD decision */
61*a58d3d2aSXin Li #define VAD_NO_DECISION                         -1
62*a58d3d2aSXin Li #define VAD_NO_ACTIVITY                         0
63*a58d3d2aSXin Li #define VAD_ACTIVITY                            1
64*a58d3d2aSXin Li 
65*a58d3d2aSXin Li /* Maximum sampling frequency */
66*a58d3d2aSXin Li #define MAX_FS_KHZ                              16
67*a58d3d2aSXin Li #define MAX_API_FS_KHZ                          48
68*a58d3d2aSXin Li 
69*a58d3d2aSXin Li /* Signal types */
70*a58d3d2aSXin Li #define TYPE_NO_VOICE_ACTIVITY                  0
71*a58d3d2aSXin Li #define TYPE_UNVOICED                           1
72*a58d3d2aSXin Li #define TYPE_VOICED                             2
73*a58d3d2aSXin Li 
74*a58d3d2aSXin Li /* Conditional coding types */
75*a58d3d2aSXin Li #define CODE_INDEPENDENTLY                      0
76*a58d3d2aSXin Li #define CODE_INDEPENDENTLY_NO_LTP_SCALING       1
77*a58d3d2aSXin Li #define CODE_CONDITIONALLY                      2
78*a58d3d2aSXin Li 
79*a58d3d2aSXin Li /* Settings for stereo processing */
80*a58d3d2aSXin Li #define STEREO_QUANT_TAB_SIZE                   16
81*a58d3d2aSXin Li #define STEREO_QUANT_SUB_STEPS                  5
82*a58d3d2aSXin Li #define STEREO_INTERP_LEN_MS                    8       /* must be even */
83*a58d3d2aSXin Li #define STEREO_RATIO_SMOOTH_COEF                0.01    /* smoothing coef for signal norms and stereo width */
84*a58d3d2aSXin Li 
85*a58d3d2aSXin Li /* Range of pitch lag estimates */
86*a58d3d2aSXin Li #define PITCH_EST_MIN_LAG_MS                    2       /* 2 ms -> 500 Hz */
87*a58d3d2aSXin Li #define PITCH_EST_MAX_LAG_MS                    18      /* 18 ms -> 56 Hz */
88*a58d3d2aSXin Li 
89*a58d3d2aSXin Li /* Maximum number of subframes */
90*a58d3d2aSXin Li #define MAX_NB_SUBFR                            4
91*a58d3d2aSXin Li 
92*a58d3d2aSXin Li /* Number of samples per frame */
93*a58d3d2aSXin Li #define LTP_MEM_LENGTH_MS                       20
94*a58d3d2aSXin Li #define SUB_FRAME_LENGTH_MS                     5
95*a58d3d2aSXin Li #define MAX_SUB_FRAME_LENGTH                    ( SUB_FRAME_LENGTH_MS * MAX_FS_KHZ )
96*a58d3d2aSXin Li #define MAX_FRAME_LENGTH_MS                     ( SUB_FRAME_LENGTH_MS * MAX_NB_SUBFR )
97*a58d3d2aSXin Li #define MAX_FRAME_LENGTH                        ( MAX_FRAME_LENGTH_MS * MAX_FS_KHZ )
98*a58d3d2aSXin Li 
99*a58d3d2aSXin Li /* Milliseconds of lookahead for pitch analysis */
100*a58d3d2aSXin Li #define LA_PITCH_MS                             2
101*a58d3d2aSXin Li #define LA_PITCH_MAX                            ( LA_PITCH_MS * MAX_FS_KHZ )
102*a58d3d2aSXin Li 
103*a58d3d2aSXin Li /* Order of LPC used in find pitch */
104*a58d3d2aSXin Li #define MAX_FIND_PITCH_LPC_ORDER                16
105*a58d3d2aSXin Li 
106*a58d3d2aSXin Li /* Length of LPC window used in find pitch */
107*a58d3d2aSXin Li #define FIND_PITCH_LPC_WIN_MS                   ( 20 + (LA_PITCH_MS << 1) )
108*a58d3d2aSXin Li #define FIND_PITCH_LPC_WIN_MS_2_SF              ( 10 + (LA_PITCH_MS << 1) )
109*a58d3d2aSXin Li #define FIND_PITCH_LPC_WIN_MAX                  ( FIND_PITCH_LPC_WIN_MS * MAX_FS_KHZ )
110*a58d3d2aSXin Li 
111*a58d3d2aSXin Li /* Milliseconds of lookahead for noise shape analysis */
112*a58d3d2aSXin Li #define LA_SHAPE_MS                             5
113*a58d3d2aSXin Li #define LA_SHAPE_MAX                            ( LA_SHAPE_MS * MAX_FS_KHZ )
114*a58d3d2aSXin Li 
115*a58d3d2aSXin Li /* Maximum length of LPC window used in noise shape analysis */
116*a58d3d2aSXin Li #define SHAPE_LPC_WIN_MAX                       ( 15 * MAX_FS_KHZ )
117*a58d3d2aSXin Li 
118*a58d3d2aSXin Li /* dB level of lowest gain quantization level */
119*a58d3d2aSXin Li #define MIN_QGAIN_DB                            2
120*a58d3d2aSXin Li /* dB level of highest gain quantization level */
121*a58d3d2aSXin Li #define MAX_QGAIN_DB                            88
122*a58d3d2aSXin Li /* Number of gain quantization levels */
123*a58d3d2aSXin Li #define N_LEVELS_QGAIN                          64
124*a58d3d2aSXin Li /* Max increase in gain quantization index */
125*a58d3d2aSXin Li #define MAX_DELTA_GAIN_QUANT                    36
126*a58d3d2aSXin Li /* Max decrease in gain quantization index */
127*a58d3d2aSXin Li #define MIN_DELTA_GAIN_QUANT                    -4
128*a58d3d2aSXin Li 
129*a58d3d2aSXin Li /* Quantization offsets (multiples of 4) */
130*a58d3d2aSXin Li #define OFFSET_VL_Q10                           32
131*a58d3d2aSXin Li #define OFFSET_VH_Q10                           100
132*a58d3d2aSXin Li #define OFFSET_UVL_Q10                          100
133*a58d3d2aSXin Li #define OFFSET_UVH_Q10                          240
134*a58d3d2aSXin Li 
135*a58d3d2aSXin Li #define QUANT_LEVEL_ADJUST_Q10                  80
136*a58d3d2aSXin Li 
137*a58d3d2aSXin Li /* Maximum numbers of iterations used to stabilize an LPC vector */
138*a58d3d2aSXin Li #define MAX_LPC_STABILIZE_ITERATIONS            16
139*a58d3d2aSXin Li #define MAX_PREDICTION_POWER_GAIN               1e4f
140*a58d3d2aSXin Li #define MAX_PREDICTION_POWER_GAIN_AFTER_RESET   1e2f
141*a58d3d2aSXin Li 
142*a58d3d2aSXin Li #define MAX_LPC_ORDER                           16
143*a58d3d2aSXin Li #define MIN_LPC_ORDER                           10
144*a58d3d2aSXin Li 
145*a58d3d2aSXin Li /* Find Pred Coef defines */
146*a58d3d2aSXin Li #define LTP_ORDER                               5
147*a58d3d2aSXin Li 
148*a58d3d2aSXin Li /* LTP quantization settings */
149*a58d3d2aSXin Li #define NB_LTP_CBKS                             3
150*a58d3d2aSXin Li 
151*a58d3d2aSXin Li /* Flag to use harmonic noise shaping */
152*a58d3d2aSXin Li #define USE_HARM_SHAPING                        1
153*a58d3d2aSXin Li 
154*a58d3d2aSXin Li /* Max LPC order of noise shaping filters */
155*a58d3d2aSXin Li #define MAX_SHAPE_LPC_ORDER                     24
156*a58d3d2aSXin Li 
157*a58d3d2aSXin Li #define HARM_SHAPE_FIR_TAPS                     3
158*a58d3d2aSXin Li 
159*a58d3d2aSXin Li /* Maximum number of delayed decision states */
160*a58d3d2aSXin Li #define MAX_DEL_DEC_STATES                      4
161*a58d3d2aSXin Li 
162*a58d3d2aSXin Li #define LTP_BUF_LENGTH                          512
163*a58d3d2aSXin Li #define LTP_MASK                                ( LTP_BUF_LENGTH - 1 )
164*a58d3d2aSXin Li 
165*a58d3d2aSXin Li #define DECISION_DELAY                          40
166*a58d3d2aSXin Li 
167*a58d3d2aSXin Li /* Number of subframes for excitation entropy coding */
168*a58d3d2aSXin Li #define SHELL_CODEC_FRAME_LENGTH                16
169*a58d3d2aSXin Li #define LOG2_SHELL_CODEC_FRAME_LENGTH           4
170*a58d3d2aSXin Li #define MAX_NB_SHELL_BLOCKS                     ( MAX_FRAME_LENGTH / SHELL_CODEC_FRAME_LENGTH )
171*a58d3d2aSXin Li 
172*a58d3d2aSXin Li /* Number of rate levels, for entropy coding of excitation */
173*a58d3d2aSXin Li #define N_RATE_LEVELS                           10
174*a58d3d2aSXin Li 
175*a58d3d2aSXin Li /* Maximum sum of pulses per shell coding frame */
176*a58d3d2aSXin Li #define SILK_MAX_PULSES                         16
177*a58d3d2aSXin Li 
178*a58d3d2aSXin Li #define MAX_MATRIX_SIZE                         MAX_LPC_ORDER /* Max of LPC Order and LTP order */
179*a58d3d2aSXin Li 
180*a58d3d2aSXin Li # define NSQ_LPC_BUF_LENGTH                     MAX_LPC_ORDER
181*a58d3d2aSXin Li 
182*a58d3d2aSXin Li /***************************/
183*a58d3d2aSXin Li /* Voice activity detector */
184*a58d3d2aSXin Li /***************************/
185*a58d3d2aSXin Li #define VAD_N_BANDS                             4
186*a58d3d2aSXin Li 
187*a58d3d2aSXin Li #define VAD_INTERNAL_SUBFRAMES_LOG2             2
188*a58d3d2aSXin Li #define VAD_INTERNAL_SUBFRAMES                  ( 1 << VAD_INTERNAL_SUBFRAMES_LOG2 )
189*a58d3d2aSXin Li 
190*a58d3d2aSXin Li #define VAD_NOISE_LEVEL_SMOOTH_COEF_Q16         1024    /* Must be <  4096 */
191*a58d3d2aSXin Li #define VAD_NOISE_LEVELS_BIAS                   50
192*a58d3d2aSXin Li 
193*a58d3d2aSXin Li /* Sigmoid settings */
194*a58d3d2aSXin Li #define VAD_NEGATIVE_OFFSET_Q5                  128     /* sigmoid is 0 at -128 */
195*a58d3d2aSXin Li #define VAD_SNR_FACTOR_Q16                      45000
196*a58d3d2aSXin Li 
197*a58d3d2aSXin Li /* smoothing for SNR measurement */
198*a58d3d2aSXin Li #define VAD_SNR_SMOOTH_COEF_Q18                 4096
199*a58d3d2aSXin Li 
200*a58d3d2aSXin Li /* Size of the piecewise linear cosine approximation table for the LSFs */
201*a58d3d2aSXin Li #define LSF_COS_TAB_SZ_FIX                      128
202*a58d3d2aSXin Li 
203*a58d3d2aSXin Li /******************/
204*a58d3d2aSXin Li /* NLSF quantizer */
205*a58d3d2aSXin Li /******************/
206*a58d3d2aSXin Li #define NLSF_W_Q                                2
207*a58d3d2aSXin Li #define NLSF_VQ_MAX_VECTORS                     32
208*a58d3d2aSXin Li #define NLSF_QUANT_MAX_AMPLITUDE                4
209*a58d3d2aSXin Li #define NLSF_QUANT_MAX_AMPLITUDE_EXT            10
210*a58d3d2aSXin Li #define NLSF_QUANT_LEVEL_ADJ                    0.1
211*a58d3d2aSXin Li #define NLSF_QUANT_DEL_DEC_STATES_LOG2          2
212*a58d3d2aSXin Li #define NLSF_QUANT_DEL_DEC_STATES               ( 1 << NLSF_QUANT_DEL_DEC_STATES_LOG2 )
213*a58d3d2aSXin Li 
214*a58d3d2aSXin Li /* Transition filtering for mode switching */
215*a58d3d2aSXin Li #define TRANSITION_TIME_MS                      5120    /* 5120 = 64 * FRAME_LENGTH_MS * ( TRANSITION_INT_NUM - 1 ) = 64*(20*4)*/
216*a58d3d2aSXin Li #define TRANSITION_NB                           3       /* Hardcoded in tables */
217*a58d3d2aSXin Li #define TRANSITION_NA                           2       /* Hardcoded in tables */
218*a58d3d2aSXin Li #define TRANSITION_INT_NUM                      5       /* Hardcoded in tables */
219*a58d3d2aSXin Li #define TRANSITION_FRAMES                       ( TRANSITION_TIME_MS / MAX_FRAME_LENGTH_MS )
220*a58d3d2aSXin Li #define TRANSITION_INT_STEPS                    ( TRANSITION_FRAMES  / ( TRANSITION_INT_NUM - 1 ) )
221*a58d3d2aSXin Li 
222*a58d3d2aSXin Li /* BWE factors to apply after packet loss */
223*a58d3d2aSXin Li #define BWE_AFTER_LOSS_Q16                      63570
224*a58d3d2aSXin Li 
225*a58d3d2aSXin Li /* Defines for CN generation */
226*a58d3d2aSXin Li #define CNG_BUF_MASK_MAX                        255     /* 2^floor(log2(MAX_FRAME_LENGTH))-1    */
227*a58d3d2aSXin Li #define CNG_GAIN_SMTH_Q16                       4634    /* 0.25^(1/4)                           */
228*a58d3d2aSXin Li #define CNG_GAIN_SMTH_THRESHOLD_Q16             46396   /* -3 dB                                */
229*a58d3d2aSXin Li #define CNG_NLSF_SMTH_Q16                       16348   /* 0.25                                 */
230*a58d3d2aSXin Li 
231*a58d3d2aSXin Li #ifdef __cplusplus
232*a58d3d2aSXin Li }
233*a58d3d2aSXin Li #endif
234*a58d3d2aSXin Li 
235*a58d3d2aSXin Li #endif
236