xref: /aosp_15_r20/external/libopus/silk/structs.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1 /***********************************************************************
2 Copyright (c) 2006-2011, Skype Limited. All rights reserved.
3 Redistribution and use in source and binary forms, with or without
4 modification, are permitted provided that the following conditions
5 are met:
6 - Redistributions of source code must retain the above copyright notice,
7 this list of conditions and the following disclaimer.
8 - Redistributions in binary form must reproduce the above copyright
9 notice, this list of conditions and the following disclaimer in the
10 documentation and/or other materials provided with the distribution.
11 - Neither the name of Internet Society, IETF or IETF Trust, nor the
12 names of specific contributors, may be used to endorse or promote
13 products derived from this software without specific prior written
14 permission.
15 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
19 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
20 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
21 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
22 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
24 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25 POSSIBILITY OF SUCH DAMAGE.
26 ***********************************************************************/
27 
28 #ifndef SILK_STRUCTS_H
29 #define SILK_STRUCTS_H
30 
31 #include "typedef.h"
32 #include "SigProc_FIX.h"
33 #include "define.h"
34 #include "entenc.h"
35 #include "entdec.h"
36 
37 #ifdef ENABLE_DEEP_PLC
38 #include "lpcnet.h"
39 #include "lpcnet_private.h"
40 #endif
41 
42 #ifdef ENABLE_DRED
43 #include "dred_encoder.h"
44 #include "dred_decoder.h"
45 #endif
46 
47 #ifdef ENABLE_OSCE
48 #include "osce_config.h"
49 #include "osce_structs.h"
50 #endif
51 
52 #ifdef __cplusplus
53 extern "C"
54 {
55 #endif
56 
57 /************************************/
58 /* Noise shaping quantization state */
59 /************************************/
60 typedef struct {                                                   /* Noise shaping quantizer (NSQ) state; held by the encoder state as member sNSQ */
61     opus_int16                  xq[           2 * MAX_FRAME_LENGTH ]; /* Buffer for quantized output signal                             */
62     opus_int32                  sLTP_shp_Q14[ 2 * MAX_FRAME_LENGTH ]; /* Same length as xq; NOTE(review): presumably shaped-signal history for long-term shaping - confirm */
63     opus_int32                  sLPC_Q14[ MAX_SUB_FRAME_LENGTH + NSQ_LPC_BUF_LENGTH ]; /* NOTE(review): presumably short-term (LPC) filter history, one subframe plus NSQ_LPC_BUF_LENGTH entries - confirm */
64     opus_int32                  sAR2_Q14[ MAX_SHAPE_LPC_ORDER ];      /* MAX_SHAPE_LPC_ORDER entries; NOTE(review): presumably noise-shaping AR filter state - confirm */
65     opus_int32                  sLF_AR_shp_Q14;                       /* NOTE(review): presumably low-frequency AR shaping state - confirm */
66     opus_int32                  sDiff_shp_Q14;                        /* NOTE(review): shaping-filter state; exact role not visible in this header - confirm */
67     opus_int                    lagPrev;                              /* NOTE(review): presumably the previous pitch lag - confirm */
68     opus_int                    sLTP_buf_idx;                         /* NOTE(review): presumably a position in an LTP buffer kept outside this struct - confirm */
69     opus_int                    sLTP_shp_buf_idx;                     /* NOTE(review): presumably a position in sLTP_shp_Q14 - confirm */
70     opus_int32                  rand_seed;                            /* NOTE(review): presumably the seed of a pseudo-random generator used by the quantizer - confirm */
71     opus_int32                  prev_gain_Q16;                        /* NOTE(review): presumably the gain applied to the previous subframe - confirm */
72     opus_int                    rewhite_flag;                         /* NOTE(review): flag; meaning not visible in this header - confirm */
73 } silk_nsq_state;
74 
75 /********************************/
76 /* VAD state                    */
77 /********************************/
78 typedef struct {                                             /* Held by the encoder state as member sVAD; per-band arrays are sized by VAD_N_BANDS */
79     opus_int32                  AnaState[ 2 ];                  /* Analysis filterbank state: 0-8 kHz                                   */
80     opus_int32                  AnaState1[ 2 ];                 /* Analysis filterbank state: 0-4 kHz                                   */
81     opus_int32                  AnaState2[ 2 ];                 /* Analysis filterbank state: 0-2 kHz                                   */
82     opus_int32                  XnrgSubfr[ VAD_N_BANDS ];       /* Subframe energies                                                    */
83     opus_int32                  NrgRatioSmth_Q8[ VAD_N_BANDS ]; /* Smoothed energy level in each band                                   */
84     opus_int16                  HPstate;                        /* State of differentiator in the lowest band                           */
85     opus_int32                  NL[ VAD_N_BANDS ];              /* Noise energy level in each band                                      */
86     opus_int32                  inv_NL[ VAD_N_BANDS ];          /* Inverse noise energy level in each band                              */
87     opus_int32                  NoiseLevelBias[ VAD_N_BANDS ];  /* Noise level estimator bias/offset                                    */
88     opus_int32                  counter;                        /* Frame counter used in the initial phase                              */
89 } silk_VAD_state;
90 
91 /* Variable cut-off low-pass filter state */
92 typedef struct {                                          /* Held by the encoder state as member sLP */
93     opus_int32                   In_LP_State[ 2 ];           /* Low pass filter state */
94     opus_int32                   transition_frame_no;        /* Counter which is mapped to a cut-off frequency */
95     opus_int                     mode;                       /* Operating mode: <0: switch down; >0: switch up; 0: do nothing           */
96     opus_int32                   saved_fs_kHz;               /* If non-zero, holds the last sampling rate before a bandwidth switching reset. */
97 } silk_LP_state;
98 
99 /* Structure containing NLSF codebook */
100 typedef struct {                                         /* Scalar members are const; pointer members reference read-only tables. Referenced via psNLSF_CB in the encoder and decoder state */
101     const opus_int16             nVectors;                   /* NOTE(review): presumably the number of first-stage codebook vectors - confirm */
102     const opus_int16             order;                      /* NOTE(review): presumably the NLSF/LPC order this codebook is built for - confirm */
103     const opus_int16             quantStepSize_Q16;          /* NOTE(review): presumably the residual quantizer step size - confirm */
104     const opus_int16             invQuantStepSize_Q6;        /* NOTE(review): judging by the name, the inverse of quantStepSize_Q16 - confirm */
105     const opus_uint8             *CB1_NLSF_Q8;               /* NOTE(review): presumably the first-stage codebook table - confirm */
106     const opus_int16             *CB1_Wght_Q9;               /* NOTE(review): presumably weights associated with the first-stage codebook - confirm */
107     const opus_uint8             *CB1_iCDF;                  /* NOTE(review): presumably the iCDF table used to entropy code the first-stage index - confirm */
108     const opus_uint8             *pred_Q8;                   /* NOTE(review): presumably prediction coefficients for the residual stage - confirm */
109     const opus_uint8             *ec_sel;                    /* NOTE(review): presumably selects which ec_iCDF / ec_Rates_Q5 entries apply - confirm */
110     const opus_uint8             *ec_iCDF;                   /* NOTE(review): presumably iCDF tables for entropy coding the residual indices - confirm */
111     const opus_uint8             *ec_Rates_Q5;               /* NOTE(review): presumably bit-rate cost tables matching ec_iCDF - confirm */
112     const opus_int16             *deltaMin_Q15;              /* NOTE(review): presumably minimum spacing constraints between NLSF values - confirm */
113 } silk_NLSF_CB_struct;
114 
115 typedef struct {                                         /* Encoder-side stereo state; its first three members match stereo_dec_state in name and type */
116     opus_int16                   pred_prev_Q13[ 2 ];         /* NOTE(review): presumably the two stereo predictor values from the previous frame - confirm */
117     opus_int16                   sMid[ 2 ];                  /* NOTE(review): presumably the last two mid-channel samples carried across frames - confirm */
118     opus_int16                   sSide[ 2 ];                 /* NOTE(review): presumably the last two side-channel samples carried across frames - confirm */
119     opus_int32                   mid_side_amp_Q0[ 4 ];       /* Four entries; NOTE(review): presumably smoothed mid/side amplitude estimates - confirm */
120     opus_int16                   smth_width_Q14;             /* NOTE(review): presumably the smoothed stereo width - confirm */
121     opus_int16                   width_prev_Q14;             /* NOTE(review): presumably the stereo width used for the previous frame - confirm */
122     opus_int16                   silent_side_len;            /* NOTE(review): presumably how long the side channel has been silent; units not visible here - confirm */
123     opus_int8                    predIx[ MAX_FRAMES_PER_PACKET ][ 2 ][ 3 ]; /* Per frame slot in a packet: a 2 x 3 set of indices; NOTE(review): presumably the quantized stereo predictor indices - confirm */
124     opus_int8                    mid_only_flags[ MAX_FRAMES_PER_PACKET ];   /* One flag per frame slot in a packet; NOTE(review): presumably set when only the mid channel is coded - confirm */
125 } stereo_enc_state;
126 
127 typedef struct {                                         /* Decoder-side stereo state; members match the first three members of stereo_enc_state in name and type */
128     opus_int16                   pred_prev_Q13[ 2 ];         /* NOTE(review): presumably the two stereo predictor values from the previous frame - confirm */
129     opus_int16                   sMid[ 2 ];                  /* NOTE(review): presumably the last two mid-channel samples carried across frames - confirm */
130     opus_int16                   sSide[ 2 ];                 /* NOTE(review): presumably the last two side-channel samples carried across frames - confirm */
131 } stereo_dec_state;
132 
133 typedef struct {                                         /* Set of quantization indices; used as member indices in the encoder and decoder state and as indices_LBRR[] in the encoder state */
134     opus_int8                    GainsIndices[ MAX_NB_SUBFR ];      /* One entry per subframe slot (MAX_NB_SUBFR) */
135     opus_int8                    LTPIndex[ MAX_NB_SUBFR ];          /* One entry per subframe slot (MAX_NB_SUBFR) */
136     opus_int8                    NLSFIndices[ MAX_LPC_ORDER + 1 ];  /* MAX_LPC_ORDER + 1 entries; NOTE(review): presumably one first-stage index followed by one index per coefficient - confirm */
137     opus_int16                   lagIndex;                   /* NOTE(review): presumably the pitch lag index - confirm */
138     opus_int8                    contourIndex;               /* NOTE(review): presumably the pitch contour index - confirm */
139     opus_int8                    signalType;                 /* NOTE(review): signal type code; valid values not visible in this header - confirm */
140     opus_int8                    quantOffsetType;            /* NOTE(review): quantization offset type code; valid values not visible in this header - confirm */
141     opus_int8                    NLSFInterpCoef_Q2;          /* NOTE(review): presumably the NLSF interpolation factor - confirm */
142     opus_int8                    PERIndex;                   /* NOTE(review): meaning not visible in this header - confirm */
143     opus_int8                    LTP_scaleIndex;             /* NOTE(review): presumably the index of the LTP scaling value - confirm */
144     opus_int8                    Seed;                       /* NOTE(review): presumably a seed value coded with the frame - confirm */
145 } SideInfoIndices;
146 
147 /********************************/
148 /* Encoder state                */
149 /********************************/
150 typedef struct {
151     opus_int32                   In_HP_State[ 2 ];                  /* High pass filter state                                           */
152     opus_int32                   variable_HP_smth1_Q15;             /* State of first smoother                                          */
153     opus_int32                   variable_HP_smth2_Q15;             /* State of second smoother                                         */
154     silk_LP_state                sLP;                               /* Low pass filter state                                            */
155     silk_VAD_state               sVAD;                              /* Voice activity detector state                                    */
156     silk_nsq_state               sNSQ;                              /* Noise Shape Quantizer State                                      */
157     opus_int16                   prev_NLSFq_Q15[ MAX_LPC_ORDER ];   /* Previously quantized NLSF vector                                 */
158     opus_int                     speech_activity_Q8;                /* Speech activity                                                  */
159     opus_int                     allow_bandwidth_switch;            /* Flag indicating that switching of internal bandwidth is allowed  */
160     opus_int8                    LBRRprevLastGainIndex;             /* NOTE(review): presumably the last gain index of the previous LBRR frame - confirm */
161     opus_int8                    prevSignalType;                    /* NOTE(review): presumably the signal type of the previous frame - confirm */
162     opus_int                     prevLag;                           /* NOTE(review): presumably the pitch lag of the previous frame - confirm */
163     opus_int                     pitch_LPC_win_length;              /* NOTE(review): presumably the window length of the LPC analysis used for pitch estimation - confirm */
164     opus_int                     max_pitch_lag;                     /* Highest possible pitch lag (samples)                             */
165     opus_int32                   API_fs_Hz;                         /* API sampling frequency (Hz)                                      */
166     opus_int32                   prev_API_fs_Hz;                    /* Previous API sampling frequency (Hz)                             */
167     opus_int                     maxInternal_fs_Hz;                 /* Maximum internal sampling frequency (Hz)                         */
168     opus_int                     minInternal_fs_Hz;                 /* Minimum internal sampling frequency (Hz)                         */
169     opus_int                     desiredInternal_fs_Hz;             /* Soft request for internal sampling frequency (Hz)                */
170     opus_int                     fs_kHz;                            /* Internal sampling frequency (kHz)                                */
171     opus_int                     nb_subfr;                          /* Number of 5 ms subframes in a frame                              */
172     opus_int                     frame_length;                      /* Frame length (samples)                                           */
173     opus_int                     subfr_length;                      /* Subframe length (samples)                                        */
174     opus_int                     ltp_mem_length;                    /* Length of LTP memory                                             */
175     opus_int                     la_pitch;                          /* Look-ahead for pitch analysis (samples)                          */
176     opus_int                     la_shape;                          /* Look-ahead for noise shape analysis (samples)                    */
177     opus_int                     shapeWinLength;                    /* Window length for noise shape analysis (samples)                 */
178     opus_int32                   TargetRate_bps;                    /* Target bitrate (bps)                                             */
179     opus_int                     PacketSize_ms;                     /* Number of milliseconds to put in each packet                     */
180     opus_int                     PacketLoss_perc;                   /* Packet loss rate measured by farend                              */
181     opus_int32                   frameCounter;                      /* NOTE(review): presumably a running count of processed frames - confirm */
182     opus_int                     Complexity;                        /* Complexity setting                                               */
183     opus_int                     nStatesDelayedDecision;            /* Number of states in delayed decision quantization                */
184     opus_int                     useInterpolatedNLSFs;              /* Flag for using NLSF interpolation                                */
185     opus_int                     shapingLPCOrder;                   /* Filter order for noise shaping filters                           */
186     opus_int                     predictLPCOrder;                   /* Filter order for prediction filters                              */
187     opus_int                     pitchEstimationComplexity;         /* Complexity level for pitch estimator                             */
188     opus_int                     pitchEstimationLPCOrder;           /* Whitening filter order for pitch estimator                       */
189     opus_int32                   pitchEstimationThreshold_Q16;      /* Threshold for pitch estimator                                    */
190     opus_int32                   sum_log_gain_Q7;                   /* Cumulative max prediction gain                                   */
191     opus_int                     NLSF_MSVQ_Survivors;               /* Number of survivors in NLSF MSVQ                                 */
192     opus_int                     first_frame_after_reset;           /* Flag for deactivating NLSF interpolation, pitch prediction       */
193     opus_int                     controlled_since_last_payload;     /* Flag for ensuring codec_control only runs once per packet        */
194     opus_int                     warping_Q16;                       /* Warping parameter for warped noise shaping                       */
195     opus_int                     useCBR;                            /* Flag to enable constant bitrate                                  */
196     opus_int                     prefillFlag;                       /* Flag to indicate that only buffers are prefilled, no coding      */
197     const opus_uint8             *pitch_lag_low_bits_iCDF;          /* Pointer to iCDF table for low bits of pitch lag index            */
198     const opus_uint8             *pitch_contour_iCDF;               /* Pointer to iCDF table for pitch contour index                    */
199     const silk_NLSF_CB_struct    *psNLSF_CB;                        /* Pointer to NLSF codebook                                         */
200     opus_int                     input_quality_bands_Q15[ VAD_N_BANDS ]; /* One entry per VAD band; NOTE(review): presumably an input quality measure produced by the VAD - confirm */
201     opus_int                     input_tilt_Q15;                    /* NOTE(review): presumably a spectral tilt measure of the input - confirm */
202     opus_int                     SNR_dB_Q7;                         /* Quality setting                                                  */
203
204     opus_int8                    VAD_flags[ MAX_FRAMES_PER_PACKET ]; /* One flag per frame slot in a packet */
205     opus_int8                    LBRR_flag;                         /* NOTE(review): presumably set when any entry of LBRR_flags is set - confirm */
206     opus_int                     LBRR_flags[ MAX_FRAMES_PER_PACKET ]; /* One flag per frame slot in a packet */
207
208     SideInfoIndices              indices;                           /* Quantization indices (see SideInfoIndices) */
209     opus_int8                    pulses[ MAX_FRAME_LENGTH ];        /* MAX_FRAME_LENGTH entries; NOTE(review): presumably one quantized excitation value per sample - confirm */
210
211     int                          arch;                              /* NOTE(review): presumably selects CPU-specific optimized routines - confirm */
212
213     /* Input/output buffering */
214     opus_int16                   inputBuf[ MAX_FRAME_LENGTH + 2 ];  /* Buffer containing input signal                                   */
215     opus_int                     inputBufIx;                        /* NOTE(review): presumably the current fill position in inputBuf - confirm */
216     opus_int                     nFramesPerPacket;                  /* NOTE(review): presumably the number of frames carried by each packet - confirm */
217     opus_int                     nFramesEncoded;                    /* Number of frames analyzed in current packet                      */
218
219     opus_int                     nChannelsAPI;                      /* NOTE(review): presumably the channel count at the API - confirm */
220     opus_int                     nChannelsInternal;                 /* NOTE(review): presumably the channel count coded internally - confirm */
221     opus_int                     channelNb;                         /* NOTE(review): presumably the index of the channel this state belongs to - confirm */
222
223     /* Parameters For LTP scaling Control */
224     opus_int                     frames_since_onset;                /* NOTE(review): presumably the number of frames since the last detected onset - confirm */
225
226     /* Specifically for entropy coding */
227     opus_int                     ec_prevSignalType;                 /* NOTE(review): presumably the signal type of the previously coded frame - confirm */
228     opus_int16                   ec_prevLagIndex;                   /* NOTE(review): presumably the lag index of the previously coded frame - confirm */
229
230     silk_resampler_state_struct resampler_state;                    /* Resampler state; type is declared outside this header */
231
232     /* DTX */
233     opus_int                     useDTX;                            /* Flag to enable DTX                                               */
234     opus_int                     inDTX;                             /* Flag to signal DTX period                                        */
235     opus_int                     noSpeechCounter;                   /* Counts consecutive nonactive frames, used by DTX                 */
236
237     /* Inband Low Bitrate Redundancy (LBRR) data */
238     opus_int                     useInBandFEC;                      /* Saves the API setting for query                                  */
239     opus_int                     LBRR_enabled;                      /* Depends on useInBandFEC, bitrate and packet loss rate            */
240     opus_int                     LBRR_GainIncreases;                /* Gains increment for coding LBRR frames                           */
241     SideInfoIndices              indices_LBRR[ MAX_FRAMES_PER_PACKET ];                    /* One SideInfoIndices per frame slot in a packet, for LBRR data */
242     opus_int8                    pulses_LBRR[ MAX_FRAMES_PER_PACKET ][ MAX_FRAME_LENGTH ]; /* One MAX_FRAME_LENGTH row per frame slot in a packet, for LBRR data */
243 } silk_encoder_state;
244 
245 
246 #ifdef ENABLE_OSCE
247 typedef struct {          /* Only compiled when ENABLE_OSCE is defined; held by the decoder state as member osce */
248     OSCEFeatureState features; /* Type declared outside this header; NOTE(review): presumably from osce_structs.h, included under the same guard - confirm */
249     OSCEState state;           /* Type declared outside this header; NOTE(review): presumably from osce_structs.h, included under the same guard - confirm */
250     int method;                /* NOTE(review): presumably selects which OSCE method is active; valid values not visible here - confirm */
251 } silk_OSCE_struct;
252 #endif
253 
254 /* Struct for Packet Loss Concealment */
255 typedef struct {                                                /* Packet loss concealment state; held by the decoder state as member sPLC */
256     opus_int32                  pitchL_Q8;                          /* Pitch lag to use for voiced concealment                          */
257     opus_int16                  LTPCoef_Q14[ LTP_ORDER ];           /* LTP coefficients to use for voiced concealment                   */
258     opus_int16                  prevLPC_Q12[ MAX_LPC_ORDER ];       /* NOTE(review): presumably the LPC coefficients of the last good frame - confirm */
259     opus_int                    last_frame_lost;                    /* Was previous frame lost                                          */
260     opus_int32                  rand_seed;                          /* Seed for unvoiced signal generation                              */
261     opus_int16                  randScale_Q14;                      /* Scaling of unvoiced random signal                                */
262     opus_int32                  conc_energy;                        /* NOTE(review): presumably the energy of the concealed signal - confirm */
263     opus_int                    conc_energy_shift;                  /* NOTE(review): presumably the scaling shift that goes with conc_energy - confirm */
264     opus_int16                  prevLTP_scale_Q14;                  /* NOTE(review): presumably the LTP scale of the last good frame - confirm */
265     opus_int32                  prevGain_Q16[ 2 ];                  /* Two entries; NOTE(review): presumably the last two subframe gains - confirm */
266     opus_int                    fs_kHz;                             /* NOTE(review): presumably the sampling rate (kHz) this state was set up for - confirm */
267     opus_int                    nb_subfr;                           /* NOTE(review): presumably the number of subframes per frame - confirm */
268     opus_int                    subfr_length;                       /* NOTE(review): presumably the subframe length in samples - confirm */
269     opus_int                    enable_deep_plc;                    /* NOTE(review): presumably a flag enabling the deep PLC path (cf. ENABLE_DEEP_PLC) - confirm */
270 } silk_PLC_struct;
271 
272 /* Struct for CNG */
273 typedef struct {                                                /* CNG state; held by the decoder state as member sCNG */
274     opus_int32                  CNG_exc_buf_Q14[ MAX_FRAME_LENGTH ];   /* MAX_FRAME_LENGTH entries; NOTE(review): presumably a buffer of excitation samples - confirm */
275     opus_int16                  CNG_smth_NLSF_Q15[ MAX_LPC_ORDER ];    /* NOTE(review): presumably smoothed NLSF values - confirm */
276     opus_int32                  CNG_synth_state[ MAX_LPC_ORDER ];      /* NOTE(review): presumably the synthesis filter state - confirm */
277     opus_int32                  CNG_smth_Gain_Q16;                  /* NOTE(review): presumably a smoothed gain - confirm */
278     opus_int32                  rand_seed;                          /* NOTE(review): presumably the seed of a pseudo-random generator - confirm */
279     opus_int                    fs_kHz;                             /* NOTE(review): presumably the sampling rate (kHz) this state was set up for - confirm */
280 } silk_CNG_struct;
281 
282 /********************************/
283 /* Decoder state                */
284 /********************************/
285 typedef struct {
286 #ifdef ENABLE_OSCE
287     silk_OSCE_struct            osce;                               /* Only present when ENABLE_OSCE is defined; placed ahead of the member named by SILK_DECODER_STATE_RESET_START */
288 #endif
289 #define SILK_DECODER_STATE_RESET_START prev_gain_Q16
290     opus_int32                  prev_gain_Q16;                      /* SILK_DECODER_STATE_RESET_START expands to this member's name. NOTE(review): presumably reset code clears the state from here onward and leaves osce untouched - confirm */
291     opus_int32                  exc_Q14[ MAX_FRAME_LENGTH ];        /* MAX_FRAME_LENGTH entries; NOTE(review): presumably the excitation signal of the current frame - confirm */
292     opus_int32                  sLPC_Q14_buf[ MAX_LPC_ORDER ];      /* NOTE(review): presumably LPC synthesis filter history - confirm */
293     opus_int16                  outBuf[ MAX_FRAME_LENGTH + 2 * MAX_SUB_FRAME_LENGTH ];  /* Buffer for output signal                     */
294     opus_int                    lagPrev;                            /* Previous Lag                                                     */
295     opus_int8                   LastGainIndex;                      /* Previous gain index                                              */
296     opus_int                    fs_kHz;                             /* Sampling frequency in kHz                                        */
297     opus_int32                  fs_API_hz;                          /* API sample frequency (Hz)                                        */
298     opus_int                    nb_subfr;                           /* Number of 5 ms subframes in a frame                              */
299     opus_int                    frame_length;                       /* Frame length (samples)                                           */
300     opus_int                    subfr_length;                       /* Subframe length (samples)                                        */
301     opus_int                    ltp_mem_length;                     /* Length of LTP memory                                             */
302     opus_int                    LPC_order;                          /* LPC order                                                        */
303     opus_int16                  prevNLSF_Q15[ MAX_LPC_ORDER ];      /* Used to interpolate LSFs                                         */
304     opus_int                    first_frame_after_reset;            /* Flag for deactivating NLSF interpolation                         */
305     const opus_uint8            *pitch_lag_low_bits_iCDF;           /* Pointer to iCDF table for low bits of pitch lag index            */
306     const opus_uint8            *pitch_contour_iCDF;                /* Pointer to iCDF table for pitch contour index                    */
307
308     /* For buffering payload in case of more frames per packet */
309     opus_int                    nFramesDecoded;                     /* NOTE(review): presumably the number of frames decoded so far in the current packet - confirm */
310     opus_int                    nFramesPerPacket;                   /* NOTE(review): presumably the number of frames carried by the current packet - confirm */
311
312     /* Specifically for entropy coding */
313     opus_int                    ec_prevSignalType;                  /* NOTE(review): presumably the signal type of the previously decoded frame - confirm */
314     opus_int16                  ec_prevLagIndex;                    /* NOTE(review): presumably the lag index of the previously decoded frame - confirm */
315
316     opus_int                    VAD_flags[ MAX_FRAMES_PER_PACKET ]; /* One flag per frame slot in a packet */
317     opus_int                    LBRR_flag;                          /* NOTE(review): presumably set when the packet carries LBRR data - confirm */
318     opus_int                    LBRR_flags[ MAX_FRAMES_PER_PACKET ]; /* One flag per frame slot in a packet */
319
320     silk_resampler_state_struct resampler_state;                    /* Resampler state; type is declared outside this header */
321
322     const silk_NLSF_CB_struct   *psNLSF_CB;                         /* Pointer to NLSF codebook                                         */
323
324     /* Quantization indices */
325     SideInfoIndices             indices;
326
327     /* CNG state */
328     silk_CNG_struct             sCNG;
329
330     /* Stuff used for PLC */
331     opus_int                    lossCnt;                            /* NOTE(review): presumably counts consecutive lost frames - confirm */
332     opus_int                    prevSignalType;                     /* NOTE(review): presumably the signal type of the previous frame - confirm */
333     int                         arch;                               /* NOTE(review): presumably selects CPU-specific optimized routines - confirm */
334
335     silk_PLC_struct sPLC;                                           /* Packet loss concealment state */
336
337 } silk_decoder_state;
338 
339 /************************/
340 /* Decoder control      */
341 /************************/
342 typedef struct {
343     /* Prediction and coding parameters */
344     opus_int                    pitchL[ MAX_NB_SUBFR ];             /* One entry per subframe slot; NOTE(review): presumably the pitch lag of each subframe - confirm */
345     opus_int32                  Gains_Q16[ MAX_NB_SUBFR ];          /* One entry per subframe slot; NOTE(review): presumably the gain of each subframe - confirm */
346     /* Holds interpolated and final coefficients, 4-byte aligned */
347     silk_DWORD_ALIGN opus_int16 PredCoef_Q12[ 2 ][ MAX_LPC_ORDER ]; /* Two coefficient sets of MAX_LPC_ORDER entries each */
348     opus_int16                  LTPCoef_Q14[ LTP_ORDER * MAX_NB_SUBFR ]; /* LTP_ORDER entries for each of the MAX_NB_SUBFR subframe slots */
349     opus_int                    LTP_scale_Q14;                      /* NOTE(review): presumably the LTP scaling factor for the frame - confirm */
350 } silk_decoder_control;
351 
352 
353 #ifdef __cplusplus
354 }
355 #endif
356 
357 #endif
358