xref: /aosp_15_r20/external/libopus/src/analysis.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /* Copyright (c) 2011 Xiph.Org Foundation
2*a58d3d2aSXin Li    Written by Jean-Marc Valin */
3*a58d3d2aSXin Li /*
4*a58d3d2aSXin Li    Redistribution and use in source and binary forms, with or without
5*a58d3d2aSXin Li    modification, are permitted provided that the following conditions
6*a58d3d2aSXin Li    are met:
7*a58d3d2aSXin Li 
8*a58d3d2aSXin Li    - Redistributions of source code must retain the above copyright
9*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer.
10*a58d3d2aSXin Li 
11*a58d3d2aSXin Li    - Redistributions in binary form must reproduce the above copyright
12*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer in the
13*a58d3d2aSXin Li    documentation and/or other materials provided with the distribution.
14*a58d3d2aSXin Li 
15*a58d3d2aSXin Li    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16*a58d3d2aSXin Li    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17*a58d3d2aSXin Li    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
18*a58d3d2aSXin Li    A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR
19*a58d3d2aSXin Li    CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20*a58d3d2aSXin Li    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21*a58d3d2aSXin Li    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22*a58d3d2aSXin Li    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
23*a58d3d2aSXin Li    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
24*a58d3d2aSXin Li    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*a58d3d2aSXin Li    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*a58d3d2aSXin Li */
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li #ifndef ANALYSIS_H
29*a58d3d2aSXin Li #define ANALYSIS_H
30*a58d3d2aSXin Li 
31*a58d3d2aSXin Li #include "celt.h"
32*a58d3d2aSXin Li #include "opus_private.h"
33*a58d3d2aSXin Li #include "mlp.h"
34*a58d3d2aSXin Li 
/* First dimension of the E and logE arrays in TonalityAnalysisState. */
35*a58d3d2aSXin Li #define NB_FRAMES 8
/* Length of the per-band arrays in TonalityAnalysisState
   (prev_band_tonality, lowE, highE, and the second dimension of E/logE). */
36*a58d3d2aSXin Li #define NB_TBANDS 18
/* Number of elements in the inmem buffer of TonalityAnalysisState. */
37*a58d3d2aSXin Li #define ANALYSIS_BUF_SIZE 720 /* 30 ms at 24 kHz */
38*a58d3d2aSXin Li 
39*a58d3d2aSXin Li /* At that point we can stop counting frames because it no longer matters. */
/* NOTE(review): presumably the cap applied to TonalityAnalysisState.count;
   the user of this constant is not visible in this header -- confirm. */
40*a58d3d2aSXin Li #define ANALYSIS_COUNT_MAX 10000
41*a58d3d2aSXin Li 
/* Number of AnalysisInfo entries held in TonalityAnalysisState.info[]. */
42*a58d3d2aSXin Li #define DETECT_SIZE 100
43*a58d3d2aSXin Li 
44*a58d3d2aSXin Li /* Uncomment this to print the MLP features on stdout. */
45*a58d3d2aSXin Li /*#define MLP_TRAINING*/
46*a58d3d2aSXin Li 
/* State carried by the tonality analysis functions declared in this header
   (tonality_analysis_init/reset, tonality_get_info, run_analysis).
   All storage is inline fixed-size arrays; the struct holds no pointers.
   Do not reorder members without checking users of
   TONALITY_ANALYSIS_RESET_START (see below). */
47*a58d3d2aSXin Li typedef struct {
   /* NOTE(review): arch/application/Fs precede the reset-start marker, so they
      are presumably configuration that survives a reset -- confirm.
      Fs is presumably the sampling rate in Hz -- confirm. */
48*a58d3d2aSXin Li    int arch;
49*a58d3d2aSXin Li    int application;
50*a58d3d2aSXin Li    opus_int32 Fs;
   /* Names the first member of the resettable region.
      NOTE(review): presumably tonality_analysis_reset() clears from this
      member to the end of the struct -- confirm against the implementation. */
51*a58d3d2aSXin Li #define TONALITY_ANALYSIS_RESET_START angle
   /* Three parallel 240-element float arrays.
      NOTE(review): presumably per-bin phase and its first/second differences
      -- confirm. */
52*a58d3d2aSXin Li    float angle[240];
53*a58d3d2aSXin Li    float d_angle[240];
54*a58d3d2aSXin Li    float d2_angle[240];
   /* Sample buffer of ANALYSIS_BUF_SIZE elements. */
55*a58d3d2aSXin Li    opus_val32 inmem[ANALYSIS_BUF_SIZE];
56*a58d3d2aSXin Li    int   mem_fill;                      /* number of usable samples in the buffer */
   /* One value per band (NB_TBANDS). */
57*a58d3d2aSXin Li    float prev_band_tonality[NB_TBANDS];
58*a58d3d2aSXin Li    float prev_tonality;
59*a58d3d2aSXin Li    int prev_bandwidth;
   /* NB_FRAMES x NB_TBANDS tables.
      NOTE(review): presumably a history of band energies and their logs,
      indexed [frame][band] -- confirm. */
60*a58d3d2aSXin Li    float E[NB_FRAMES][NB_TBANDS];
61*a58d3d2aSXin Li    float logE[NB_FRAMES][NB_TBANDS];
   /* Per-band arrays; note meanE has one more element than the others. */
62*a58d3d2aSXin Li    float lowE[NB_TBANDS];
63*a58d3d2aSXin Li    float highE[NB_TBANDS];
64*a58d3d2aSXin Li    float meanE[NB_TBANDS+1];
65*a58d3d2aSXin Li    float mem[32];
66*a58d3d2aSXin Li    float cmean[8];
67*a58d3d2aSXin Li    float std[9];
68*a58d3d2aSXin Li    float Etracker;
69*a58d3d2aSXin Li    float lowECount;
70*a58d3d2aSXin Li    int E_count;
   /* NOTE(review): presumably the frame counter that ANALYSIS_COUNT_MAX
      refers to -- confirm. */
71*a58d3d2aSXin Li    int count;
72*a58d3d2aSXin Li    int analysis_offset;
   /* NOTE(review): write_pos/read_pos/read_subframe presumably index into
      info[] below -- confirm. */
73*a58d3d2aSXin Li    int write_pos;
74*a58d3d2aSXin Li    int read_pos;
75*a58d3d2aSXin Li    int read_subframe;
76*a58d3d2aSXin Li    float hp_ener_accum;
77*a58d3d2aSXin Li    int initialized;
   /* MAX_NEURONS is not defined in this header (presumably from mlp.h). */
78*a58d3d2aSXin Li    float rnn_state[MAX_NEURONS];
79*a58d3d2aSXin Li    opus_val32 downmix_state[3];
   /* DETECT_SIZE stored AnalysisInfo records. */
80*a58d3d2aSXin Li    AnalysisInfo info[DETECT_SIZE];
81*a58d3d2aSXin Li } TonalityAnalysisState;
82*a58d3d2aSXin Li 
83*a58d3d2aSXin Li /** Initialize a TonalityAnalysisState struct.
84*a58d3d2aSXin Li  *
85*a58d3d2aSXin Li  * This performs some possibly slow initialization steps which should
86*a58d3d2aSXin Li  * not be repeated every analysis step. No allocated memory is retained
87*a58d3d2aSXin Li  * by the state struct, so no cleanup call is required.
 *
 * @param analysis  State struct to initialize.
 * @param Fs        NOTE(review): presumably the sampling rate in Hz, stored
 *                  in the struct's Fs member -- confirm in the implementation.
88*a58d3d2aSXin Li  */
89*a58d3d2aSXin Li void tonality_analysis_init(TonalityAnalysisState *analysis, opus_int32 Fs);
90*a58d3d2aSXin Li 
91*a58d3d2aSXin Li /** Reset a TonalityAnalysisState struct.
92*a58d3d2aSXin Li  *
93*a58d3d2aSXin Li  * Call this when there's a discontinuity in the data.
 *
 * NOTE(review): the region affected presumably starts at the member named by
 * TONALITY_ANALYSIS_RESET_START -- confirm in the implementation.
 *
 * @param analysis  State struct to reset.
94*a58d3d2aSXin Li  */
95*a58d3d2aSXin Li void tonality_analysis_reset(TonalityAnalysisState *analysis);
96*a58d3d2aSXin Li 
/** Fetch analysis results from a TonalityAnalysisState.
 *
 * The state pointer is non-const, so the call may update the state.
 *
 * @param tonal     Analysis state to read from.
 * @param info_out  Receives the result.
 * @param len       NOTE(review): meaning not visible in this header;
 *                  presumably the length in samples of the frame being
 *                  queried -- confirm in the implementation.
 */
97*a58d3d2aSXin Li void tonality_get_info(TonalityAnalysisState *tonal, AnalysisInfo *info_out, int len);
98*a58d3d2aSXin Li 
/** Run the tonality analysis on a block of input and report the result.
 *
 * NOTE(review): the parameter descriptions below are inferred from names and
 * types only; the implementation is not visible in this header -- confirm.
 *
 * @param analysis             Analysis state, updated by the call.
 * @param celt_mode            CELT mode descriptor.
 * @param analysis_pcm         Untyped input audio; presumably interpreted by
 *                             the downmix callback.
 * @param analysis_frame_size  Presumably the number of samples available for
 *                             analysis.
 * @param frame_size           Presumably the size of the frame being encoded.
 * @param c1, c2, C            Presumably channel selectors and channel count
 *                             passed through to downmix.
 * @param Fs                   Presumably the sampling rate in Hz.
 * @param lsb_depth            Presumably the bit depth of the input signal.
 * @param downmix              Callback of type downmix_func.
 * @param analysis_info        Receives the analysis result.
 */
99*a58d3d2aSXin Li void run_analysis(TonalityAnalysisState *analysis, const CELTMode *celt_mode, const void *analysis_pcm,
100*a58d3d2aSXin Li                  int analysis_frame_size, int frame_size, int c1, int c2, int C, opus_int32 Fs,
101*a58d3d2aSXin Li                  int lsb_depth, downmix_func downmix, AnalysisInfo *analysis_info);
102*a58d3d2aSXin Li 
103*a58d3d2aSXin Li #endif
104