1*a58d3d2aSXin Li /* Copyright (c) 2011 Xiph.Org Foundation 2*a58d3d2aSXin Li Written by Jean-Marc Valin */ 3*a58d3d2aSXin Li /* 4*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without 5*a58d3d2aSXin Li modification, are permitted provided that the following conditions 6*a58d3d2aSXin Li are met: 7*a58d3d2aSXin Li 8*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright 9*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer. 10*a58d3d2aSXin Li 11*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright 12*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the 13*a58d3d2aSXin Li documentation and/or other materials provided with the distribution. 14*a58d3d2aSXin Li 15*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 16*a58d3d2aSXin Li ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 17*a58d3d2aSXin Li LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 18*a58d3d2aSXin Li A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR 19*a58d3d2aSXin Li CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 20*a58d3d2aSXin Li EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 21*a58d3d2aSXin Li PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 22*a58d3d2aSXin Li PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF 23*a58d3d2aSXin Li LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING 24*a58d3d2aSXin Li NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 25*a58d3d2aSXin Li SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 26*a58d3d2aSXin Li */ 27*a58d3d2aSXin Li 28*a58d3d2aSXin Li #ifndef ANALYSIS_H 29*a58d3d2aSXin Li #define ANALYSIS_H 30*a58d3d2aSXin Li 31*a58d3d2aSXin Li #include "celt.h" 32*a58d3d2aSXin Li #include "opus_private.h" 33*a58d3d2aSXin Li #include "mlp.h" 34*a58d3d2aSXin Li 35*a58d3d2aSXin Li #define NB_FRAMES 8 36*a58d3d2aSXin Li #define NB_TBANDS 18 37*a58d3d2aSXin Li #define ANALYSIS_BUF_SIZE 720 /* 30 ms at 24 kHz */ 38*a58d3d2aSXin Li 39*a58d3d2aSXin Li /* At that point we can stop counting frames because it no longer matters. */ 40*a58d3d2aSXin Li #define ANALYSIS_COUNT_MAX 10000 41*a58d3d2aSXin Li 42*a58d3d2aSXin Li #define DETECT_SIZE 100 43*a58d3d2aSXin Li 44*a58d3d2aSXin Li /* Uncomment this to print the MLP features on stdout. */ 45*a58d3d2aSXin Li /*#define MLP_TRAINING*/ 46*a58d3d2aSXin Li 47*a58d3d2aSXin Li typedef struct { 48*a58d3d2aSXin Li int arch; 49*a58d3d2aSXin Li int application; 50*a58d3d2aSXin Li opus_int32 Fs; 51*a58d3d2aSXin Li #define TONALITY_ANALYSIS_RESET_START angle 52*a58d3d2aSXin Li float angle[240]; 53*a58d3d2aSXin Li float d_angle[240]; 54*a58d3d2aSXin Li float d2_angle[240]; 55*a58d3d2aSXin Li opus_val32 inmem[ANALYSIS_BUF_SIZE]; 56*a58d3d2aSXin Li int mem_fill; /* number of usable samples in the buffer */ 57*a58d3d2aSXin Li float prev_band_tonality[NB_TBANDS]; 58*a58d3d2aSXin Li float prev_tonality; 59*a58d3d2aSXin Li int prev_bandwidth; 60*a58d3d2aSXin Li float E[NB_FRAMES][NB_TBANDS]; 61*a58d3d2aSXin Li float logE[NB_FRAMES][NB_TBANDS]; 62*a58d3d2aSXin Li float lowE[NB_TBANDS]; 63*a58d3d2aSXin Li float highE[NB_TBANDS]; 64*a58d3d2aSXin Li float meanE[NB_TBANDS+1]; 65*a58d3d2aSXin Li float mem[32]; 66*a58d3d2aSXin Li float cmean[8]; 67*a58d3d2aSXin Li float std[9]; 68*a58d3d2aSXin Li float Etracker; 69*a58d3d2aSXin Li float lowECount; 70*a58d3d2aSXin Li int E_count; 71*a58d3d2aSXin Li int count; 72*a58d3d2aSXin Li int analysis_offset; 73*a58d3d2aSXin Li int write_pos; 74*a58d3d2aSXin Li int read_pos; 75*a58d3d2aSXin Li int read_subframe; 76*a58d3d2aSXin Li float hp_ener_accum; 77*a58d3d2aSXin Li int initialized; 78*a58d3d2aSXin Li float rnn_state[MAX_NEURONS]; 79*a58d3d2aSXin Li opus_val32 downmix_state[3]; 80*a58d3d2aSXin Li AnalysisInfo info[DETECT_SIZE]; 81*a58d3d2aSXin Li } TonalityAnalysisState; 82*a58d3d2aSXin Li 83*a58d3d2aSXin Li /** Initialize a TonalityAnalysisState struct. 84*a58d3d2aSXin Li * 85*a58d3d2aSXin Li * This performs some possibly slow initialization steps which should 86*a58d3d2aSXin Li * not be repeated every analysis step. No allocated memory is retained 87*a58d3d2aSXin Li * by the state struct, so no cleanup call is required. 88*a58d3d2aSXin Li */ 89*a58d3d2aSXin Li void tonality_analysis_init(TonalityAnalysisState *analysis, opus_int32 Fs); 90*a58d3d2aSXin Li 91*a58d3d2aSXin Li /** Reset a TonalityAnalysisState stuct. 92*a58d3d2aSXin Li * 93*a58d3d2aSXin Li * Call this when there's a discontinuity in the data. 94*a58d3d2aSXin Li */ 95*a58d3d2aSXin Li void tonality_analysis_reset(TonalityAnalysisState *analysis); 96*a58d3d2aSXin Li 97*a58d3d2aSXin Li void tonality_get_info(TonalityAnalysisState *tonal, AnalysisInfo *info_out, int len); 98*a58d3d2aSXin Li 99*a58d3d2aSXin Li void run_analysis(TonalityAnalysisState *analysis, const CELTMode *celt_mode, const void *analysis_pcm, 100*a58d3d2aSXin Li int analysis_frame_size, int frame_size, int c1, int c2, int C, opus_int32 Fs, 101*a58d3d2aSXin Li int lsb_depth, downmix_func downmix, AnalysisInfo *analysis_info); 102*a58d3d2aSXin Li 103*a58d3d2aSXin Li #endif 104