xref: /aosp_15_r20/external/libopus/celt/pitch.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
/* Copyright (c) 2007-2008 CSIRO
   Copyright (c) 2007-2009 Xiph.Org Foundation
   Written by Jean-Marc Valin */
/**
   @file pitch.h
   @brief Pitch analysis
 */

/*
   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/

34*a58d3d2aSXin Li #ifndef PITCH_H
35*a58d3d2aSXin Li #define PITCH_H
36*a58d3d2aSXin Li 
37*a58d3d2aSXin Li #include "modes.h"
38*a58d3d2aSXin Li #include "cpu_support.h"
39*a58d3d2aSXin Li 
40*a58d3d2aSXin Li #if (defined(OPUS_X86_MAY_HAVE_SSE) && !defined(FIXED_POINT)) \
41*a58d3d2aSXin Li   || ((defined(OPUS_X86_MAY_HAVE_SSE4_1) || defined(OPUS_X86_MAY_HAVE_SSE2)) && defined(FIXED_POINT))
42*a58d3d2aSXin Li #include "x86/pitch_sse.h"
43*a58d3d2aSXin Li #endif
44*a58d3d2aSXin Li 
45*a58d3d2aSXin Li #if defined(MIPSr1_ASM)
46*a58d3d2aSXin Li #include "mips/pitch_mipsr1.h"
47*a58d3d2aSXin Li #endif
48*a58d3d2aSXin Li 
49*a58d3d2aSXin Li #if (defined(OPUS_ARM_ASM) || defined(OPUS_ARM_MAY_HAVE_NEON_INTR))
50*a58d3d2aSXin Li # include "arm/pitch_arm.h"
51*a58d3d2aSXin Li #endif
52*a58d3d2aSXin Li 
53*a58d3d2aSXin Li void pitch_downsample(celt_sig * OPUS_RESTRICT x[], opus_val16 * OPUS_RESTRICT x_lp,
54*a58d3d2aSXin Li       int len, int C, int arch);
55*a58d3d2aSXin Li 
56*a58d3d2aSXin Li void pitch_search(const opus_val16 * OPUS_RESTRICT x_lp, opus_val16 * OPUS_RESTRICT y,
57*a58d3d2aSXin Li                   int len, int max_pitch, int *pitch, int arch);
58*a58d3d2aSXin Li 
59*a58d3d2aSXin Li opus_val16 remove_doubling(opus_val16 *x, int maxperiod, int minperiod,
60*a58d3d2aSXin Li       int N, int *T0, int prev_period, opus_val16 prev_gain, int arch);
61*a58d3d2aSXin Li 
62*a58d3d2aSXin Li 
63*a58d3d2aSXin Li /* OPT: This is the kernel you really want to optimize. It gets used a lot
64*a58d3d2aSXin Li    by the prefilter and by the PLC. */
xcorr_kernel_c(const opus_val16 * x,const opus_val16 * y,opus_val32 sum[4],int len)65*a58d3d2aSXin Li static OPUS_INLINE void xcorr_kernel_c(const opus_val16 * x, const opus_val16 * y, opus_val32 sum[4], int len)
66*a58d3d2aSXin Li {
67*a58d3d2aSXin Li    int j;
68*a58d3d2aSXin Li    opus_val16 y_0, y_1, y_2, y_3;
69*a58d3d2aSXin Li    celt_assert(len>=3);
70*a58d3d2aSXin Li    y_3=0; /* gcc doesn't realize that y_3 can't be used uninitialized */
71*a58d3d2aSXin Li    y_0=*y++;
72*a58d3d2aSXin Li    y_1=*y++;
73*a58d3d2aSXin Li    y_2=*y++;
74*a58d3d2aSXin Li    for (j=0;j<len-3;j+=4)
75*a58d3d2aSXin Li    {
76*a58d3d2aSXin Li       opus_val16 tmp;
77*a58d3d2aSXin Li       tmp = *x++;
78*a58d3d2aSXin Li       y_3=*y++;
79*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_0);
80*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_1);
81*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_2);
82*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_3);
83*a58d3d2aSXin Li       tmp=*x++;
84*a58d3d2aSXin Li       y_0=*y++;
85*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_1);
86*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_2);
87*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_3);
88*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_0);
89*a58d3d2aSXin Li       tmp=*x++;
90*a58d3d2aSXin Li       y_1=*y++;
91*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_2);
92*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_3);
93*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_0);
94*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_1);
95*a58d3d2aSXin Li       tmp=*x++;
96*a58d3d2aSXin Li       y_2=*y++;
97*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_3);
98*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_0);
99*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_1);
100*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_2);
101*a58d3d2aSXin Li    }
102*a58d3d2aSXin Li    if (j++<len)
103*a58d3d2aSXin Li    {
104*a58d3d2aSXin Li       opus_val16 tmp = *x++;
105*a58d3d2aSXin Li       y_3=*y++;
106*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_0);
107*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_1);
108*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_2);
109*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_3);
110*a58d3d2aSXin Li    }
111*a58d3d2aSXin Li    if (j++<len)
112*a58d3d2aSXin Li    {
113*a58d3d2aSXin Li       opus_val16 tmp=*x++;
114*a58d3d2aSXin Li       y_0=*y++;
115*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_1);
116*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_2);
117*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_3);
118*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_0);
119*a58d3d2aSXin Li    }
120*a58d3d2aSXin Li    if (j<len)
121*a58d3d2aSXin Li    {
122*a58d3d2aSXin Li       opus_val16 tmp=*x++;
123*a58d3d2aSXin Li       y_1=*y++;
124*a58d3d2aSXin Li       sum[0] = MAC16_16(sum[0],tmp,y_2);
125*a58d3d2aSXin Li       sum[1] = MAC16_16(sum[1],tmp,y_3);
126*a58d3d2aSXin Li       sum[2] = MAC16_16(sum[2],tmp,y_0);
127*a58d3d2aSXin Li       sum[3] = MAC16_16(sum[3],tmp,y_1);
128*a58d3d2aSXin Li    }
129*a58d3d2aSXin Li }
130*a58d3d2aSXin Li 
/* Default dispatch: unless OVERRIDE_XCORR_KERNEL is defined, xcorr_kernel()
   evaluates and discards `arch`, then calls the generic C kernel. */
#ifndef OVERRIDE_XCORR_KERNEL
#define xcorr_kernel(x, y, sum, len, arch) \
    ((void)(arch),xcorr_kernel_c(x, y, sum, len))
#endif /* OVERRIDE_XCORR_KERNEL */


dual_inner_prod_c(const opus_val16 * x,const opus_val16 * y01,const opus_val16 * y02,int N,opus_val32 * xy1,opus_val32 * xy2)137*a58d3d2aSXin Li static OPUS_INLINE void dual_inner_prod_c(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02,
138*a58d3d2aSXin Li       int N, opus_val32 *xy1, opus_val32 *xy2)
139*a58d3d2aSXin Li {
140*a58d3d2aSXin Li    int i;
141*a58d3d2aSXin Li    opus_val32 xy01=0;
142*a58d3d2aSXin Li    opus_val32 xy02=0;
143*a58d3d2aSXin Li    for (i=0;i<N;i++)
144*a58d3d2aSXin Li    {
145*a58d3d2aSXin Li       xy01 = MAC16_16(xy01, x[i], y01[i]);
146*a58d3d2aSXin Li       xy02 = MAC16_16(xy02, x[i], y02[i]);
147*a58d3d2aSXin Li    }
148*a58d3d2aSXin Li    *xy1 = xy01;
149*a58d3d2aSXin Li    *xy2 = xy02;
150*a58d3d2aSXin Li }
151*a58d3d2aSXin Li 
/* Default dispatch: unless OVERRIDE_DUAL_INNER_PROD is defined,
   dual_inner_prod() evaluates and discards `arch`, then calls the generic C
   version. */
#ifndef OVERRIDE_DUAL_INNER_PROD
# define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \
    ((void)(arch),dual_inner_prod_c(x, y01, y02, N, xy1, xy2))
#endif

157*a58d3d2aSXin Li /*We make sure a C version is always available for cases where the overhead of
158*a58d3d2aSXin Li   vectorization and passing around an arch flag aren't worth it.*/
celt_inner_prod_c(const opus_val16 * x,const opus_val16 * y,int N)159*a58d3d2aSXin Li static OPUS_INLINE opus_val32 celt_inner_prod_c(const opus_val16 *x,
160*a58d3d2aSXin Li       const opus_val16 *y, int N)
161*a58d3d2aSXin Li {
162*a58d3d2aSXin Li    int i;
163*a58d3d2aSXin Li    opus_val32 xy=0;
164*a58d3d2aSXin Li    for (i=0;i<N;i++)
165*a58d3d2aSXin Li       xy = MAC16_16(xy, x[i], y[i]);
166*a58d3d2aSXin Li    return xy;
167*a58d3d2aSXin Li }
168*a58d3d2aSXin Li 
/* Default dispatch: unless OVERRIDE_CELT_INNER_PROD is defined,
   celt_inner_prod() evaluates and discards `arch`, then calls the generic C
   version. */
#if !defined(OVERRIDE_CELT_INNER_PROD)
# define celt_inner_prod(x, y, N, arch) \
    ((void)(arch),celt_inner_prod_c(x, y, N))
#endif

174*a58d3d2aSXin Li #ifdef NON_STATIC_COMB_FILTER_CONST_C
175*a58d3d2aSXin Li void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N,
176*a58d3d2aSXin Li      opus_val16 g10, opus_val16 g11, opus_val16 g12);
177*a58d3d2aSXin Li #endif
178*a58d3d2aSXin Li 
179*a58d3d2aSXin Li 
180*a58d3d2aSXin Li #ifdef FIXED_POINT
181*a58d3d2aSXin Li opus_val32
182*a58d3d2aSXin Li #else
183*a58d3d2aSXin Li void
184*a58d3d2aSXin Li #endif
185*a58d3d2aSXin Li celt_pitch_xcorr_c(const opus_val16 *_x, const opus_val16 *_y,
186*a58d3d2aSXin Li       opus_val32 *xcorr, int len, int max_pitch, int arch);
187*a58d3d2aSXin Li 
188*a58d3d2aSXin Li #ifndef OVERRIDE_PITCH_XCORR
189*a58d3d2aSXin Li # define celt_pitch_xcorr celt_pitch_xcorr_c
190*a58d3d2aSXin Li #endif
191*a58d3d2aSXin Li 
192*a58d3d2aSXin Li #ifdef NON_STATIC_COMB_FILTER_CONST_C
193*a58d3d2aSXin Li void comb_filter_const_c(opus_val32 *y, opus_val32 *x, int T, int N,
194*a58d3d2aSXin Li                          opus_val16 g10, opus_val16 g11, opus_val16 g12);
195*a58d3d2aSXin Li #endif
196*a58d3d2aSXin Li 
197*a58d3d2aSXin Li #ifndef OVERRIDE_COMB_FILTER_CONST
198*a58d3d2aSXin Li # define comb_filter_const(y, x, T, N, g10, g11, g12, arch) \
199*a58d3d2aSXin Li     ((void)(arch),comb_filter_const_c(y, x, T, N, g10, g11, g12))
200*a58d3d2aSXin Li #endif
201*a58d3d2aSXin Li 
202*a58d3d2aSXin Li 
203*a58d3d2aSXin Li #endif
204