xref: /aosp_15_r20/external/libopus/celt/arm/pitch_arm.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
/* Copyright (c) 2010 Xiph.Org Foundation
 * Copyright (c) 2013 Parrot */
/*
   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li #if !defined(PITCH_ARM_H)
29*a58d3d2aSXin Li # define PITCH_ARM_H
30*a58d3d2aSXin Li 
31*a58d3d2aSXin Li # include "armcpu.h"
32*a58d3d2aSXin Li 
/* Prototypes for the *_neon inner-product routines. They are only declared
   when OPUS_ARM_MAY_HAVE_NEON_INTR is defined. */
# ifdef OPUS_ARM_MAY_HAVE_NEON_INTR
opus_val32 celt_inner_prod_neon(const opus_val16 *x,
                                const opus_val16 *y,
                                int N);
void dual_inner_prod_neon(const opus_val16 *x,
                          const opus_val16 *y01,
                          const opus_val16 *y02,
                          int N,
                          opus_val32 *xy1,
                          opus_val32 *xy2);

/* With OPUS_ARM_PRESUME_NEON defined and no RTCD, both generic names are
   routed through PRESUME_NEON() (not defined in this header; presumably it
   comes from armcpu.h). `arch` is evaluated and then discarded, so callers
   keep the same argument list. The OVERRIDE_* markers stop the later
   sections of this header from redefining the two macros. */
#  if defined(OPUS_ARM_PRESUME_NEON) && !defined(OPUS_HAVE_RTCD)
#   define celt_inner_prod(x, y, N, arch) \
      ((void)(arch), PRESUME_NEON(celt_inner_prod)(x, y, N))
#   define OVERRIDE_CELT_INNER_PROD (1)
#   define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \
      ((void)(arch), PRESUME_NEON(dual_inner_prod)(x, y01, y02, N, xy1, xy2))
#   define OVERRIDE_DUAL_INNER_PROD (1)
#  endif
# endif /* OPUS_ARM_MAY_HAVE_NEON_INTR */
45*a58d3d2aSXin Li 
/* Pick the celt_inner_prod() implementation for NEON intrinsics, unless
   OVERRIDE_CELT_INNER_PROD has already been defined. */
# ifndef OVERRIDE_CELT_INNER_PROD
#  if defined(OPUS_ARM_PRESUME_NEON_INTR)
/* NEON intrinsics are presumed: call the NEON routine directly. `arch` is
   evaluated and discarded. */
#   define celt_inner_prod(x, y, N, arch) \
      ((void)(arch), celt_inner_prod_neon(x, y, N))
#   define OVERRIDE_CELT_INNER_PROD (1)
#  elif defined(OPUS_HAVE_RTCD) && defined(OPUS_ARM_MAY_HAVE_NEON_INTR)
/* NEON intrinsics may be available and RTCD is enabled: dispatch through a
   table (defined elsewhere) indexed by arch & OPUS_ARCHMASK. */
extern opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(
        const opus_val16 *x,
        const opus_val16 *y,
        int N);
#   define celt_inner_prod(x, y, N, arch) \
      ((*CELT_INNER_PROD_IMPL[(arch)&OPUS_ARCHMASK])(x, y, N))
#   define OVERRIDE_CELT_INNER_PROD (1)
#  endif
# endif /* !OVERRIDE_CELT_INNER_PROD */
56*a58d3d2aSXin Li 
/* Pick the dual_inner_prod() implementation for NEON intrinsics, unless
   OVERRIDE_DUAL_INNER_PROD has already been defined. */
# ifndef OVERRIDE_DUAL_INNER_PROD
#  if defined(OPUS_ARM_PRESUME_NEON_INTR)
/* NEON intrinsics are presumed: call the NEON routine directly. `arch` is
   evaluated and discarded. */
#   define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \
      ((void)(arch), dual_inner_prod_neon(x, y01, y02, N, xy1, xy2))
#   define OVERRIDE_DUAL_INNER_PROD (1)
#  elif defined(OPUS_HAVE_RTCD) && defined(OPUS_ARM_MAY_HAVE_NEON_INTR)
/* NEON intrinsics may be available and RTCD is enabled: dispatch through a
   table (defined elsewhere) indexed by arch & OPUS_ARCHMASK. */
extern void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(
        const opus_val16 *x,
        const opus_val16 *y01,
        const opus_val16 *y02,
        int N,
        opus_val32 *xy1,
        opus_val32 *xy2);
#   define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) \
      ((*DUAL_INNER_PROD_IMPL[(arch)&OPUS_ARCHMASK])(x, y01, y02, N, xy1, xy2))
#   define OVERRIDE_DUAL_INNER_PROD (1)
#  endif
# endif /* !OVERRIDE_DUAL_INNER_PROD */
68*a58d3d2aSXin Li 
69*a58d3d2aSXin Li # if defined(FIXED_POINT)
70*a58d3d2aSXin Li 
/* Fixed-point celt_pitch_xcorr variant with the _neon suffix; declared only
   when OPUS_ARM_MAY_HAVE_NEON is defined. Returns an opus_val32. */
#  ifdef OPUS_ARM_MAY_HAVE_NEON
opus_val32 celt_pitch_xcorr_neon(const opus_val16 *_x,
                                 const opus_val16 *_y,
                                 opus_val32 *xcorr,
                                 int len,
                                 int max_pitch,
                                 int arch);
#  endif /* OPUS_ARM_MAY_HAVE_NEON */
75*a58d3d2aSXin Li 
/* No separate prototype is declared for the "media" variant in this header:
   the name is an alias for whatever MAY_HAVE_EDSP(celt_pitch_xcorr) expands
   to (MAY_HAVE_EDSP is not defined here; presumably in armcpu.h). */
#  ifdef OPUS_ARM_MAY_HAVE_MEDIA
#   define celt_pitch_xcorr_media MAY_HAVE_EDSP(celt_pitch_xcorr)
#  endif /* OPUS_ARM_MAY_HAVE_MEDIA */
79*a58d3d2aSXin Li 
/* Fixed-point celt_pitch_xcorr variant with the _edsp suffix; declared only
   when OPUS_ARM_MAY_HAVE_EDSP is defined. Returns an opus_val32. */
#  ifdef OPUS_ARM_MAY_HAVE_EDSP
opus_val32 celt_pitch_xcorr_edsp(const opus_val16 *_x,
                                 const opus_val16 *_y,
                                 opus_val32 *xcorr,
                                 int len,
                                 int max_pitch,
                                 int arch);
#  endif /* OPUS_ARM_MAY_HAVE_EDSP */
84*a58d3d2aSXin Li 
/* Fixed-point celt_pitch_xcorr() selection.
   First branch: RTCD is enabled and at least one of NEON / MEDIA / EDSP may
   be present without being presumed, so the call goes through a dispatch
   table (defined elsewhere) indexed by arch & OPUS_ARCHMASK.
   Second branch: at least one of the three is presumed, so the generic name
   maps to whatever PRESUME_NEON(celt_pitch_xcorr) expands to (PRESUME_NEON
   is not defined in this header; presumably in armcpu.h). */
#  if defined(OPUS_HAVE_RTCD) && \
    ((defined(OPUS_ARM_MAY_HAVE_EDSP) && !defined(OPUS_ARM_PRESUME_EDSP)) || \
     (defined(OPUS_ARM_MAY_HAVE_MEDIA) && !defined(OPUS_ARM_PRESUME_MEDIA)) || \
     (defined(OPUS_ARM_MAY_HAVE_NEON) && !defined(OPUS_ARM_PRESUME_NEON)))
extern opus_val32 (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(
      const opus_val16 *, const opus_val16 *, opus_val32 *, int, int, int);
/* Note: `arch` appears twice in the expansion (table index and last
   argument), so the argument expression is evaluated twice. */
#   define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \
      ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])( \
          _x, _y, xcorr, len, max_pitch, arch))
#   define OVERRIDE_PITCH_XCORR (1)

#  elif defined(OPUS_ARM_PRESUME_NEON) || \
    defined(OPUS_ARM_PRESUME_MEDIA) || \
    defined(OPUS_ARM_PRESUME_EDSP)
#   define celt_pitch_xcorr (PRESUME_NEON(celt_pitch_xcorr))
#   define OVERRIDE_PITCH_XCORR (1)

#  endif
104*a58d3d2aSXin Li 
/* Fixed-point xcorr kernel with the _neon_fixed suffix; declared only when
   OPUS_ARM_MAY_HAVE_NEON_INTR is defined. `sum` is declared as a 4-element
   array parameter. */
#  ifdef OPUS_ARM_MAY_HAVE_NEON_INTR
void xcorr_kernel_neon_fixed(const opus_val16 *x, const opus_val16 *y,
                             opus_val32 sum[4], int len);
#  endif /* OPUS_ARM_MAY_HAVE_NEON_INTR */
112*a58d3d2aSXin Li 
/* Fixed-point xcorr_kernel() selection for NEON intrinsics.
   First branch: RTCD is enabled and NEON intrinsics may be present without
   being presumed, so the call goes through a dispatch table.
   Second branch: NEON intrinsics are presumed, so the NEON routine is called
   directly. */
#  if defined(OPUS_HAVE_RTCD) && \
    (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR))

/* Dispatch table (defined elsewhere); the entry is chosen by
   arch & OPUS_ARCHMASK. */
extern void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])(
                    const opus_val16 *x,
                    const opus_val16 *y,
                    opus_val32       sum[4],
                    int              len);

#   define OVERRIDE_XCORR_KERNEL (1)
#   define xcorr_kernel(x, y, sum, len, arch) \
     ((*XCORR_KERNEL_IMPL[(arch) & OPUS_ARCHMASK])(x, y, sum, len))

#  elif defined(OPUS_ARM_PRESUME_NEON_INTR)
#   define OVERRIDE_XCORR_KERNEL (1)
/* `arch` is evaluated and discarded. It is parenthesised so that the (void)
   cast applies to the whole argument expression (e.g. `a ? b : c`), matching
   the other ((void)(arch), ...) macros in this header. */
#   define xcorr_kernel(x, y, sum, len, arch) \
      ((void)(arch), xcorr_kernel_neon_fixed(x, y, sum, len))

#  endif
132*a58d3d2aSXin Li 
133*a58d3d2aSXin Li #else /* Start !FIXED_POINT */
134*a58d3d2aSXin Li /* Float case */
/* Float-build celt_pitch_xcorr variant with the _float_neon suffix; declared
   only when OPUS_ARM_MAY_HAVE_NEON_INTR is defined. Unlike the fixed-point
   variants it returns void. */
#  ifdef OPUS_ARM_MAY_HAVE_NEON_INTR
void celt_pitch_xcorr_float_neon(const opus_val16 *_x,
                                 const opus_val16 *_y,
                                 opus_val32 *xcorr,
                                 int len,
                                 int max_pitch,
                                 int arch);
#  endif /* OPUS_ARM_MAY_HAVE_NEON_INTR */
139*a58d3d2aSXin Li 
/* Float-build celt_pitch_xcorr() selection for NEON intrinsics. */
#  if defined(OPUS_ARM_PRESUME_NEON_INTR)
/* NEON intrinsics are presumed: the generic name is a plain alias for the
   NEON routine, so `arch` is passed through unchanged. */
#   define celt_pitch_xcorr celt_pitch_xcorr_float_neon
#   define OVERRIDE_PITCH_XCORR (1)

#  elif defined(OPUS_HAVE_RTCD) && defined(OPUS_ARM_MAY_HAVE_NEON_INTR)
/* NEON intrinsics may be available and RTCD is enabled: dispatch through a
   table (defined elsewhere) indexed by arch & OPUS_ARCHMASK. The entries
   return void in the float build. */
extern void (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(
      const opus_val16 *, const opus_val16 *, opus_val32 *, int, int, int);

/* Note: `arch` appears twice in the expansion (table index and last
   argument), so the argument expression is evaluated twice. */
#   define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \
      ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])( \
          _x, _y, xcorr, len, max_pitch, arch))
#   define OVERRIDE_PITCH_XCORR (1)

#  endif
157*a58d3d2aSXin Li 
158*a58d3d2aSXin Li #endif /* end !FIXED_POINT */
159*a58d3d2aSXin Li 
160*a58d3d2aSXin Li #endif
161