xref: /aosp_15_r20/external/libopus/celt/arm/arm_celt_map.c (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /* Copyright (c) 2010 Xiph.Org Foundation
2*a58d3d2aSXin Li  * Copyright (c) 2013 Parrot */
3*a58d3d2aSXin Li /*
4*a58d3d2aSXin Li    Redistribution and use in source and binary forms, with or without
5*a58d3d2aSXin Li    modification, are permitted provided that the following conditions
6*a58d3d2aSXin Li    are met:
7*a58d3d2aSXin Li 
8*a58d3d2aSXin Li    - Redistributions of source code must retain the above copyright
9*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer.
10*a58d3d2aSXin Li 
11*a58d3d2aSXin Li    - Redistributions in binary form must reproduce the above copyright
12*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer in the
13*a58d3d2aSXin Li    documentation and/or other materials provided with the distribution.
14*a58d3d2aSXin Li 
15*a58d3d2aSXin Li    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16*a58d3d2aSXin Li    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17*a58d3d2aSXin Li    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
18*a58d3d2aSXin Li    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
19*a58d3d2aSXin Li    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20*a58d3d2aSXin Li    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21*a58d3d2aSXin Li    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22*a58d3d2aSXin Li    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
23*a58d3d2aSXin Li    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
24*a58d3d2aSXin Li    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*a58d3d2aSXin Li    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*a58d3d2aSXin Li */
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li #ifdef HAVE_CONFIG_H
29*a58d3d2aSXin Li #include "config.h"
30*a58d3d2aSXin Li #endif
31*a58d3d2aSXin Li 
32*a58d3d2aSXin Li #include "pitch.h"
33*a58d3d2aSXin Li #include "kiss_fft.h"
34*a58d3d2aSXin Li #include "mdct.h"
35*a58d3d2aSXin Li 
36*a58d3d2aSXin Li #if defined(OPUS_HAVE_RTCD)
37*a58d3d2aSXin Li 
38*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)
39*a58d3d2aSXin Li opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, const opus_val16 *y, int N) = {
40*a58d3d2aSXin Li   celt_inner_prod_c,   /* ARMv4 */
41*a58d3d2aSXin Li   celt_inner_prod_c,   /* EDSP */
42*a58d3d2aSXin Li   celt_inner_prod_c,   /* Media */
43*a58d3d2aSXin Li   celt_inner_prod_neon,/* NEON */
44*a58d3d2aSXin Li   celt_inner_prod_neon /* DOTPROD */
45*a58d3d2aSXin Li };
46*a58d3d2aSXin Li 
47*a58d3d2aSXin Li void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, const opus_val16 *y01, const opus_val16 *y02,
48*a58d3d2aSXin Li       int N, opus_val32 *xy1, opus_val32 *xy2) = {
49*a58d3d2aSXin Li   dual_inner_prod_c,   /* ARMv4 */
50*a58d3d2aSXin Li   dual_inner_prod_c,   /* EDSP */
51*a58d3d2aSXin Li   dual_inner_prod_c,   /* Media */
52*a58d3d2aSXin Li   dual_inner_prod_neon,/* NEON */
53*a58d3d2aSXin Li   dual_inner_prod_neon /* DOTPROD */
54*a58d3d2aSXin Li };
55*a58d3d2aSXin Li # endif
56*a58d3d2aSXin Li 
57*a58d3d2aSXin Li # if defined(FIXED_POINT)
58*a58d3d2aSXin Li #  if ((defined(OPUS_ARM_MAY_HAVE_NEON) && !defined(OPUS_ARM_PRESUME_NEON)) || \
59*a58d3d2aSXin Li     (defined(OPUS_ARM_MAY_HAVE_MEDIA) && !defined(OPUS_ARM_PRESUME_MEDIA)) || \
60*a58d3d2aSXin Li     (defined(OPUS_ARM_MAY_HAVE_EDSP) && !defined(OPUS_ARM_PRESUME_EDSP)))
61*a58d3d2aSXin Li opus_val32 (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *,
62*a58d3d2aSXin Li     const opus_val16 *, opus_val32 *, int, int, int) = {
63*a58d3d2aSXin Li   celt_pitch_xcorr_c,               /* ARMv4 */
64*a58d3d2aSXin Li   MAY_HAVE_EDSP(celt_pitch_xcorr),  /* EDSP */
65*a58d3d2aSXin Li   MAY_HAVE_MEDIA(celt_pitch_xcorr), /* Media */
66*a58d3d2aSXin Li   MAY_HAVE_NEON(celt_pitch_xcorr),  /* NEON */
67*a58d3d2aSXin Li   MAY_HAVE_NEON(celt_pitch_xcorr)   /* DOTPROD */
68*a58d3d2aSXin Li };
69*a58d3d2aSXin Li 
70*a58d3d2aSXin Li #  endif
71*a58d3d2aSXin Li # else /* !FIXED_POINT */
72*a58d3d2aSXin Li #  if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)
73*a58d3d2aSXin Li void (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *,
74*a58d3d2aSXin Li     const opus_val16 *, opus_val32 *, int, int, int) = {
75*a58d3d2aSXin Li   celt_pitch_xcorr_c,              /* ARMv4 */
76*a58d3d2aSXin Li   celt_pitch_xcorr_c,              /* EDSP */
77*a58d3d2aSXin Li   celt_pitch_xcorr_c,              /* Media */
78*a58d3d2aSXin Li   celt_pitch_xcorr_float_neon,     /* Neon */
79*a58d3d2aSXin Li   celt_pitch_xcorr_float_neon      /* DOTPROD */
80*a58d3d2aSXin Li };
81*a58d3d2aSXin Li #  endif
82*a58d3d2aSXin Li # endif /* FIXED_POINT */
83*a58d3d2aSXin Li 
84*a58d3d2aSXin Li #if defined(FIXED_POINT) && defined(OPUS_HAVE_RTCD) && \
85*a58d3d2aSXin Li  defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)
86*a58d3d2aSXin Li 
87*a58d3d2aSXin Li void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])(
88*a58d3d2aSXin Li          const opus_val16 *x,
89*a58d3d2aSXin Li          const opus_val16 *y,
90*a58d3d2aSXin Li          opus_val32       sum[4],
91*a58d3d2aSXin Li          int              len
92*a58d3d2aSXin Li ) = {
93*a58d3d2aSXin Li   xcorr_kernel_c,                /* ARMv4 */
94*a58d3d2aSXin Li   xcorr_kernel_c,                /* EDSP */
95*a58d3d2aSXin Li   xcorr_kernel_c,                /* Media */
96*a58d3d2aSXin Li   xcorr_kernel_neon_fixed,       /* Neon */
97*a58d3d2aSXin Li   xcorr_kernel_neon_fixed        /* DOTPROD */
98*a58d3d2aSXin Li };
99*a58d3d2aSXin Li 
100*a58d3d2aSXin Li #endif
101*a58d3d2aSXin Li 
102*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR)
103*a58d3d2aSXin Li #  if defined(HAVE_ARM_NE10)
104*a58d3d2aSXin Li #   if defined(CUSTOM_MODES)
105*a58d3d2aSXin Li int (*const OPUS_FFT_ALLOC_ARCH_IMPL[OPUS_ARCHMASK+1])(kiss_fft_state *st) = {
106*a58d3d2aSXin Li    opus_fft_alloc_arch_c,        /* ARMv4 */
107*a58d3d2aSXin Li    opus_fft_alloc_arch_c,        /* EDSP */
108*a58d3d2aSXin Li    opus_fft_alloc_arch_c,        /* Media */
109*a58d3d2aSXin Li    opus_fft_alloc_arm_neon,      /* Neon with NE10 library support */
110*a58d3d2aSXin Li    opus_fft_alloc_arm_neon       /* DOTPROD with NE10 library support */
111*a58d3d2aSXin Li };
112*a58d3d2aSXin Li 
113*a58d3d2aSXin Li void (*const OPUS_FFT_FREE_ARCH_IMPL[OPUS_ARCHMASK+1])(kiss_fft_state *st) = {
114*a58d3d2aSXin Li    opus_fft_free_arch_c,         /* ARMv4 */
115*a58d3d2aSXin Li    opus_fft_free_arch_c,         /* EDSP */
116*a58d3d2aSXin Li    opus_fft_free_arch_c,         /* Media */
117*a58d3d2aSXin Li    opus_fft_free_arm_neon,       /* Neon with NE10 */
118*a58d3d2aSXin Li    opus_fft_free_arm_neon        /* DOTPROD with NE10 */
119*a58d3d2aSXin Li };
120*a58d3d2aSXin Li #   endif /* CUSTOM_MODES */
121*a58d3d2aSXin Li 
122*a58d3d2aSXin Li void (*const OPUS_FFT[OPUS_ARCHMASK+1])(const kiss_fft_state *cfg,
123*a58d3d2aSXin Li                                         const kiss_fft_cpx *fin,
124*a58d3d2aSXin Li                                         kiss_fft_cpx *fout) = {
125*a58d3d2aSXin Li    opus_fft_c,                   /* ARMv4 */
126*a58d3d2aSXin Li    opus_fft_c,                   /* EDSP */
127*a58d3d2aSXin Li    opus_fft_c,                   /* Media */
128*a58d3d2aSXin Li    opus_fft_neon,                /* Neon with NE10 */
129*a58d3d2aSXin Li    opus_fft_neon                 /* DOTPROD with NE10 */
130*a58d3d2aSXin Li };
131*a58d3d2aSXin Li 
132*a58d3d2aSXin Li void (*const OPUS_IFFT[OPUS_ARCHMASK+1])(const kiss_fft_state *cfg,
133*a58d3d2aSXin Li                                          const kiss_fft_cpx *fin,
134*a58d3d2aSXin Li                                          kiss_fft_cpx *fout) = {
135*a58d3d2aSXin Li    opus_ifft_c,                   /* ARMv4 */
136*a58d3d2aSXin Li    opus_ifft_c,                   /* EDSP */
137*a58d3d2aSXin Li    opus_ifft_c,                   /* Media */
138*a58d3d2aSXin Li    opus_ifft_neon,                /* Neon with NE10 */
139*a58d3d2aSXin Li    opus_ifft_neon                 /* DOTPROD with NE10 */
140*a58d3d2aSXin Li };
141*a58d3d2aSXin Li 
142*a58d3d2aSXin Li void (*const CLT_MDCT_FORWARD_IMPL[OPUS_ARCHMASK+1])(const mdct_lookup *l,
143*a58d3d2aSXin Li                                                      kiss_fft_scalar *in,
144*a58d3d2aSXin Li                                                      kiss_fft_scalar * OPUS_RESTRICT out,
145*a58d3d2aSXin Li                                                      const opus_val16 *window,
146*a58d3d2aSXin Li                                                      int overlap, int shift,
147*a58d3d2aSXin Li                                                      int stride, int arch) = {
148*a58d3d2aSXin Li    clt_mdct_forward_c,           /* ARMv4 */
149*a58d3d2aSXin Li    clt_mdct_forward_c,           /* EDSP */
150*a58d3d2aSXin Li    clt_mdct_forward_c,           /* Media */
151*a58d3d2aSXin Li    clt_mdct_forward_neon,        /* Neon with NE10 */
152*a58d3d2aSXin Li    clt_mdct_forward_neon         /* DOTPROD with NE10 */
153*a58d3d2aSXin Li };
154*a58d3d2aSXin Li 
155*a58d3d2aSXin Li void (*const CLT_MDCT_BACKWARD_IMPL[OPUS_ARCHMASK+1])(const mdct_lookup *l,
156*a58d3d2aSXin Li                                                       kiss_fft_scalar *in,
157*a58d3d2aSXin Li                                                       kiss_fft_scalar * OPUS_RESTRICT out,
158*a58d3d2aSXin Li                                                       const opus_val16 *window,
159*a58d3d2aSXin Li                                                       int overlap, int shift,
160*a58d3d2aSXin Li                                                       int stride, int arch) = {
161*a58d3d2aSXin Li    clt_mdct_backward_c,           /* ARMv4 */
162*a58d3d2aSXin Li    clt_mdct_backward_c,           /* EDSP */
163*a58d3d2aSXin Li    clt_mdct_backward_c,           /* Media */
164*a58d3d2aSXin Li    clt_mdct_backward_neon,        /* Neon with NE10 */
165*a58d3d2aSXin Li    clt_mdct_backward_neon         /* DOTPROD with NE10 */
166*a58d3d2aSXin Li };
167*a58d3d2aSXin Li 
168*a58d3d2aSXin Li #  endif /* HAVE_ARM_NE10 */
169*a58d3d2aSXin Li # endif /* OPUS_ARM_MAY_HAVE_NEON_INTR */
170*a58d3d2aSXin Li 
171*a58d3d2aSXin Li #endif /* OPUS_HAVE_RTCD */
172