1*a58d3d2aSXin Li /* Copyright (c) 2010 Xiph.Org Foundation 2*a58d3d2aSXin Li * Copyright (c) 2013 Parrot */ 3*a58d3d2aSXin Li /* 4*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without 5*a58d3d2aSXin Li modification, are permitted provided that the following conditions 6*a58d3d2aSXin Li are met: 7*a58d3d2aSXin Li 8*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright 9*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer. 10*a58d3d2aSXin Li 11*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright 12*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the 13*a58d3d2aSXin Li documentation and/or other materials provided with the distribution. 14*a58d3d2aSXin Li 15*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 16*a58d3d2aSXin Li ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 17*a58d3d2aSXin Li LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 18*a58d3d2aSXin Li A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER 19*a58d3d2aSXin Li OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 20*a58d3d2aSXin Li EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 21*a58d3d2aSXin Li PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 22*a58d3d2aSXin Li PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF 23*a58d3d2aSXin Li LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING 24*a58d3d2aSXin Li NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS 25*a58d3d2aSXin Li SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 26*a58d3d2aSXin Li */ 27*a58d3d2aSXin Li 28*a58d3d2aSXin Li #if !defined(PITCH_ARM_H) 29*a58d3d2aSXin Li # define PITCH_ARM_H 30*a58d3d2aSXin Li 31*a58d3d2aSXin Li # include "armcpu.h" 32*a58d3d2aSXin Li 33*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) 34*a58d3d2aSXin Li opus_val32 celt_inner_prod_neon(const opus_val16 *x, const opus_val16 *y, int N); 35*a58d3d2aSXin Li void dual_inner_prod_neon(const opus_val16 *x, const opus_val16 *y01, 36*a58d3d2aSXin Li const opus_val16 *y02, int N, opus_val32 *xy1, opus_val32 *xy2); 37*a58d3d2aSXin Li 38*a58d3d2aSXin Li # if !defined(OPUS_HAVE_RTCD) && defined(OPUS_ARM_PRESUME_NEON) 39*a58d3d2aSXin Li # define OVERRIDE_CELT_INNER_PROD (1) 40*a58d3d2aSXin Li # define OVERRIDE_DUAL_INNER_PROD (1) 41*a58d3d2aSXin Li # define celt_inner_prod(x, y, N, arch) ((void)(arch), PRESUME_NEON(celt_inner_prod)(x, y, N)) 42*a58d3d2aSXin Li # define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) ((void)(arch), PRESUME_NEON(dual_inner_prod)(x, y01, y02, N, xy1, xy2)) 43*a58d3d2aSXin Li # endif 44*a58d3d2aSXin Li # endif 45*a58d3d2aSXin Li 46*a58d3d2aSXin Li # if !defined(OVERRIDE_CELT_INNER_PROD) 47*a58d3d2aSXin Li # if defined(OPUS_HAVE_RTCD) && (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) 48*a58d3d2aSXin Li extern opus_val32 (*const CELT_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, const opus_val16 *y, int N); 49*a58d3d2aSXin Li # define OVERRIDE_CELT_INNER_PROD (1) 50*a58d3d2aSXin Li # define celt_inner_prod(x, y, N, arch) ((*CELT_INNER_PROD_IMPL[(arch)&OPUS_ARCHMASK])(x, y, N)) 51*a58d3d2aSXin Li # elif defined(OPUS_ARM_PRESUME_NEON_INTR) 52*a58d3d2aSXin Li # define OVERRIDE_CELT_INNER_PROD (1) 53*a58d3d2aSXin Li # define celt_inner_prod(x, y, N, arch) ((void)(arch), celt_inner_prod_neon(x, y, N)) 54*a58d3d2aSXin Li # endif 55*a58d3d2aSXin Li # endif 56*a58d3d2aSXin Li 57*a58d3d2aSXin Li # if !defined(OVERRIDE_DUAL_INNER_PROD) 58*a58d3d2aSXin Li # if defined(OPUS_HAVE_RTCD) && (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) 59*a58d3d2aSXin Li extern void (*const DUAL_INNER_PROD_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *x, 60*a58d3d2aSXin Li const opus_val16 *y01, const opus_val16 *y02, int N, opus_val32 *xy1, opus_val32 *xy2); 61*a58d3d2aSXin Li # define OVERRIDE_DUAL_INNER_PROD (1) 62*a58d3d2aSXin Li # define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) ((*DUAL_INNER_PROD_IMPL[(arch)&OPUS_ARCHMASK])(x, y01, y02, N, xy1, xy2)) 63*a58d3d2aSXin Li # elif defined(OPUS_ARM_PRESUME_NEON_INTR) 64*a58d3d2aSXin Li # define OVERRIDE_DUAL_INNER_PROD (1) 65*a58d3d2aSXin Li # define dual_inner_prod(x, y01, y02, N, xy1, xy2, arch) ((void)(arch), dual_inner_prod_neon(x, y01, y02, N, xy1, xy2)) 66*a58d3d2aSXin Li # endif 67*a58d3d2aSXin Li # endif 68*a58d3d2aSXin Li 69*a58d3d2aSXin Li # if defined(FIXED_POINT) 70*a58d3d2aSXin Li 71*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_NEON) 72*a58d3d2aSXin Li opus_val32 celt_pitch_xcorr_neon(const opus_val16 *_x, const opus_val16 *_y, 73*a58d3d2aSXin Li opus_val32 *xcorr, int len, int max_pitch, int arch); 74*a58d3d2aSXin Li # endif 75*a58d3d2aSXin Li 76*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_MEDIA) 77*a58d3d2aSXin Li # define celt_pitch_xcorr_media MAY_HAVE_EDSP(celt_pitch_xcorr) 78*a58d3d2aSXin Li # endif 79*a58d3d2aSXin Li 80*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_EDSP) 81*a58d3d2aSXin Li opus_val32 celt_pitch_xcorr_edsp(const opus_val16 *_x, const opus_val16 *_y, 82*a58d3d2aSXin Li opus_val32 *xcorr, int len, int max_pitch, int arch); 83*a58d3d2aSXin Li # endif 84*a58d3d2aSXin Li 85*a58d3d2aSXin Li # if defined(OPUS_HAVE_RTCD) && \ 86*a58d3d2aSXin Li ((defined(OPUS_ARM_MAY_HAVE_NEON) && !defined(OPUS_ARM_PRESUME_NEON)) || \ 87*a58d3d2aSXin Li (defined(OPUS_ARM_MAY_HAVE_MEDIA) && !defined(OPUS_ARM_PRESUME_MEDIA)) || \ 88*a58d3d2aSXin Li (defined(OPUS_ARM_MAY_HAVE_EDSP) && !defined(OPUS_ARM_PRESUME_EDSP))) 89*a58d3d2aSXin Li extern opus_val32 90*a58d3d2aSXin Li (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, 91*a58d3d2aSXin Li const opus_val16 *, opus_val32 *, int, int, int); 92*a58d3d2aSXin Li # define OVERRIDE_PITCH_XCORR (1) 93*a58d3d2aSXin Li # define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \ 94*a58d3d2aSXin Li ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])(_x, _y, \ 95*a58d3d2aSXin Li xcorr, len, max_pitch, arch)) 96*a58d3d2aSXin Li 97*a58d3d2aSXin Li # elif defined(OPUS_ARM_PRESUME_EDSP) || \ 98*a58d3d2aSXin Li defined(OPUS_ARM_PRESUME_MEDIA) || \ 99*a58d3d2aSXin Li defined(OPUS_ARM_PRESUME_NEON) 100*a58d3d2aSXin Li # define OVERRIDE_PITCH_XCORR (1) 101*a58d3d2aSXin Li # define celt_pitch_xcorr (PRESUME_NEON(celt_pitch_xcorr)) 102*a58d3d2aSXin Li 103*a58d3d2aSXin Li # endif 104*a58d3d2aSXin Li 105*a58d3d2aSXin Li # if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) 106*a58d3d2aSXin Li void xcorr_kernel_neon_fixed( 107*a58d3d2aSXin Li const opus_val16 *x, 108*a58d3d2aSXin Li const opus_val16 *y, 109*a58d3d2aSXin Li opus_val32 sum[4], 110*a58d3d2aSXin Li int len); 111*a58d3d2aSXin Li # endif 112*a58d3d2aSXin Li 113*a58d3d2aSXin Li # if defined(OPUS_HAVE_RTCD) && \ 114*a58d3d2aSXin Li (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) 115*a58d3d2aSXin Li 116*a58d3d2aSXin Li extern void (*const XCORR_KERNEL_IMPL[OPUS_ARCHMASK + 1])( 117*a58d3d2aSXin Li const opus_val16 *x, 118*a58d3d2aSXin Li const opus_val16 *y, 119*a58d3d2aSXin Li opus_val32 sum[4], 120*a58d3d2aSXin Li int len); 121*a58d3d2aSXin Li 122*a58d3d2aSXin Li # define OVERRIDE_XCORR_KERNEL (1) 123*a58d3d2aSXin Li # define xcorr_kernel(x, y, sum, len, arch) \ 124*a58d3d2aSXin Li ((*XCORR_KERNEL_IMPL[(arch) & OPUS_ARCHMASK])(x, y, sum, len)) 125*a58d3d2aSXin Li 126*a58d3d2aSXin Li # elif defined(OPUS_ARM_PRESUME_NEON_INTR) 127*a58d3d2aSXin Li # define OVERRIDE_XCORR_KERNEL (1) 128*a58d3d2aSXin Li # define xcorr_kernel(x, y, sum, len, arch) \ 129*a58d3d2aSXin Li ((void)arch, xcorr_kernel_neon_fixed(x, y, sum, len)) 130*a58d3d2aSXin Li 131*a58d3d2aSXin Li # endif 132*a58d3d2aSXin Li 133*a58d3d2aSXin Li #else /* Start !FIXED_POINT */ 134*a58d3d2aSXin Li /* Float case */ 135*a58d3d2aSXin Li #if defined(OPUS_ARM_MAY_HAVE_NEON_INTR) 136*a58d3d2aSXin Li void celt_pitch_xcorr_float_neon(const opus_val16 *_x, const opus_val16 *_y, 137*a58d3d2aSXin Li opus_val32 *xcorr, int len, int max_pitch, int arch); 138*a58d3d2aSXin Li #endif 139*a58d3d2aSXin Li 140*a58d3d2aSXin Li # if defined(OPUS_HAVE_RTCD) && \ 141*a58d3d2aSXin Li (defined(OPUS_ARM_MAY_HAVE_NEON_INTR) && !defined(OPUS_ARM_PRESUME_NEON_INTR)) 142*a58d3d2aSXin Li extern void 143*a58d3d2aSXin Li (*const CELT_PITCH_XCORR_IMPL[OPUS_ARCHMASK+1])(const opus_val16 *, 144*a58d3d2aSXin Li const opus_val16 *, opus_val32 *, int, int, int); 145*a58d3d2aSXin Li 146*a58d3d2aSXin Li # define OVERRIDE_PITCH_XCORR (1) 147*a58d3d2aSXin Li # define celt_pitch_xcorr(_x, _y, xcorr, len, max_pitch, arch) \ 148*a58d3d2aSXin Li ((*CELT_PITCH_XCORR_IMPL[(arch)&OPUS_ARCHMASK])(_x, _y, \ 149*a58d3d2aSXin Li xcorr, len, max_pitch, arch)) 150*a58d3d2aSXin Li 151*a58d3d2aSXin Li # elif defined(OPUS_ARM_PRESUME_NEON_INTR) 152*a58d3d2aSXin Li 153*a58d3d2aSXin Li # define OVERRIDE_PITCH_XCORR (1) 154*a58d3d2aSXin Li # define celt_pitch_xcorr celt_pitch_xcorr_float_neon 155*a58d3d2aSXin Li 156*a58d3d2aSXin Li # endif 157*a58d3d2aSXin Li 158*a58d3d2aSXin Li #endif /* end !FIXED_POINT */ 159*a58d3d2aSXin Li 160*a58d3d2aSXin Li #endif 161