/* Copyright (c) 2014, Cisco Systems, INC
   Written by XiangMingZhu WeiZhou MinPeng YanWang

   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/

/* Declarations and dispatch macros for the SSE4.1 variants of
 * silk_burg_modified() and silk_inner_prod16().
 *
 * For each routine one of two dispatch forms is selected:
 *   - OPUS_X86_PRESUME_SSE4_1: the generic name expands to a direct call
 *     of the *_sse4_1 function.
 *   - OPUS_HAVE_RTCD (and SSE4.1 not presumed): the generic name expands
 *     to a call through a function-pointer table indexed by
 *     (arch) & OPUS_ARCHMASK.
 * If neither is defined, no override macro is provided by this header.
 *
 * NOTE(review): this header uses opus_int, opus_int16, opus_int32,
 * opus_int64 and OPUS_ARCHMASK without including their definitions;
 * presumably the including file provides them first -- confirm.
 */

#ifndef SIGPROC_FIX_SSE_H
# define SIGPROC_FIX_SSE_H

# ifdef HAVE_CONFIG_H
#  include "config.h"
# endif

# if defined(OPUS_X86_MAY_HAVE_SSE4_1)
void silk_burg_modified_sse4_1(
    opus_int32                  *res_nrg,           /* O    Residual energy                                             */
    opus_int                    *res_nrg_Q,         /* O    Residual energy Q value                                     */
    opus_int32                  A_Q16[],            /* O    Prediction coefficients (length order)                      */
    const opus_int16            x[],                /* I    Input signal, length: nb_subfr * ( D + subfr_length )       */
    const opus_int32            minInvGain_Q30,     /* I    Inverse of max prediction gain                              */
    const opus_int              subfr_length,       /* I    Input signal subframe length (incl. D preceding samples)    */
    const opus_int              nb_subfr,           /* I    Number of subframes stacked in x                            */
    const opus_int              D,                  /* I    Order                                                       */
    int                         arch                /* I    Run-time architecture                                       */
);

#  if defined(OPUS_X86_PRESUME_SSE4_1)

/* SSE4.1 is presumed: call the SSE4.1 implementation directly. */
#   define OVERRIDE_silk_burg_modified
#   define silk_burg_modified(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch) \
    ((void)(arch), silk_burg_modified_sse4_1(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch))

#  elif defined(OPUS_HAVE_RTCD)

/* Run-time dispatch: table of implementations, one entry per masked arch value. */
extern void (*const SILK_BURG_MODIFIED_IMPL[OPUS_ARCHMASK + 1])(
    opus_int32                  *res_nrg,           /* O    Residual energy                                             */
    opus_int                    *res_nrg_Q,         /* O    Residual energy Q value                                     */
    opus_int32                  A_Q16[],            /* O    Prediction coefficients (length order)                      */
    const opus_int16            x[],                /* I    Input signal, length: nb_subfr * ( D + subfr_length )       */
    const opus_int32            minInvGain_Q30,     /* I    Inverse of max prediction gain                              */
    const opus_int              subfr_length,       /* I    Input signal subframe length (incl. D preceding samples)    */
    const opus_int              nb_subfr,           /* I    Number of subframes stacked in x                            */
    const opus_int              D,                  /* I    Order                                                       */
    int                         arch                /* I    Run-time architecture                                       */);

#   define OVERRIDE_silk_burg_modified
#   define silk_burg_modified(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch) \
    ((*SILK_BURG_MODIFIED_IMPL[(arch) & OPUS_ARCHMASK])(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch))

#  endif

opus_int64 silk_inner_prod16_sse4_1(
    const opus_int16            *inVec1,
    const opus_int16            *inVec2,
    const opus_int              len
);


#  if defined(OPUS_X86_PRESUME_SSE4_1)

/* SSE4.1 is presumed: arch is evaluated and discarded, since the
 * SSE4.1 function takes no arch argument. */
#   define OVERRIDE_silk_inner_prod16
#   define silk_inner_prod16(inVec1, inVec2, len, arch) \
    ((void)(arch),silk_inner_prod16_sse4_1(inVec1, inVec2, len))

#  elif defined(OPUS_HAVE_RTCD)

/* Run-time dispatch: arch only selects the table entry and is not
 * forwarded to the selected implementation. */
extern opus_int64 (*const SILK_INNER_PROD16_IMPL[OPUS_ARCHMASK + 1])(
    const opus_int16            *inVec1,
    const opus_int16            *inVec2,
    const opus_int              len);

#   define OVERRIDE_silk_inner_prod16
#   define silk_inner_prod16(inVec1, inVec2, len, arch) \
    ((*SILK_INNER_PROD16_IMPL[(arch) & OPUS_ARCHMASK])(inVec1, inVec2, len))

#  endif
# endif
#endif