xref: /aosp_15_r20/external/libopus/silk/x86/SigProc_FIX_sse.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /* Copyright (c) 2014, Cisco Systems, INC
2*a58d3d2aSXin Li    Written by XiangMingZhu WeiZhou MinPeng YanWang
3*a58d3d2aSXin Li 
4*a58d3d2aSXin Li    Redistribution and use in source and binary forms, with or without
5*a58d3d2aSXin Li    modification, are permitted provided that the following conditions
6*a58d3d2aSXin Li    are met:
7*a58d3d2aSXin Li 
8*a58d3d2aSXin Li    - Redistributions of source code must retain the above copyright
9*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer.
10*a58d3d2aSXin Li 
11*a58d3d2aSXin Li    - Redistributions in binary form must reproduce the above copyright
12*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer in the
13*a58d3d2aSXin Li    documentation and/or other materials provided with the distribution.
14*a58d3d2aSXin Li 
15*a58d3d2aSXin Li    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16*a58d3d2aSXin Li    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17*a58d3d2aSXin Li    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
18*a58d3d2aSXin Li    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
19*a58d3d2aSXin Li    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20*a58d3d2aSXin Li    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21*a58d3d2aSXin Li    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22*a58d3d2aSXin Li    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
23*a58d3d2aSXin Li    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
24*a58d3d2aSXin Li    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*a58d3d2aSXin Li    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*a58d3d2aSXin Li */
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li #ifndef SIGPROC_FIX_SSE_H
29*a58d3d2aSXin Li # define SIGPROC_FIX_SSE_H
30*a58d3d2aSXin Li 
31*a58d3d2aSXin Li # ifdef HAVE_CONFIG_H
32*a58d3d2aSXin Li #  include "config.h"
33*a58d3d2aSXin Li # endif
34*a58d3d2aSXin Li 
35*a58d3d2aSXin Li # if defined(OPUS_X86_MAY_HAVE_SSE4_1)
36*a58d3d2aSXin Li void silk_burg_modified_sse4_1(
37*a58d3d2aSXin Li     opus_int32                  *res_nrg,           /* O    Residual energy                                             */
38*a58d3d2aSXin Li     opus_int                    *res_nrg_Q,         /* O    Residual energy Q value                                     */
39*a58d3d2aSXin Li     opus_int32                  A_Q16[],            /* O    Prediction coefficients (length order)                      */
40*a58d3d2aSXin Li     const opus_int16            x[],                /* I    Input signal, length: nb_subfr * ( D + subfr_length )       */
41*a58d3d2aSXin Li     const opus_int32            minInvGain_Q30,     /* I    Inverse of max prediction gain                              */
42*a58d3d2aSXin Li     const opus_int              subfr_length,       /* I    Input signal subframe length (incl. D preceding samples)    */
43*a58d3d2aSXin Li     const opus_int              nb_subfr,           /* I    Number of subframes stacked in x                            */
44*a58d3d2aSXin Li     const opus_int              D,                  /* I    Order                                                       */
45*a58d3d2aSXin Li     int                         arch                /* I    Run-time architecture                                       */
46*a58d3d2aSXin Li );
47*a58d3d2aSXin Li 
48*a58d3d2aSXin Li #  if defined(OPUS_X86_PRESUME_SSE4_1)
49*a58d3d2aSXin Li 
/* SSE4.1 is presumed at build time, so silk_burg_modified() binds directly to
 * the SSE4.1 routine with no table lookup. `arch` is forwarded as the last
 * argument, which already counts as a use; it is deliberately NOT also
 * expanded in a separate (void) cast, so an argument expression with side
 * effects is evaluated exactly once. */
#   define OVERRIDE_silk_burg_modified
#   define silk_burg_modified(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch) \
       (silk_burg_modified_sse4_1(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch))
53*a58d3d2aSXin Li 
54*a58d3d2aSXin Li #  elif defined(OPUS_HAVE_RTCD)
55*a58d3d2aSXin Li 
56*a58d3d2aSXin Li extern void (*const SILK_BURG_MODIFIED_IMPL[OPUS_ARCHMASK + 1])(
57*a58d3d2aSXin Li     opus_int32                  *res_nrg,           /* O    Residual energy                                             */
58*a58d3d2aSXin Li     opus_int                    *res_nrg_Q,         /* O    Residual energy Q value                                     */
59*a58d3d2aSXin Li     opus_int32                  A_Q16[],            /* O    Prediction coefficients (length order)                      */
60*a58d3d2aSXin Li     const opus_int16            x[],                /* I    Input signal, length: nb_subfr * ( D + subfr_length )       */
61*a58d3d2aSXin Li     const opus_int32            minInvGain_Q30,     /* I    Inverse of max prediction gain                              */
62*a58d3d2aSXin Li     const opus_int              subfr_length,       /* I    Input signal subframe length (incl. D preceding samples)    */
63*a58d3d2aSXin Li     const opus_int              nb_subfr,           /* I    Number of subframes stacked in x                            */
64*a58d3d2aSXin Li     const opus_int              D,                  /* I    Order                                                       */
65*a58d3d2aSXin Li     int                         arch                /* I    Run-time architecture                                       */);
66*a58d3d2aSXin Li 
/* Run-time CPU detection build: silk_burg_modified() calls through the
 * SILK_BURG_MODIFIED_IMPL table. `arch` is masked with OPUS_ARCHMASK to form
 * the table index and is also forwarded unchanged as the last argument, so the
 * argument expression is expanded twice -- pass a side-effect-free value. */
#   define OVERRIDE_silk_burg_modified
#   define silk_burg_modified(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch) \
     ((*SILK_BURG_MODIFIED_IMPL[(arch) & OPUS_ARCHMASK])(res_nrg, res_nrg_Q, A_Q16, x, minInvGain_Q30, subfr_length, nb_subfr, D, arch))
70*a58d3d2aSXin Li 
71*a58d3d2aSXin Li #  endif
72*a58d3d2aSXin Li 
73*a58d3d2aSXin Li opus_int64 silk_inner_prod16_sse4_1(
74*a58d3d2aSXin Li     const opus_int16 *inVec1,
75*a58d3d2aSXin Li     const opus_int16 *inVec2,
76*a58d3d2aSXin Li     const opus_int   len
77*a58d3d2aSXin Li );
78*a58d3d2aSXin Li 
79*a58d3d2aSXin Li 
80*a58d3d2aSXin Li #  if defined(OPUS_X86_PRESUME_SSE4_1)
81*a58d3d2aSXin Li 
/* SSE4.1 is presumed at build time, so silk_inner_prod16() binds directly to
 * the SSE4.1 routine. That routine takes no `arch` parameter; the (void) cast
 * still evaluates the caller's expression exactly once and discards it, which
 * keeps the four-argument call shape warning-free. */
#   define OVERRIDE_silk_inner_prod16
#   define silk_inner_prod16(inVec1, inVec2, len, arch) \
       ((void)(arch), silk_inner_prod16_sse4_1(inVec1, inVec2, len))
85*a58d3d2aSXin Li 
86*a58d3d2aSXin Li #  elif defined(OPUS_HAVE_RTCD)
87*a58d3d2aSXin Li 
88*a58d3d2aSXin Li extern opus_int64 (*const SILK_INNER_PROD16_IMPL[OPUS_ARCHMASK + 1])(
89*a58d3d2aSXin Li                     const opus_int16 *inVec1,
90*a58d3d2aSXin Li                     const opus_int16 *inVec2,
91*a58d3d2aSXin Li                     const opus_int   len);
92*a58d3d2aSXin Li 
/* Run-time CPU detection build: silk_inner_prod16() calls through the
 * SILK_INNER_PROD16_IMPL table, indexed by (arch & OPUS_ARCHMASK). `arch` is
 * used only to select the entry; it is not passed on to the callee. */
#   define OVERRIDE_silk_inner_prod16
#   define silk_inner_prod16(inVec1, inVec2, len, arch) \
     ((*SILK_INNER_PROD16_IMPL[(arch) & OPUS_ARCHMASK])(inVec1, inVec2, len))
96*a58d3d2aSXin Li 
97*a58d3d2aSXin Li #  endif
98*a58d3d2aSXin Li # endif
99*a58d3d2aSXin Li #endif
100