xref: /aosp_15_r20/external/libopus/celt/ecintrin.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /* Copyright (c) 2003-2008 Timothy B. Terriberry
2*a58d3d2aSXin Li    Copyright (c) 2008 Xiph.Org Foundation */
3*a58d3d2aSXin Li /*
4*a58d3d2aSXin Li    Redistribution and use in source and binary forms, with or without
5*a58d3d2aSXin Li    modification, are permitted provided that the following conditions
6*a58d3d2aSXin Li    are met:
7*a58d3d2aSXin Li 
8*a58d3d2aSXin Li    - Redistributions of source code must retain the above copyright
9*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer.
10*a58d3d2aSXin Li 
11*a58d3d2aSXin Li    - Redistributions in binary form must reproduce the above copyright
12*a58d3d2aSXin Li    notice, this list of conditions and the following disclaimer in the
13*a58d3d2aSXin Li    documentation and/or other materials provided with the distribution.
14*a58d3d2aSXin Li 
15*a58d3d2aSXin Li    THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
16*a58d3d2aSXin Li    ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
17*a58d3d2aSXin Li    LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
18*a58d3d2aSXin Li    A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
19*a58d3d2aSXin Li    OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
20*a58d3d2aSXin Li    EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21*a58d3d2aSXin Li    PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
22*a58d3d2aSXin Li    PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
23*a58d3d2aSXin Li    LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
24*a58d3d2aSXin Li    NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
25*a58d3d2aSXin Li    SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26*a58d3d2aSXin Li */
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li /*Some common macros for potential platform-specific optimization.*/
29*a58d3d2aSXin Li #include "opus_types.h"
30*a58d3d2aSXin Li #include <math.h>
31*a58d3d2aSXin Li #include <limits.h>
32*a58d3d2aSXin Li #include "arch.h"
33*a58d3d2aSXin Li #if !defined(_ecintrin_H)
34*a58d3d2aSXin Li # define _ecintrin_H (1)
35*a58d3d2aSXin Li 
/*Some specific platforms may have optimized intrinsic or inline assembly
   versions of these functions which can substantially improve performance.
  We define macros for them to allow easy incorporation of these non-ANSI
   features.*/
40*a58d3d2aSXin Li 
/*Branchless minimum of two integer values.
  Modern gcc (4.x) can compile the naive versions of min and max with cmov if
   given an appropriate architecture, but the branchless bit-twiddling versions
   are just as fast, and do not require any special target architecture.
  Earlier gcc versions (3.x) compiled both versions to the same assembly
   instructions, because of the way they represented the comparison
   internally.
  -((_b)<(_a)) is an all-ones mask when _b is the smaller value and zero
   otherwise, so the XOR below yields _b in the first case and _a in the
   second.
  The XOR form is used instead of (_a)+(((_b)-(_a))&mask) because the
   subtraction in that form overflows for signed operands that are far apart.
  Both arguments are evaluated more than once, so they must be free of side
   effects.*/
# define EC_MINI(_a,_b)      ((_a)^(((_a)^(_b))&-((_b)<(_a))))
47*a58d3d2aSXin Li 
48*a58d3d2aSXin Li /*Count leading zeros.
49*a58d3d2aSXin Li   This macro should only be used for implementing ec_ilog(), if it is defined.
50*a58d3d2aSXin Li   All other code should use EC_ILOG() instead.*/
51*a58d3d2aSXin Li #if defined(_MSC_VER) && (_MSC_VER >= 1400)
52*a58d3d2aSXin Li #if defined(_MSC_VER) && (_MSC_VER >= 1910)
53*a58d3d2aSXin Li # include <intrin0.h> /* Improve compiler throughput. */
54*a58d3d2aSXin Li #else
55*a58d3d2aSXin Li # include <intrin.h>
56*a58d3d2aSXin Li #endif
57*a58d3d2aSXin Li /*In _DEBUG mode this is not an intrinsic by default.*/
58*a58d3d2aSXin Li # pragma intrinsic(_BitScanReverse)
59*a58d3d2aSXin Li 
/*Thin wrapper around the _BitScanReverse intrinsic: returns the bit index it
   stores for _x, converted to int.
  The intrinsic's own return value is ignored and a zero argument gets no
   special handling here.*/
static __inline int ec_bsr(unsigned long _x)
{
  unsigned long msb_index;
  _BitScanReverse(&msb_index,_x);
  return (int)msb_index;
}
/*EC_CLZ() is the negated bit index here, so with EC_CLZ0 set to 1 the
   expression EC_CLZ0-EC_CLZ(_v) evaluates to ec_bsr(_v)+1.*/
# define EC_CLZ0    (1)
# define EC_CLZ(_v) (-ec_bsr(_v))
67*a58d3d2aSXin Li #elif defined(ENABLE_TI_DSPLIB)
68*a58d3d2aSXin Li # include "dsplib.h"
/*TI DSPLIB build: EC_CLZ() forwards to _lnorm(), and EC_CLZ0 is 31 so that
   EC_CLZ0-EC_CLZ(_v) evaluates to 31-_lnorm(_v).*/
# define EC_CLZ0    (31)
# define EC_CLZ(_v) (_lnorm(_v))
71*a58d3d2aSXin Li #elif __GNUC_PREREQ(3,4)
/*Pick the gcc builtin by operand width: __builtin_clz() on unsigned when int
   has at least 32 bits, otherwise __builtin_clzl() on unsigned long.
  EC_CLZ0 is sizeof(operand type)*CHAR_BIT for whichever builtin is chosen.
  If neither type qualifies, EC_CLZ is left undefined.*/
# if INT_MAX<2147483647
#  if LONG_MAX>=2147483647L
#   define EC_CLZ0    (CHAR_BIT*(int)sizeof(unsigned long))
#   define EC_CLZ(_v) (__builtin_clzl(_v))
#  endif
# else
#  define EC_CLZ0    (CHAR_BIT*(int)sizeof(unsigned))
#  define EC_CLZ(_v) (__builtin_clz(_v))
# endif
79*a58d3d2aSXin Li #endif
80*a58d3d2aSXin Li 
81*a58d3d2aSXin Li #if defined(EC_CLZ)
82*a58d3d2aSXin Li /*Note that __builtin_clz is not defined when _x==0, according to the gcc
83*a58d3d2aSXin Li    documentation (and that of the BSR instruction that implements it on x86).
84*a58d3d2aSXin Li   The majority of the time we can never pass it zero.
85*a58d3d2aSXin Li   When we need to, it can be special cased.*/
86*a58d3d2aSXin Li # define EC_ILOG(_x) (EC_CLZ0-EC_CLZ(_x))
87*a58d3d2aSXin Li #else
88*a58d3d2aSXin Li int ec_ilog(opus_uint32 _v);
89*a58d3d2aSXin Li # define EC_ILOG(_x) (ec_ilog(_x))
90*a58d3d2aSXin Li #endif
91*a58d3d2aSXin Li #endif
92