xref: /aosp_15_r20/external/libopus/silk/macros.h (revision a58d3d2adb790c104798cd88c8a3aff4fa8b82cc)
1*a58d3d2aSXin Li /***********************************************************************
2*a58d3d2aSXin Li Copyright (c) 2006-2011, Skype Limited. All rights reserved.
3*a58d3d2aSXin Li Redistribution and use in source and binary forms, with or without
4*a58d3d2aSXin Li modification, are permitted provided that the following conditions
5*a58d3d2aSXin Li are met:
6*a58d3d2aSXin Li - Redistributions of source code must retain the above copyright notice,
7*a58d3d2aSXin Li this list of conditions and the following disclaimer.
8*a58d3d2aSXin Li - Redistributions in binary form must reproduce the above copyright
9*a58d3d2aSXin Li notice, this list of conditions and the following disclaimer in the
10*a58d3d2aSXin Li documentation and/or other materials provided with the distribution.
11*a58d3d2aSXin Li - Neither the name of Internet Society, IETF or IETF Trust, nor the
12*a58d3d2aSXin Li names of specific contributors, may be used to endorse or promote
13*a58d3d2aSXin Li products derived from this software without specific prior written
14*a58d3d2aSXin Li permission.
15*a58d3d2aSXin Li THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
16*a58d3d2aSXin Li AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
17*a58d3d2aSXin Li IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
18*a58d3d2aSXin Li ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
19*a58d3d2aSXin Li LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
20*a58d3d2aSXin Li CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
21*a58d3d2aSXin Li SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
22*a58d3d2aSXin Li INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23*a58d3d2aSXin Li CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
24*a58d3d2aSXin Li ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
25*a58d3d2aSXin Li POSSIBILITY OF SUCH DAMAGE.
26*a58d3d2aSXin Li ***********************************************************************/
27*a58d3d2aSXin Li 
28*a58d3d2aSXin Li #ifndef SILK_MACROS_H
29*a58d3d2aSXin Li #define SILK_MACROS_H
30*a58d3d2aSXin Li 
31*a58d3d2aSXin Li #ifdef HAVE_CONFIG_H
32*a58d3d2aSXin Li #include "config.h"
33*a58d3d2aSXin Li #endif
34*a58d3d2aSXin Li 
35*a58d3d2aSXin Li #include "opus_types.h"
36*a58d3d2aSXin Li #include "typedef.h"
37*a58d3d2aSXin Li #include "opus_defines.h"
38*a58d3d2aSXin Li #include "arch.h"
39*a58d3d2aSXin Li 
/* This is an inline header file for general platforms. */
41*a58d3d2aSXin Li 
/* silk_SMULWB(a32, b32): (a32 * (opus_int32)((opus_int16)(b32))) >> 16.
   Only the low 16 bits of b32 take part, read as a signed 16-bit value.
   The output has to be a 32-bit int.
   Both variants expand their arguments more than once or inside casts, so
   pass expressions without side effects. */
#if OPUS_FAST_INT64
/* One widened multiply: the product is formed in 64 bits, shifted, then
   narrowed back to 32 bits. */
#define silk_SMULWB(a32, b32)            ((opus_int32)(((a32) * (opus_int64)((opus_int16)(b32))) >> 16))
#else
/* 32-bit arithmetic only: the upper and lower 16-bit halves of a32 are
   multiplied separately and the low-half product is shifted before the sum. */
#define silk_SMULWB(a32, b32)            ((((a32) >> 16) * (opus_int32)((opus_int16)(b32))) + ((((a32) & 0x0000FFFF) * (opus_int32)((opus_int16)(b32))) >> 16))
#endif
48*a58d3d2aSXin Li 
/* silk_SMLAWB(a32, b32, c32): a32 + ((b32 * (opus_int32)((opus_int16)(c32))) >> 16).
   Only the product is shifted; a32 is added afterwards. Only the low 16 bits
   of c32 take part, read as a signed 16-bit value.
   The output has to be a 32-bit int.
   Arguments may be expanded more than once; avoid side effects in them. */
#if OPUS_FAST_INT64
/* One widened multiply: the product is formed in 64 bits and shifted, a32 is
   added, and the sum is narrowed back to 32 bits. */
#define silk_SMLAWB(a32, b32, c32)       ((opus_int32)((a32) + (((b32) * (opus_int64)((opus_int16)(c32))) >> 16)))
#else
/* 32-bit arithmetic only: the two 16-bit halves of b32 are multiplied
   separately before being accumulated onto a32. */
#define silk_SMLAWB(a32, b32, c32)       ((a32) + ((((b32) >> 16) * (opus_int32)((opus_int16)(c32))) + ((((b32) & 0x0000FFFF) * (opus_int32)((opus_int16)(c32))) >> 16)))
#endif
55*a58d3d2aSXin Li 
/* silk_SMULWT(a32, b32): (a32 * (b32 >> 16)) >> 16.
   Only the top 16 bits of b32 take part; its low 16 bits are discarded by
   the shift.
   Arguments may be expanded more than once; avoid side effects in them. */
#if OPUS_FAST_INT64
/* One widened multiply: the product is formed in 64 bits, shifted, then
   narrowed back to 32 bits. */
#define silk_SMULWT(a32, b32)            ((opus_int32)(((a32) * (opus_int64)((b32) >> 16)) >> 16))
#else
/* 32-bit arithmetic only: the two 16-bit halves of a32 are multiplied by
   the top half of b32 separately. */
#define silk_SMULWT(a32, b32)            (((a32) >> 16) * ((b32) >> 16) + ((((a32) & 0x0000FFFF) * ((b32) >> 16)) >> 16))
#endif
62*a58d3d2aSXin Li 
/* silk_SMLAWT(a32, b32, c32): a32 + ((b32 * (c32 >> 16)) >> 16).
   Only the product is shifted; a32 is added afterwards. Only the top 16 bits
   of c32 take part.
   Arguments may be expanded more than once; avoid side effects in them. */
#if OPUS_FAST_INT64
/* One widened multiply: c32 is widened to 64 bits before its shift, so the
   product is formed in 64 bits; the final sum is narrowed to 32 bits. */
#define silk_SMLAWT(a32, b32, c32)       ((opus_int32)((a32) + (((b32) * ((opus_int64)(c32) >> 16)) >> 16)))
#else
/* 32-bit arithmetic only: the two 16-bit halves of b32 are multiplied by
   the top half of c32 separately and accumulated onto a32. */
#define silk_SMLAWT(a32, b32, c32)       ((a32) + (((b32) >> 16) * ((c32) >> 16)) + ((((b32) & 0x0000FFFF) * ((c32) >> 16)) >> 16))
#endif
69*a58d3d2aSXin Li 
/* silk_SMULBB(a32, b32): (opus_int32)((opus_int16)(a32)) * (opus_int32)((opus_int16)(b32)).
   Each operand is first narrowed to a signed 16-bit value, so only the low
   16 bits of a32 and b32 contribute. The output has to be a 32-bit int. */
#define silk_SMULBB(a32, b32)            ((opus_int32)((opus_int16)(a32)) * (opus_int32)((opus_int16)(b32)))
72*a58d3d2aSXin Li 
/* silk_SMLABB(a32, b32, c32): a32 + (opus_int32)((opus_int16)(b32)) * (opus_int32)((opus_int16)(c32)).
   b32 and c32 are each narrowed to a signed 16-bit value before the multiply;
   the product is then added to a32. The output has to be a 32-bit int. */
#define silk_SMLABB(a32, b32, c32)       ((a32) + ((opus_int32)((opus_int16)(b32))) * (opus_int32)((opus_int16)(c32)))
75*a58d3d2aSXin Li 
/* silk_SMULBT(a32, b32): (opus_int32)((opus_int16)(a32)) * (b32 >> 16).
   Multiplies the low 16 bits of a32 (read as a signed 16-bit value) by the
   top 16 bits of b32. */
#define silk_SMULBT(a32, b32)            ((opus_int32)((opus_int16)(a32)) * ((b32) >> 16))
78*a58d3d2aSXin Li 
/* silk_SMLABT(a32, b32, c32): a32 + (opus_int32)((opus_int16)(b32)) * (c32 >> 16).
   Multiplies the low 16 bits of b32 (read as a signed 16-bit value) by the
   top 16 bits of c32 and adds the product to a32. */
#define silk_SMLABT(a32, b32, c32)       ((a32) + ((opus_int32)((opus_int16)(b32))) * ((c32) >> 16))
81*a58d3d2aSXin Li 
/* silk_SMLAL(a64, b32, c32): a64 + (b32 * c32).
   Both factors are widened to opus_int64 before the multiply, so the product
   is formed in 64 bits. The addition is delegated to silk_ADD64, which is
   defined outside this header. */
#define silk_SMLAL(a64, b32, c32)        (silk_ADD64((a64), ((opus_int64)(b32) * (opus_int64)(c32))))
84*a58d3d2aSXin Li 
/* silk_SMULWW(a32, b32): (a32 * b32) >> 16.
   Arguments may be expanded more than once; avoid side effects in them. */
#if OPUS_FAST_INT64
/* One widened multiply: a32 is widened to 64 bits, the product is shifted,
   then narrowed back to 32 bits. */
#define silk_SMULWW(a32, b32)            ((opus_int32)(((opus_int64)(a32) * (b32)) >> 16))
#else
/* 32-bit arithmetic only: silk_SMULWB covers the low 16 bits of b32, and
   the remainder is folded in through silk_MLA with silk_RSHIFT_ROUND(b32, 16).
   NOTE(review): silk_MLA and silk_RSHIFT_ROUND are defined outside this
   header - presumably multiply-accumulate and rounding right shift; confirm
   against their definitions. */
#define silk_SMULWW(a32, b32)            silk_MLA(silk_SMULWB((a32), (b32)), (a32), silk_RSHIFT_ROUND((b32), 16))
#endif
91*a58d3d2aSXin Li 
/* silk_SMLAWW(a32, b32, c32): a32 + ((b32 * c32) >> 16).
   Only the product is shifted; a32 is added afterwards.
   Arguments may be expanded more than once; avoid side effects in them. */
#if OPUS_FAST_INT64
/* One widened multiply: b32 is widened to 64 bits, the product is shifted,
   a32 is added, and the sum is narrowed back to 32 bits. */
#define silk_SMLAWW(a32, b32, c32)       ((opus_int32)((a32) + (((opus_int64)(b32) * (c32)) >> 16)))
#else
/* 32-bit arithmetic only: silk_SMLAWB covers a32 plus the low 16 bits of
   c32, and the remainder is folded in through silk_MLA with
   silk_RSHIFT_ROUND(c32, 16).
   NOTE(review): silk_MLA and silk_RSHIFT_ROUND are defined outside this
   header - presumably multiply-accumulate and rounding right shift; confirm
   against their definitions. */
#define silk_SMLAWW(a32, b32, c32)       silk_MLA(silk_SMLAWB((a32), (b32), (c32)), (b32), silk_RSHIFT_ROUND((c32), 16))
#endif
98*a58d3d2aSXin Li 
99*a58d3d2aSXin Li /* add/subtract with output saturated */
100*a58d3d2aSXin Li /* use clang builtin overflow detectors */
silk_ADD_SAT32(opus_int32 a,opus_int32 b)101*a58d3d2aSXin Li static OPUS_INLINE opus_int32 silk_ADD_SAT32(opus_int32 a, opus_int32 b) {
102*a58d3d2aSXin Li     opus_int32 c;
103*a58d3d2aSXin Li     if (__builtin_add_overflow(a, b, &c)) {
104*a58d3d2aSXin Li         // overflowed
105*a58d3d2aSXin Li         if (a < 0)      // neg+X can only overflow towards -inf
106*a58d3d2aSXin Li             c = silk_int32_MIN;
107*a58d3d2aSXin Li         else
108*a58d3d2aSXin Li             c = silk_int32_MAX;
109*a58d3d2aSXin Li     }
110*a58d3d2aSXin Li     return c;
111*a58d3d2aSXin Li }
112*a58d3d2aSXin Li 
113*a58d3d2aSXin Li /* use clang builtin overflow detectors */
silk_SUB_SAT32(opus_int32 a,opus_int32 b)114*a58d3d2aSXin Li static OPUS_INLINE opus_int32 silk_SUB_SAT32(opus_int32 a, opus_int32 b) {
115*a58d3d2aSXin Li     opus_int32 c;
116*a58d3d2aSXin Li     if (__builtin_sub_overflow(a, b, &c)) {
117*a58d3d2aSXin Li         // overflowed,
118*a58d3d2aSXin Li         if (a < 0) // neg-X only overflows towards -inf
119*a58d3d2aSXin Li             c = silk_int32_MIN;
120*a58d3d2aSXin Li         else
121*a58d3d2aSXin Li             c = silk_int32_MAX;
122*a58d3d2aSXin Li     }
123*a58d3d2aSXin Li     return c;
124*a58d3d2aSXin Li }
125*a58d3d2aSXin Li 
126*a58d3d2aSXin Li #if defined(MIPSr1_ASM)
127*a58d3d2aSXin Li #include "mips/macros_mipsr1.h"
128*a58d3d2aSXin Li #endif
129*a58d3d2aSXin Li 
130*a58d3d2aSXin Li #include "ecintrin.h"
131*a58d3d2aSXin Li #ifndef OVERRIDE_silk_CLZ16
silk_CLZ16(opus_int16 in16)132*a58d3d2aSXin Li static OPUS_INLINE opus_int32 silk_CLZ16(opus_int16 in16)
133*a58d3d2aSXin Li {
134*a58d3d2aSXin Li     return 32 - EC_ILOG(in16<<16|0x8000);
135*a58d3d2aSXin Li }
136*a58d3d2aSXin Li #endif
137*a58d3d2aSXin Li 
138*a58d3d2aSXin Li #ifndef OVERRIDE_silk_CLZ32
silk_CLZ32(opus_int32 in32)139*a58d3d2aSXin Li static OPUS_INLINE opus_int32 silk_CLZ32(opus_int32 in32)
140*a58d3d2aSXin Li {
141*a58d3d2aSXin Li     return in32 ? 32 - EC_ILOG(in32) : 32;
142*a58d3d2aSXin Li }
143*a58d3d2aSXin Li #endif
144*a58d3d2aSXin Li 
/* Row based: element (row, column) lives at offset row*N + column from
   Matrix_base_adr, where N is the number of elements per row.
   matrix_ptr expands to the element itself (usable as an lvalue);
   matrix_adr expands to the element's address. */
#define matrix_ptr(Matrix_base_adr, row, column, N) \
    (*((Matrix_base_adr) + ((row)*(N)+(column))))
#define matrix_adr(Matrix_base_adr, row, column, N) \
      ((Matrix_base_adr) + ((row)*(N)+(column)))
150*a58d3d2aSXin Li 
/* Column based: element (row, column) lives at offset row + M*column from
   Matrix_base_adr, where M is the number of elements per column.
   Expands to the element itself (usable as an lvalue). The definition is
   skipped when matrix_c_ptr has already been defined. */
#ifndef matrix_c_ptr
#   define matrix_c_ptr(Matrix_base_adr, row, column, M) \
    (*((Matrix_base_adr) + ((row)+(M)*(column))))
#endif
156*a58d3d2aSXin Li 
157*a58d3d2aSXin Li #ifdef OPUS_ARM_INLINE_ASM
158*a58d3d2aSXin Li #include "arm/macros_armv4.h"
159*a58d3d2aSXin Li #endif
160*a58d3d2aSXin Li 
161*a58d3d2aSXin Li #ifdef OPUS_ARM_INLINE_EDSP
162*a58d3d2aSXin Li #include "arm/macros_armv5e.h"
163*a58d3d2aSXin Li #endif
164*a58d3d2aSXin Li 
165*a58d3d2aSXin Li #ifdef OPUS_ARM_PRESUME_AARCH64_NEON_INTR
166*a58d3d2aSXin Li #include "arm/macros_arm64.h"
167*a58d3d2aSXin Li #endif
168*a58d3d2aSXin Li 
169*a58d3d2aSXin Li #endif /* SILK_MACROS_H */
170*a58d3d2aSXin Li 
171