/* Copyright (c) 2003-2008 Jean-Marc Valin
   Copyright (c) 2007-2008 CSIRO
   Copyright (c) 2007-2009 Xiph.Org Foundation
   Written by Jean-Marc Valin */
/**
   @file arch.h
   @brief Various architecture definitions for CELT
*/
/*
   Redistribution and use in source and binary forms, with or without
   modification, are permitted provided that the following conditions
   are met:

   - Redistributions of source code must retain the above copyright
   notice, this list of conditions and the following disclaimer.

   - Redistributions in binary form must reproduce the above copyright
   notice, this list of conditions and the following disclaimer in the
   documentation and/or other materials provided with the distribution.

   THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
   ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
   LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
   A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
   OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
   EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
   PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
   PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
   LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
   NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
   SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
33*a58d3d2aSXin Li
34*a58d3d2aSXin Li #ifndef ARCH_H
35*a58d3d2aSXin Li #define ARCH_H
36*a58d3d2aSXin Li
37*a58d3d2aSXin Li #include "opus_types.h"
38*a58d3d2aSXin Li #include "opus_defines.h"
39*a58d3d2aSXin Li
/* Fallback definition of __GNUC_PREREQ(maj, min) for environments whose
   system headers have not already provided it.
   - When both __GNUC__ and __GNUC_MINOR__ are defined, it is non-zero iff
     the compiler version is at least maj.min.
   - Otherwise it always evaluates to 0. */
# if !defined(__GNUC_PREREQ)
#  if defined(__GNUC__)&&defined(__GNUC_MINOR__)
#   define __GNUC_PREREQ(_maj,_min) \
 ((__GNUC__<<16)+__GNUC_MINOR__>=((_maj)<<16)+(_min))
#  else
#   define __GNUC_PREREQ(_maj,_min) 0
#  endif
# endif
48*a58d3d2aSXin Li
49*a58d3d2aSXin Li #if OPUS_GNUC_PREREQ(3, 0)
50*a58d3d2aSXin Li #define opus_likely(x) (__builtin_expect(!!(x), 1))
51*a58d3d2aSXin Li #define opus_unlikely(x) (__builtin_expect(!!(x), 0))
52*a58d3d2aSXin Li #else
53*a58d3d2aSXin Li #define opus_likely(x) (!!(x))
54*a58d3d2aSXin Li #define opus_unlikely(x) (!!(x))
55*a58d3d2aSXin Li #endif
56*a58d3d2aSXin Li
/* Scale factor applied by the floating-point SCALEIN()/SCALEOUT() macros. */
#define CELT_SIG_SCALE 32768.f

/* Reports a fatal error through celt_fatal(), tagging it with the current
   source file and line. NOTE: the expansion already ends with ';', so
   "CELT_FATAL(msg);" produces an extra empty statement. The trailing ';'
   is kept because call sites may rely on it. */
#define CELT_FATAL(str) celt_fatal(str, __FILE__, __LINE__);
60*a58d3d2aSXin Li
61*a58d3d2aSXin Li #if defined(ENABLE_ASSERTIONS) || defined(ENABLE_HARDENING)
/* Prototype of the fatal-error handler invoked by CELT_FATAL().
   Marked noreturn for GNU-compatible compilers. */
#ifdef __GNUC__
__attribute__((noreturn))
#endif
void celt_fatal(const char *str, const char *file, int line);
66*a58d3d2aSXin Li
67*a58d3d2aSXin Li #if defined(CELT_C) && !defined(OVERRIDE_celt_fatal)
68*a58d3d2aSXin Li #include <stdio.h>
69*a58d3d2aSXin Li #include <stdlib.h>
/* Fatal-error handler: prints a diagnostic to stderr and aborts.
   str  - description of the failure
   file - source file that reported it
   line - line number within that file
   Never returns. On MSVC the CRT's abort message is switched off first via
   _set_abort_behavior(), so only the line printed here is emitted. */
#ifdef __GNUC__
__attribute__((noreturn))
#endif
void celt_fatal(const char *str, const char *file, int line)
{
   fprintf(stderr, "Fatal (internal) error in %s, line %d: %s\n", file, line, str);
#if defined(_MSC_VER)
   _set_abort_behavior( 0, _WRITE_ABORT_MSG);
#endif
   abort();
}
81*a58d3d2aSXin Li #endif
82*a58d3d2aSXin Li
/* Assertion macros used when ENABLE_ASSERTIONS or ENABLE_HARDENING is set.
   A failed condition is reported through CELT_FATAL() with the stringified
   condition; celt_assert2() appends an extra message on a new line.
   MUST_SUCCEED() asserts that a call returned OPUS_OK.
   These expand to a braced block, not do { } while (0), so they must not be
   used as the unbraced body of an "if" that has an "else". */
#define celt_assert(cond) {if (!(cond)) {CELT_FATAL("assertion failed: " #cond);}}
#define celt_assert2(cond, message) {if (!(cond)) {CELT_FATAL("assertion failed: " #cond "\n" message);}}
#define MUST_SUCCEED(call) celt_assert((call) == OPUS_OK)
86*a58d3d2aSXin Li #else
/* Variants used when neither ENABLE_ASSERTIONS nor ENABLE_HARDENING is set.
   celt_assert()/celt_assert2() expand to nothing, so the condition is not
   evaluated. MUST_SUCCEED() still evaluates the call; if the result is not
   OPUS_OK it runs RESTORE_STACK and returns OPUS_INTERNAL_ERROR from the
   enclosing function. */
#define celt_assert(cond)
#define celt_assert2(cond, message)
#define MUST_SUCCEED(call) do {if((call) != OPUS_OK) {RESTORE_STACK; return OPUS_INTERNAL_ERROR;} } while (0)
90*a58d3d2aSXin Li #endif
91*a58d3d2aSXin Li
/* Signal assertion: active only when ENABLE_ASSERTIONS is defined
   (ENABLE_HARDENING alone does not enable it). When inactive it expands to
   nothing and the condition is not evaluated. */
#if defined(ENABLE_ASSERTIONS)
#define celt_sig_assert(cond) {if (!(cond)) {CELT_FATAL("signal assertion failed: " #cond);}}
#else
#define celt_sig_assert(cond)
#endif
97*a58d3d2aSXin Li
/* Plain product of the two operands. */
#define IMUL32(a,b) ((a)*(b))

/* NOTE: each MIN/MAX macro names its arguments twice, so an argument with
   side effects (e.g. i++) may be evaluated twice. */
#define MIN16(a,b) ((a) < (b) ? (a) : (b))   /**< Minimum 16-bit value.   */
#define MAX16(a,b) ((a) > (b) ? (a) : (b))   /**< Maximum 16-bit value.   */
#define MIN32(a,b) ((a) < (b) ? (a) : (b))   /**< Minimum 32-bit value.   */
#define MAX32(a,b) ((a) > (b) ? (a) : (b))   /**< Maximum 32-bit value.   */
#define IMIN(a,b) ((a) < (b) ? (a) : (b))   /**< Minimum int value.   */
#define IMAX(a,b) ((a) > (b) ? (a) : (b))   /**< Maximum int value.   */
/* Plain sum/difference; presumably meant for unsigned 32-bit operands,
   where wrap-around is well defined (confirm against callers). */
#define UADD32(a,b) ((a)+(b))
#define USUB32(a,b) ((a)-(b))
108*a58d3d2aSXin Li
/* Set this if opus_int64 is a native type of the CPU. */
/* Assume that all LP64 architectures have fast 64-bit types; also x86_64
   (which can be ILP32 for x32) and Win64 (which is LLP64). */
#if defined(__x86_64__) || defined(__LP64__) || defined(_WIN64)
#define OPUS_FAST_INT64 1
#else
#define OPUS_FAST_INT64 0
#endif
117*a58d3d2aSXin Li
/* Expands to nothing in this header; the argument is discarded. */
#define PRINT_MIPS(file)
119*a58d3d2aSXin Li
120*a58d3d2aSXin Li #ifdef FIXED_POINT
121*a58d3d2aSXin Li
122*a58d3d2aSXin Li typedef opus_int16 opus_val16;
123*a58d3d2aSXin Li typedef opus_int32 opus_val32;
124*a58d3d2aSXin Li typedef opus_int64 opus_val64;
125*a58d3d2aSXin Li
126*a58d3d2aSXin Li typedef opus_val32 celt_sig;
127*a58d3d2aSXin Li typedef opus_val16 celt_norm;
128*a58d3d2aSXin Li typedef opus_val32 celt_ener;
129*a58d3d2aSXin Li
/* Fixed-point build: the argument is ignored and the result is always 0. */
#define celt_isnan(x) 0

#define Q15ONE 32767

#define SIG_SHIFT 12
/* Safe saturation value for 32-bit signals. Should be less than
   2^31*(1-0.85) to avoid blowing up on DC at deemphasis.*/
#define SIG_SAT (300000000)

#define NORM_SCALING 16384

#define DB_SHIFT 10

#define EPSILON 1
#define VERY_SMALL 0
#define VERY_LARGE16 ((opus_val16)32767)
#define Q15_ONE ((opus_val16)32767)

/* Identity in the fixed-point build. */
#define SCALEIN(a)      (a)
#define SCALEOUT(a)     (a)

/* Absolute value. The argument is named twice, so avoid side effects. */
#define ABS16(x) ((x) < 0 ? (-(x)) : (x))
#define ABS32(x) ((x) < 0 ? (-(x)) : (x))
153*a58d3d2aSXin Li
SAT16(opus_int32 x)154*a58d3d2aSXin Li static OPUS_INLINE opus_int16 SAT16(opus_int32 x) {
155*a58d3d2aSXin Li return x > 32767 ? 32767 : x < -32768 ? -32768 : (opus_int16)x;
156*a58d3d2aSXin Li }
157*a58d3d2aSXin Li
158*a58d3d2aSXin Li #ifdef FIXED_DEBUG
159*a58d3d2aSXin Li #include "fixed_debug.h"
160*a58d3d2aSXin Li #else
161*a58d3d2aSXin Li
162*a58d3d2aSXin Li #include "fixed_generic.h"
163*a58d3d2aSXin Li
164*a58d3d2aSXin Li #ifdef OPUS_ARM_PRESUME_AARCH64_NEON_INTR
165*a58d3d2aSXin Li #include "arm/fixed_arm64.h"
166*a58d3d2aSXin Li #elif defined (OPUS_ARM_INLINE_EDSP)
167*a58d3d2aSXin Li #include "arm/fixed_armv5e.h"
168*a58d3d2aSXin Li #elif defined (OPUS_ARM_INLINE_ASM)
169*a58d3d2aSXin Li #include "arm/fixed_armv4.h"
170*a58d3d2aSXin Li #elif defined (BFIN_ASM)
171*a58d3d2aSXin Li #include "fixed_bfin.h"
172*a58d3d2aSXin Li #elif defined (TI_C5X_ASM)
173*a58d3d2aSXin Li #include "fixed_c5x.h"
174*a58d3d2aSXin Li #elif defined (TI_C6X_ASM)
175*a58d3d2aSXin Li #include "fixed_c6x.h"
176*a58d3d2aSXin Li #endif
177*a58d3d2aSXin Li
178*a58d3d2aSXin Li #endif
179*a58d3d2aSXin Li
180*a58d3d2aSXin Li #else /* FIXED_POINT */
181*a58d3d2aSXin Li
/* Floating-point build: every value type is a plain float. */
typedef float opus_val16;
typedef float opus_val32;
typedef float opus_val64;

typedef float celt_sig;
typedef float celt_norm;
typedef float celt_ener;
189*a58d3d2aSXin Li
#ifdef FLOAT_APPROX
/* Detects NaN by inspecting the bit pattern of the float rather than by a
   floating-point comparison, so it should keep working even when -ffast-math
   is used. Assumes IEEE 754 single-precision format.
   Returns non-zero only when the exponent bits are all ones AND the mantissa
   is non-zero, i.e. for NaN. Infinities (all-ones exponent, zero mantissa)
   are NOT reported: the result for them is 0. */
static OPUS_INLINE int celt_isnan(float x)
{
   union {float f; opus_uint32 i;} bits;
   bits.f = x;
   return ((bits.i>>23)&0xFF)==0xFF && (bits.i&0x007FFFFF)!=0;
}
#else
#ifdef __FAST_MATH__
#error Cannot build libopus with -ffast-math unless FLOAT_APPROX is defined. This could result in crashes on extreme (e.g. NaN) input
#endif
/* A NaN is the only value that compares unequal to itself. */
#define celt_isnan(x) ((x)!=(x))
#endif
205*a58d3d2aSXin Li
/* Floating-point counterparts of the fixed-point constants. */
#define Q15ONE 1.0f

#define NORM_SCALING 1.f

#define EPSILON 1e-15f
#define VERY_SMALL 1e-30f
#define VERY_LARGE16 1e15f
#define Q15_ONE ((opus_val16)1.f)
214*a58d3d2aSXin Li
/* This appears to be the same speed as C99's fabsf() but it's more portable. */
/* Both macros call fabs(), so <math.h> must be visible wherever they are
   expanded. */
#define ABS16(x) ((float)fabs(x))
#define ABS32(x) ((float)fabs(x))
218*a58d3d2aSXin Li
/* Floating-point build: Q-format constants are used as-is; the "bits"
   argument is ignored. */
#define QCONST16(x,bits) (x)
#define QCONST32(x,bits) (x)

/* Negation, and width conversions that are identities for float. */
#define NEG16(x) (-(x))
#define NEG32(x) (-(x))
#define NEG32_ovflw(x) (-(x))
#define EXTRACT16(x) (x)
#define EXTEND32(x) (x)
/* Shifts are no-ops for float: the shift amount is ignored. */
#define SHR16(a,shift) (a)
#define SHL16(a,shift) (a)
#define SHR32(a,shift) (a)
#define SHL32(a,shift) (a)
#define PSHR32(a,shift) (a)
#define VSHR32(a,shift) (a)

#define PSHR(a,shift)   (a)
#define SHR(a,shift)    (a)
#define SHL(a,shift)    (a)
/* Saturation is a no-op for float: the bound is ignored. */
#define SATURATE(x,a)   (x)
#define SATURATE16(x)   (x)

/* Rounding shifts are no-ops; halving is a multiply by 0.5. */
#define ROUND16(a,shift)  (a)
#define SROUND16(a,shift) (a)
#define HALF16(x)       (.5f*(x))
#define HALF32(x)       (.5f*(x))
244*a58d3d2aSXin Li
/* Floating-point build: the fixed-point arithmetic operators reduce to
   ordinary float addition, subtraction, multiplication and division. */
#define ADD16(a,b) ((a)+(b))
#define SUB16(a,b) ((a)-(b))
#define ADD32(a,b) ((a)+(b))
#define SUB32(a,b) ((a)-(b))
#define ADD32_ovflw(a,b) ((a)+(b))
#define SUB32_ovflw(a,b) ((a)-(b))
#define MULT16_16_16(a,b)     ((a)*(b))
#define MULT16_16(a,b)     ((opus_val32)(a)*(opus_val32)(b))
#define MAC16_16(c,a,b)     ((c)+(opus_val32)(a)*(opus_val32)(b))

#define MULT16_32_Q15(a,b)     ((a)*(b))
#define MULT16_32_Q16(a,b)     ((a)*(b))

#define MULT32_32_Q31(a,b)     ((a)*(b))

/* Multiply-accumulate: c + a*b. */
#define MAC16_32_Q15(c,a,b)     ((c)+(a)*(b))
#define MAC16_32_Q16(c,a,b)     ((c)+(a)*(b))

#define MULT16_16_Q11_32(a,b)     ((a)*(b))
#define MULT16_16_Q11(a,b)     ((a)*(b))
#define MULT16_16_Q13(a,b)     ((a)*(b))
#define MULT16_16_Q14(a,b)     ((a)*(b))
#define MULT16_16_Q15(a,b)     ((a)*(b))
#define MULT16_16_P15(a,b)     ((a)*(b))
#define MULT16_16_P13(a,b)     ((a)*(b))
#define MULT16_16_P14(a,b)     ((a)*(b))
#define MULT16_32_P16(a,b)     ((a)*(b))

/* Division after casting both operands to the value types. */
#define DIV32_16(a,b)     (((opus_val32)(a))/(opus_val16)(b))
#define DIV32(a,b)     (((opus_val32)(a))/(opus_val32)(b))
275*a58d3d2aSXin Li
/* Floating-point build: SCALEIN() multiplies by CELT_SIG_SCALE and
   SCALEOUT() multiplies by its reciprocal. */
#define SCALEIN(a)      ((a)*CELT_SIG_SCALE)
#define SCALEOUT(a)     ((a)*(1/CELT_SIG_SCALE))

/* Identity in the floating-point build. */
#define SIG2WORD16(x) (x)
280*a58d3d2aSXin Li
281*a58d3d2aSXin Li #endif /* !FIXED_POINT */
282*a58d3d2aSXin Li
/* Default for GLOBAL_STACK_SIZE; define it before this point to override.
   Fixed-point and floating-point builds use the same default, so no
   FIXED_POINT split is needed. */
#ifndef GLOBAL_STACK_SIZE
#define GLOBAL_STACK_SIZE 120000
#endif
290*a58d3d2aSXin Li
291*a58d3d2aSXin Li #endif /* ARCH_H */
292