1*344a7f5eSAndroid Build Coastguard Worker /*===---- f16cintrin.h - F16C intrinsics -----------------------------------===
2*344a7f5eSAndroid Build Coastguard Worker *
3*344a7f5eSAndroid Build Coastguard Worker * Permission is hereby granted, free of charge, to any person obtaining a copy
4*344a7f5eSAndroid Build Coastguard Worker * of this software and associated documentation files (the "Software"), to deal
5*344a7f5eSAndroid Build Coastguard Worker * in the Software without restriction, including without limitation the rights
6*344a7f5eSAndroid Build Coastguard Worker * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
7*344a7f5eSAndroid Build Coastguard Worker * copies of the Software, and to permit persons to whom the Software is
8*344a7f5eSAndroid Build Coastguard Worker * furnished to do so, subject to the following conditions:
9*344a7f5eSAndroid Build Coastguard Worker *
10*344a7f5eSAndroid Build Coastguard Worker * The above copyright notice and this permission notice shall be included in
11*344a7f5eSAndroid Build Coastguard Worker * all copies or substantial portions of the Software.
12*344a7f5eSAndroid Build Coastguard Worker *
13*344a7f5eSAndroid Build Coastguard Worker * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14*344a7f5eSAndroid Build Coastguard Worker * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
15*344a7f5eSAndroid Build Coastguard Worker * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
16*344a7f5eSAndroid Build Coastguard Worker * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
17*344a7f5eSAndroid Build Coastguard Worker * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
18*344a7f5eSAndroid Build Coastguard Worker * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
19*344a7f5eSAndroid Build Coastguard Worker * THE SOFTWARE.
20*344a7f5eSAndroid Build Coastguard Worker *
21*344a7f5eSAndroid Build Coastguard Worker *===-----------------------------------------------------------------------===
22*344a7f5eSAndroid Build Coastguard Worker */
23*344a7f5eSAndroid Build Coastguard Worker
24*344a7f5eSAndroid Build Coastguard Worker #if !defined __X86INTRIN_H && !defined __EMMINTRIN_H && !defined __IMMINTRIN_H
25*344a7f5eSAndroid Build Coastguard Worker #error "Never use <f16cintrin.h> directly; include <emmintrin.h> instead."
26*344a7f5eSAndroid Build Coastguard Worker #endif
27*344a7f5eSAndroid Build Coastguard Worker
28*344a7f5eSAndroid Build Coastguard Worker #ifndef __F16CINTRIN_H
29*344a7f5eSAndroid Build Coastguard Worker #define __F16CINTRIN_H
30*344a7f5eSAndroid Build Coastguard Worker
/* Attribute set applied to every inline function defined in this header:
 * always inline, no debug info, and the "f16c" target feature. */
#define __DEFAULT_FN_ATTRS                                                     \
  __attribute__((__always_inline__, __nodebug__, __target__("f16c")))
34*344a7f5eSAndroid Build Coastguard Worker
35*344a7f5eSAndroid Build Coastguard Worker /// \brief Converts a 16-bit half-precision float value into a 32-bit float
36*344a7f5eSAndroid Build Coastguard Worker /// value.
37*344a7f5eSAndroid Build Coastguard Worker ///
38*344a7f5eSAndroid Build Coastguard Worker /// \headerfile <x86intrin.h>
39*344a7f5eSAndroid Build Coastguard Worker ///
40*344a7f5eSAndroid Build Coastguard Worker /// This intrinsic corresponds to the \c VCVTPH2PS instruction.
41*344a7f5eSAndroid Build Coastguard Worker ///
42*344a7f5eSAndroid Build Coastguard Worker /// \param __a
43*344a7f5eSAndroid Build Coastguard Worker /// A 16-bit half-precision float value.
44*344a7f5eSAndroid Build Coastguard Worker /// \returns The converted 32-bit float value.
45*344a7f5eSAndroid Build Coastguard Worker static __inline float __DEFAULT_FN_ATTRS
_cvtsh_ss(unsigned short __a)46*344a7f5eSAndroid Build Coastguard Worker _cvtsh_ss(unsigned short __a)
47*344a7f5eSAndroid Build Coastguard Worker {
48*344a7f5eSAndroid Build Coastguard Worker __v8hi v = {(short)__a, 0, 0, 0, 0, 0, 0, 0};
49*344a7f5eSAndroid Build Coastguard Worker __v4sf r = __builtin_ia32_vcvtph2ps(v);
50*344a7f5eSAndroid Build Coastguard Worker return r[0];
51*344a7f5eSAndroid Build Coastguard Worker }
52*344a7f5eSAndroid Build Coastguard Worker
/// \brief Converts one 32-bit single-precision float value into a 16-bit
///    half-precision float value.
///
/// \headerfile <x86intrin.h>
///
/// \code
/// unsigned short _cvtss_sh(float a, const int imm);
/// \endcode
///
/// This intrinsic corresponds to the \c VCVTPS2PH instruction.
///
/// \param a
///    The 32-bit single-precision float value to convert. It becomes element 0
///    of a [4 x float] vector whose other three elements are zero.
/// \param imm
///    An immediate value; bits [2:0] select the rounding mode: \n
///    000: Nearest \n
///    001: Down \n
///    010: Up \n
///    011: Truncate \n
///    1XX: Use MXCSR.RC for rounding
/// \returns Element 0 of the conversion result, i.e. the converted 16-bit
///    half-precision float value.
#define _cvtss_sh(a, imm)                                                      \
  ((unsigned short)(((__v8hi)__builtin_ia32_vcvtps2ph(                         \
      (__v4sf){a, 0, 0, 0}, (imm)))[0]))
78*344a7f5eSAndroid Build Coastguard Worker
/// \brief Converts the 32-bit float values of a 128-bit vector into 16-bit
///    half-precision float values, returned in a 128-bit vector.
///
/// \headerfile <x86intrin.h>
///
/// \code
/// __m128i _mm_cvtps_ph(__m128 a, const int imm);
/// \endcode
///
/// This intrinsic corresponds to the \c VCVTPS2PH instruction.
///
/// \param a
///    A 128-bit vector containing 32-bit float values.
/// \param imm
///    An immediate value; bits [2:0] select the rounding mode: \n
///    000: Nearest \n
///    001: Down \n
///    010: Up \n
///    011: Truncate \n
///    1XX: Use MXCSR.RC for rounding
/// \returns A 128-bit vector whose lower 64 bits hold the converted 16-bit
///    half-precision floating-point values.
#define _mm_cvtps_ph(a, imm)                                                   \
  ((__m128i)__builtin_ia32_vcvtps2ph(                                          \
      (__v4sf)(__m128)(a), (imm)))
104*344a7f5eSAndroid Build Coastguard Worker
105*344a7f5eSAndroid Build Coastguard Worker /// \brief Converts a 128-bit vector containing 16-bit half-precision float
106*344a7f5eSAndroid Build Coastguard Worker /// values into a 128-bit vector containing 32-bit float values.
107*344a7f5eSAndroid Build Coastguard Worker ///
108*344a7f5eSAndroid Build Coastguard Worker /// \headerfile <x86intrin.h>
109*344a7f5eSAndroid Build Coastguard Worker ///
110*344a7f5eSAndroid Build Coastguard Worker /// This intrinsic corresponds to the \c VCVTPH2PS instruction.
111*344a7f5eSAndroid Build Coastguard Worker ///
112*344a7f5eSAndroid Build Coastguard Worker /// \param __a
113*344a7f5eSAndroid Build Coastguard Worker /// A 128-bit vector containing 16-bit half-precision float values. The lower
114*344a7f5eSAndroid Build Coastguard Worker /// 64 bits are used in the conversion.
115*344a7f5eSAndroid Build Coastguard Worker /// \returns A 128-bit vector of [4 x float] containing converted float values.
116*344a7f5eSAndroid Build Coastguard Worker static __inline __m128 __DEFAULT_FN_ATTRS
_mm_cvtph_ps(__m128i __a)117*344a7f5eSAndroid Build Coastguard Worker _mm_cvtph_ps(__m128i __a)
118*344a7f5eSAndroid Build Coastguard Worker {
119*344a7f5eSAndroid Build Coastguard Worker return (__m128)__builtin_ia32_vcvtph2ps((__v8hi)__a);
120*344a7f5eSAndroid Build Coastguard Worker }
121*344a7f5eSAndroid Build Coastguard Worker
122*344a7f5eSAndroid Build Coastguard Worker #undef __DEFAULT_FN_ATTRS
123*344a7f5eSAndroid Build Coastguard Worker
124*344a7f5eSAndroid Build Coastguard Worker #endif /* __F16CINTRIN_H */
125