/*===---- avx512vpopcntdqvlintrin.h - AVX512VPOPCNTDQ intrinsics -----------===
 *
 *
 * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
 * See https://llvm.org/LICENSE.txt for license information.
 * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
 *
 *===-----------------------------------------------------------------------===
 */
10*bed243d3SAndroid Build Coastguard Worker #ifndef __IMMINTRIN_H
11*bed243d3SAndroid Build Coastguard Worker #error \
12*bed243d3SAndroid Build Coastguard Worker "Never use <avx512vpopcntdqvlintrin.h> directly; include <immintrin.h> instead."
13*bed243d3SAndroid Build Coastguard Worker #endif
14*bed243d3SAndroid Build Coastguard Worker
15*bed243d3SAndroid Build Coastguard Worker #ifndef __AVX512VPOPCNTDQVLINTRIN_H
16*bed243d3SAndroid Build Coastguard Worker #define __AVX512VPOPCNTDQVLINTRIN_H
17*bed243d3SAndroid Build Coastguard Worker
/* Attribute set applied to every 128-bit intrinsic in this file: force
 * inlining, omit debug info, require the avx512vpopcntdq + avx512vl target
 * features (with evex512 disabled), and declare a 128-bit minimum vector
 * width. */
#define __DEFAULT_FN_ATTRS128                                                  \
  __attribute__((__always_inline__, __nodebug__, __min_vector_width__(128),    \
                 __target__("avx512vpopcntdq,avx512vl,no-evex512")))
/* Attribute set applied to every 256-bit intrinsic in this file: force
 * inlining, omit debug info, require the avx512vpopcntdq + avx512vl target
 * features (with evex512 disabled), and declare a 256-bit minimum vector
 * width. */
#define __DEFAULT_FN_ATTRS256                                                  \
  __attribute__((__always_inline__, __nodebug__, __min_vector_width__(256),    \
                 __target__("avx512vpopcntdq,avx512vl,no-evex512")))
27*bed243d3SAndroid Build Coastguard Worker
28*bed243d3SAndroid Build Coastguard Worker static __inline__ __m128i __DEFAULT_FN_ATTRS128
_mm_popcnt_epi64(__m128i __A)29*bed243d3SAndroid Build Coastguard Worker _mm_popcnt_epi64(__m128i __A) {
30*bed243d3SAndroid Build Coastguard Worker return (__m128i)__builtin_ia32_vpopcntq_128((__v2di)__A);
31*bed243d3SAndroid Build Coastguard Worker }
32*bed243d3SAndroid Build Coastguard Worker
33*bed243d3SAndroid Build Coastguard Worker static __inline__ __m128i __DEFAULT_FN_ATTRS128
_mm_mask_popcnt_epi64(__m128i __W,__mmask8 __U,__m128i __A)34*bed243d3SAndroid Build Coastguard Worker _mm_mask_popcnt_epi64(__m128i __W, __mmask8 __U, __m128i __A) {
35*bed243d3SAndroid Build Coastguard Worker return (__m128i)__builtin_ia32_selectq_128(
36*bed243d3SAndroid Build Coastguard Worker (__mmask8)__U, (__v2di)_mm_popcnt_epi64(__A), (__v2di)__W);
37*bed243d3SAndroid Build Coastguard Worker }
38*bed243d3SAndroid Build Coastguard Worker
39*bed243d3SAndroid Build Coastguard Worker static __inline__ __m128i __DEFAULT_FN_ATTRS128
_mm_maskz_popcnt_epi64(__mmask8 __U,__m128i __A)40*bed243d3SAndroid Build Coastguard Worker _mm_maskz_popcnt_epi64(__mmask8 __U, __m128i __A) {
41*bed243d3SAndroid Build Coastguard Worker return _mm_mask_popcnt_epi64((__m128i)_mm_setzero_si128(), __U, __A);
42*bed243d3SAndroid Build Coastguard Worker }
43*bed243d3SAndroid Build Coastguard Worker
44*bed243d3SAndroid Build Coastguard Worker static __inline__ __m128i __DEFAULT_FN_ATTRS128
_mm_popcnt_epi32(__m128i __A)45*bed243d3SAndroid Build Coastguard Worker _mm_popcnt_epi32(__m128i __A) {
46*bed243d3SAndroid Build Coastguard Worker return (__m128i)__builtin_ia32_vpopcntd_128((__v4si)__A);
47*bed243d3SAndroid Build Coastguard Worker }
48*bed243d3SAndroid Build Coastguard Worker
49*bed243d3SAndroid Build Coastguard Worker static __inline__ __m128i __DEFAULT_FN_ATTRS128
_mm_mask_popcnt_epi32(__m128i __W,__mmask8 __U,__m128i __A)50*bed243d3SAndroid Build Coastguard Worker _mm_mask_popcnt_epi32(__m128i __W, __mmask8 __U, __m128i __A) {
51*bed243d3SAndroid Build Coastguard Worker return (__m128i)__builtin_ia32_selectd_128(
52*bed243d3SAndroid Build Coastguard Worker (__mmask8)__U, (__v4si)_mm_popcnt_epi32(__A), (__v4si)__W);
53*bed243d3SAndroid Build Coastguard Worker }
54*bed243d3SAndroid Build Coastguard Worker
55*bed243d3SAndroid Build Coastguard Worker static __inline__ __m128i __DEFAULT_FN_ATTRS128
_mm_maskz_popcnt_epi32(__mmask8 __U,__m128i __A)56*bed243d3SAndroid Build Coastguard Worker _mm_maskz_popcnt_epi32(__mmask8 __U, __m128i __A) {
57*bed243d3SAndroid Build Coastguard Worker return _mm_mask_popcnt_epi32((__m128i)_mm_setzero_si128(), __U, __A);
58*bed243d3SAndroid Build Coastguard Worker }
59*bed243d3SAndroid Build Coastguard Worker
60*bed243d3SAndroid Build Coastguard Worker static __inline__ __m256i __DEFAULT_FN_ATTRS256
_mm256_popcnt_epi64(__m256i __A)61*bed243d3SAndroid Build Coastguard Worker _mm256_popcnt_epi64(__m256i __A) {
62*bed243d3SAndroid Build Coastguard Worker return (__m256i)__builtin_ia32_vpopcntq_256((__v4di)__A);
63*bed243d3SAndroid Build Coastguard Worker }
64*bed243d3SAndroid Build Coastguard Worker
65*bed243d3SAndroid Build Coastguard Worker static __inline__ __m256i __DEFAULT_FN_ATTRS256
_mm256_mask_popcnt_epi64(__m256i __W,__mmask8 __U,__m256i __A)66*bed243d3SAndroid Build Coastguard Worker _mm256_mask_popcnt_epi64(__m256i __W, __mmask8 __U, __m256i __A) {
67*bed243d3SAndroid Build Coastguard Worker return (__m256i)__builtin_ia32_selectq_256(
68*bed243d3SAndroid Build Coastguard Worker (__mmask8)__U, (__v4di)_mm256_popcnt_epi64(__A), (__v4di)__W);
69*bed243d3SAndroid Build Coastguard Worker }
70*bed243d3SAndroid Build Coastguard Worker
71*bed243d3SAndroid Build Coastguard Worker static __inline__ __m256i __DEFAULT_FN_ATTRS256
_mm256_maskz_popcnt_epi64(__mmask8 __U,__m256i __A)72*bed243d3SAndroid Build Coastguard Worker _mm256_maskz_popcnt_epi64(__mmask8 __U, __m256i __A) {
73*bed243d3SAndroid Build Coastguard Worker return _mm256_mask_popcnt_epi64((__m256i)_mm256_setzero_si256(), __U, __A);
74*bed243d3SAndroid Build Coastguard Worker }
75*bed243d3SAndroid Build Coastguard Worker
76*bed243d3SAndroid Build Coastguard Worker static __inline__ __m256i __DEFAULT_FN_ATTRS256
_mm256_popcnt_epi32(__m256i __A)77*bed243d3SAndroid Build Coastguard Worker _mm256_popcnt_epi32(__m256i __A) {
78*bed243d3SAndroid Build Coastguard Worker return (__m256i)__builtin_ia32_vpopcntd_256((__v8si)__A);
79*bed243d3SAndroid Build Coastguard Worker }
80*bed243d3SAndroid Build Coastguard Worker
81*bed243d3SAndroid Build Coastguard Worker static __inline__ __m256i __DEFAULT_FN_ATTRS256
_mm256_mask_popcnt_epi32(__m256i __W,__mmask8 __U,__m256i __A)82*bed243d3SAndroid Build Coastguard Worker _mm256_mask_popcnt_epi32(__m256i __W, __mmask8 __U, __m256i __A) {
83*bed243d3SAndroid Build Coastguard Worker return (__m256i)__builtin_ia32_selectd_256(
84*bed243d3SAndroid Build Coastguard Worker (__mmask8)__U, (__v8si)_mm256_popcnt_epi32(__A), (__v8si)__W);
85*bed243d3SAndroid Build Coastguard Worker }
86*bed243d3SAndroid Build Coastguard Worker
87*bed243d3SAndroid Build Coastguard Worker static __inline__ __m256i __DEFAULT_FN_ATTRS256
_mm256_maskz_popcnt_epi32(__mmask8 __U,__m256i __A)88*bed243d3SAndroid Build Coastguard Worker _mm256_maskz_popcnt_epi32(__mmask8 __U, __m256i __A) {
89*bed243d3SAndroid Build Coastguard Worker return _mm256_mask_popcnt_epi32((__m256i)_mm256_setzero_si256(), __U, __A);
90*bed243d3SAndroid Build Coastguard Worker }
91*bed243d3SAndroid Build Coastguard Worker
/* Drop the file-local attribute macros so they are no longer defined after
 * this header. */
#undef __DEFAULT_FN_ATTRS256
#undef __DEFAULT_FN_ATTRS128
94*bed243d3SAndroid Build Coastguard Worker
95*bed243d3SAndroid Build Coastguard Worker #endif
96