1*67e74705SXin Li // RUN: %clang_cc1 %s -triple=x86_64-apple-darwin -target-feature +ssse3 -emit-llvm -o - -Werror | FileCheck %s
2*67e74705SXin Li
3*67e74705SXin Li // Don't include mm_malloc.h, it's system specific.
4*67e74705SXin Li #define __MM_MALLOC_H
5*67e74705SXin Li
6*67e74705SXin Li #include <x86intrin.h>
7*67e74705SXin Li
8*67e74705SXin Li // NOTE: This should match the tests in llvm/test/CodeGen/X86/ssse3-intrinsics-fast-isel.ll
9*67e74705SXin Li
test_mm_abs_epi8(__m128i a)10*67e74705SXin Li __m128i test_mm_abs_epi8(__m128i a) {
11*67e74705SXin Li // CHECK-LABEL: test_mm_abs_epi8
12*67e74705SXin Li // CHECK: call <16 x i8> @llvm.x86.ssse3.pabs.b.128(<16 x i8> %{{.*}})
13*67e74705SXin Li return _mm_abs_epi8(a);
14*67e74705SXin Li }
15*67e74705SXin Li
test_mm_abs_epi16(__m128i a)16*67e74705SXin Li __m128i test_mm_abs_epi16(__m128i a) {
17*67e74705SXin Li // CHECK-LABEL: test_mm_abs_epi16
18*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.pabs.w.128(<8 x i16> %{{.*}})
19*67e74705SXin Li return _mm_abs_epi16(a);
20*67e74705SXin Li }
21*67e74705SXin Li
test_mm_abs_epi32(__m128i a)22*67e74705SXin Li __m128i test_mm_abs_epi32(__m128i a) {
23*67e74705SXin Li // CHECK-LABEL: test_mm_abs_epi32
24*67e74705SXin Li // CHECK: call <4 x i32> @llvm.x86.ssse3.pabs.d.128(<4 x i32> %{{.*}})
25*67e74705SXin Li return _mm_abs_epi32(a);
26*67e74705SXin Li }
27*67e74705SXin Li
test_mm_alignr_epi8(__m128i a,__m128i b)28*67e74705SXin Li __m128i test_mm_alignr_epi8(__m128i a, __m128i b) {
29*67e74705SXin Li // CHECK-LABEL: test_mm_alignr_epi8
30*67e74705SXin Li // CHECK: shufflevector <16 x i8> %{{.*}}, <16 x i8> %{{.*}}, <16 x i32> <i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 16, i32 17>
31*67e74705SXin Li return _mm_alignr_epi8(a, b, 2);
32*67e74705SXin Li }
33*67e74705SXin Li
test2_mm_alignr_epi8(__m128i a,__m128i b)34*67e74705SXin Li __m128i test2_mm_alignr_epi8(__m128i a, __m128i b) {
35*67e74705SXin Li // CHECK-LABEL: test2_mm_alignr_epi8
36*67e74705SXin Li // CHECK: shufflevector <16 x i8> %{{.*}}, <16 x i8> zeroinitializer, <16 x i32> <i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7, i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15, i32 16>
37*67e74705SXin Li return _mm_alignr_epi8(a, b, 17);
38*67e74705SXin Li }
39*67e74705SXin Li
test_mm_hadd_epi16(__m128i a,__m128i b)40*67e74705SXin Li __m128i test_mm_hadd_epi16(__m128i a, __m128i b) {
41*67e74705SXin Li // CHECK-LABEL: test_mm_hadd_epi16
42*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.phadd.w.128(<8 x i16> %{{.*}}, <8 x i16> %{{.*}})
43*67e74705SXin Li return _mm_hadd_epi16(a, b);
44*67e74705SXin Li }
45*67e74705SXin Li
test_mm_hadd_epi32(__m128i a,__m128i b)46*67e74705SXin Li __m128i test_mm_hadd_epi32(__m128i a, __m128i b) {
47*67e74705SXin Li // CHECK-LABEL: test_mm_hadd_epi32
48*67e74705SXin Li // CHECK: call <4 x i32> @llvm.x86.ssse3.phadd.d.128(<4 x i32> %{{.*}}, <4 x i32> %{{.*}})
49*67e74705SXin Li return _mm_hadd_epi32(a, b);
50*67e74705SXin Li }
51*67e74705SXin Li
test_mm_hadds_epi16(__m128i a,__m128i b)52*67e74705SXin Li __m128i test_mm_hadds_epi16(__m128i a, __m128i b) {
53*67e74705SXin Li // CHECK-LABEL: test_mm_hadds_epi16
54*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.phadd.sw.128(<8 x i16> %{{.*}}, <8 x i16> %{{.*}})
55*67e74705SXin Li return _mm_hadds_epi16(a, b);
56*67e74705SXin Li }
57*67e74705SXin Li
test_mm_hsub_epi16(__m128i a,__m128i b)58*67e74705SXin Li __m128i test_mm_hsub_epi16(__m128i a, __m128i b) {
59*67e74705SXin Li // CHECK-LABEL: test_mm_hsub_epi16
60*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.phsub.w.128(<8 x i16> %{{.*}}, <8 x i16> %{{.*}})
61*67e74705SXin Li return _mm_hsub_epi16(a, b);
62*67e74705SXin Li }
63*67e74705SXin Li
test_mm_hsub_epi32(__m128i a,__m128i b)64*67e74705SXin Li __m128i test_mm_hsub_epi32(__m128i a, __m128i b) {
65*67e74705SXin Li // CHECK-LABEL: test_mm_hsub_epi32
66*67e74705SXin Li // CHECK: call <4 x i32> @llvm.x86.ssse3.phsub.d.128(<4 x i32> %{{.*}}, <4 x i32> %{{.*}})
67*67e74705SXin Li return _mm_hsub_epi32(a, b);
68*67e74705SXin Li }
69*67e74705SXin Li
test_mm_hsubs_epi16(__m128i a,__m128i b)70*67e74705SXin Li __m128i test_mm_hsubs_epi16(__m128i a, __m128i b) {
71*67e74705SXin Li // CHECK-LABEL: test_mm_hsubs_epi16
72*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.phsub.sw.128(<8 x i16> %{{.*}}, <8 x i16> %{{.*}})
73*67e74705SXin Li return _mm_hsubs_epi16(a, b);
74*67e74705SXin Li }
75*67e74705SXin Li
test_mm_maddubs_epi16(__m128i a,__m128i b)76*67e74705SXin Li __m128i test_mm_maddubs_epi16(__m128i a, __m128i b) {
77*67e74705SXin Li // CHECK-LABEL: test_mm_maddubs_epi16
78*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.pmadd.ub.sw.128(<16 x i8> %{{.*}}, <16 x i8> %{{.*}})
79*67e74705SXin Li return _mm_maddubs_epi16(a, b);
80*67e74705SXin Li }
81*67e74705SXin Li
test_mm_mulhrs_epi16(__m128i a,__m128i b)82*67e74705SXin Li __m128i test_mm_mulhrs_epi16(__m128i a, __m128i b) {
83*67e74705SXin Li // CHECK-LABEL: test_mm_mulhrs_epi16
84*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.pmul.hr.sw.128(<8 x i16> %{{.*}}, <8 x i16> %{{.*}})
85*67e74705SXin Li return _mm_mulhrs_epi16(a, b);
86*67e74705SXin Li }
87*67e74705SXin Li
test_mm_shuffle_epi8(__m128i a,__m128i b)88*67e74705SXin Li __m128i test_mm_shuffle_epi8(__m128i a, __m128i b) {
89*67e74705SXin Li // CHECK-LABEL: test_mm_shuffle_epi8
90*67e74705SXin Li // CHECK: call <16 x i8> @llvm.x86.ssse3.pshuf.b.128(<16 x i8> %{{.*}}, <16 x i8> %{{.*}})
91*67e74705SXin Li return _mm_shuffle_epi8(a, b);
92*67e74705SXin Li }
93*67e74705SXin Li
test_mm_sign_epi8(__m128i a,__m128i b)94*67e74705SXin Li __m128i test_mm_sign_epi8(__m128i a, __m128i b) {
95*67e74705SXin Li // CHECK-LABEL: test_mm_sign_epi8
96*67e74705SXin Li // CHECK: call <16 x i8> @llvm.x86.ssse3.psign.b.128(<16 x i8> %{{.*}}, <16 x i8> %{{.*}})
97*67e74705SXin Li return _mm_sign_epi8(a, b);
98*67e74705SXin Li }
99*67e74705SXin Li
test_mm_sign_epi16(__m128i a,__m128i b)100*67e74705SXin Li __m128i test_mm_sign_epi16(__m128i a, __m128i b) {
101*67e74705SXin Li // CHECK-LABEL: test_mm_sign_epi16
102*67e74705SXin Li // CHECK: call <8 x i16> @llvm.x86.ssse3.psign.w.128(<8 x i16> %{{.*}}, <8 x i16> %{{.*}})
103*67e74705SXin Li return _mm_sign_epi16(a, b);
104*67e74705SXin Li }
105*67e74705SXin Li
test_mm_sign_epi32(__m128i a,__m128i b)106*67e74705SXin Li __m128i test_mm_sign_epi32(__m128i a, __m128i b) {
107*67e74705SXin Li // CHECK-LABEL: test_mm_sign_epi32
108*67e74705SXin Li // CHECK: call <4 x i32> @llvm.x86.ssse3.psign.d.128(<4 x i32> %{{.*}}, <4 x i32> %{{.*}})
109*67e74705SXin Li return _mm_sign_epi32(a, b);
110*67e74705SXin Li }
111