1*67e74705SXin Li // RUN: %clang_cc1 -triple arm64-apple-ios7 -target-feature +neon -ffreestanding -emit-llvm -o - %s | opt -S -mem2reg | FileCheck %s
2*67e74705SXin Li // RUN: %clang_cc1 -triple aarch64_be-linux-gnu -target-feature +neon -ffreestanding -emit-llvm -o - %s | opt -S -mem2reg | FileCheck %s --check-prefix CHECK-BE
3*67e74705SXin Li
4*67e74705SXin Li #include <arm_neon.h>
5*67e74705SXin Li
// Reads lane 2 of a signed 8 x i8 vector through vdupb_lane_s8.
// Default-prefix run: expects an extractelement taken directly from %src.
// BE-prefix run: expects a lane-reversing shufflevector first, with the
// extractelement applied to the reversed vector.
int8_t test_vdupb_lane_s8(int8x8_t src) {
  return vdupb_lane_s8(src, 2);
  // CHECK-LABEL: @test_vdupb_lane_s8
  // CHECK: extractelement <8 x i8> %src, i32 2

  // CHECK-BE-LABEL: @test_vdupb_lane_s8
  // CHECK-BE: [[REV:%.*]] = shufflevector <8 x i8> {{.*}}, <8 x i32> <i32 7, i32 6, i32 5, i32 4, i32 3, i32 2, i32 1, i32 0>
  // CHECK-BE: extractelement <8 x i8> [[REV]], i32 2
}

// Reads lane 2 of an unsigned 8 x i8 vector through vdupb_lane_u8.
// Default-prefix run: expects an extractelement taken directly from %src.
// BE-prefix run: expects a lane-reversing shufflevector first, with the
// extractelement applied to the reversed vector.
uint8_t test_vdupb_lane_u8(uint8x8_t src) {
  return vdupb_lane_u8(src, 2);
  // CHECK-LABEL: @test_vdupb_lane_u8
  // CHECK: extractelement <8 x i8> %src, i32 2

  // CHECK-BE-LABEL: @test_vdupb_lane_u8
  // CHECK-BE: [[REV:%.*]] = shufflevector <8 x i8> {{.*}}, <8 x i32> <i32 7, i32 6, i32 5, i32 4, i32 3, i32 2, i32 1, i32 0>
  // CHECK-BE: extractelement <8 x i8> [[REV]], i32 2
}

// Reads lane 2 of a signed 4 x i16 vector through vduph_lane_s16.
// Default-prefix run: expects %src to be bitcast to an intermediate type and
// back to <4 x i16> before the extractelement.
// BE-prefix run: expects the same bitcast round trip, but applied to a
// lane-reversed copy produced by a shufflevector.
int16_t test_vduph_lane_s16(int16x4_t src) {
  return vduph_lane_s16(src, 2);
  // CHECK-LABEL: @test_vduph_lane_s16
  // CHECK: [[TMP1:%.*]] = bitcast <4 x i16> %src to [[TYPE:.*]]
  // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <4 x i16>
  // CHECK: extractelement <4 x i16> [[TMP2]], i32 2

  // CHECK-BE-LABEL: @test_vduph_lane_s16
  // CHECK-BE: [[REV:%.*]] = shufflevector <4 x i16> {{.*}}, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  // CHECK-BE: [[TMP1:%.*]] = bitcast <4 x i16> [[REV]] to [[TYPE:.*]]
  // CHECK-BE: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <4 x i16>
  // CHECK-BE: extractelement <4 x i16> [[TMP2]], i32 2
}

// Reads lane 2 of an unsigned 4 x i16 vector through vduph_lane_u16.
// Default-prefix run: expects %src to be bitcast to an intermediate type and
// back to <4 x i16> before the extractelement.
// BE-prefix run: expects the same bitcast round trip, but applied to a
// lane-reversed copy produced by a shufflevector.
uint16_t test_vduph_lane_u16(uint16x4_t src) {
  return vduph_lane_u16(src, 2);
  // CHECK-LABEL: @test_vduph_lane_u16
  // CHECK: [[TMP1:%.*]] = bitcast <4 x i16> %src to [[TYPE:.*]]
  // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <4 x i16>
  // CHECK: extractelement <4 x i16> [[TMP2]], i32 2

  // CHECK-BE-LABEL: @test_vduph_lane_u16
  // CHECK-BE: [[REV:%.*]] = shufflevector <4 x i16> {{.*}}, <4 x i32> <i32 3, i32 2, i32 1, i32 0>
  // CHECK-BE: [[TMP1:%.*]] = bitcast <4 x i16> [[REV]] to [[TYPE:.*]]
  // CHECK-BE: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <4 x i16>
  // CHECK-BE: extractelement <4 x i16> [[TMP2]], i32 2
}

// Reads lane 0 of a signed 2 x i32 vector through vdups_lane_s32.
// Default-prefix run: expects %src to be bitcast to an intermediate type and
// back to <2 x i32> before the extractelement.
// BE-prefix run: expects the same bitcast round trip, but applied to a
// lane-reversed copy produced by a shufflevector.
int32_t test_vdups_lane_s32(int32x2_t src) {
  return vdups_lane_s32(src, 0);
  // CHECK-LABEL: @test_vdups_lane_s32
  // CHECK: [[TMP1:%.*]] = bitcast <2 x i32> %src to [[TYPE:.*]]
  // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <2 x i32>
  // CHECK: extractelement <2 x i32> [[TMP2]], i32 0

  // CHECK-BE-LABEL: @test_vdups_lane_s32
  // CHECK-BE: [[REV:%.*]] = shufflevector <2 x i32> {{.*}}, <2 x i32> <i32 1, i32 0>
  // CHECK-BE: [[TMP1:%.*]] = bitcast <2 x i32> [[REV]] to [[TYPE:.*]]
  // CHECK-BE: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <2 x i32>
  // CHECK-BE: extractelement <2 x i32> [[TMP2]], i32 0
}

// Reads lane 0 of an unsigned 2 x i32 vector through vdups_lane_u32.
// Default-prefix run: expects %src to be bitcast to an intermediate type and
// back to <2 x i32> before the extractelement.
// BE-prefix run: expects the same bitcast round trip, but applied to a
// lane-reversed copy produced by a shufflevector.
uint32_t test_vdups_lane_u32(uint32x2_t src) {
  return vdups_lane_u32(src, 0);
  // CHECK-LABEL: @test_vdups_lane_u32
  // CHECK: [[TMP1:%.*]] = bitcast <2 x i32> %src to [[TYPE:.*]]
  // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <2 x i32>
  // CHECK: extractelement <2 x i32> [[TMP2]], i32 0

  // CHECK-BE-LABEL: @test_vdups_lane_u32
  // CHECK-BE: [[REV:%.*]] = shufflevector <2 x i32> {{.*}}, <2 x i32> <i32 1, i32 0>
  // CHECK-BE: [[TMP1:%.*]] = bitcast <2 x i32> [[REV]] to [[TYPE:.*]]
  // CHECK-BE: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <2 x i32>
  // CHECK-BE: extractelement <2 x i32> [[TMP2]], i32 0
}

test_vdups_lane_f32(float32x2_t src)82*67e74705SXin Li float32_t test_vdups_lane_f32(float32x2_t src) {
83*67e74705SXin Li return vdups_lane_f32(src, 0);
84*67e74705SXin Li // CHECK-LABEL: @test_vdups_lane_f32
85*67e74705SXin Li // CHECK: [[TMP1:%.*]] = bitcast <2 x float> %src to [[TYPE:.*]]
86*67e74705SXin Li // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <2 x float>
87*67e74705SXin Li // CHECK: extractelement <2 x float> [[TMP2]], i32 0
88*67e74705SXin Li
89*67e74705SXin Li // CHECK-BE-LABEL: @test_vdups_lane_f32
90*67e74705SXin Li // CHECK-BE: [[REV:%.*]] = shufflevector <2 x float> {{.*}}, <2 x i32> <i32 1, i32 0>
91*67e74705SXin Li // CHECK-BE: [[TMP1:%.*]] = bitcast <2 x float> [[REV]] to [[TYPE:.*]]
92*67e74705SXin Li // CHECK-BE: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <2 x float>
93*67e74705SXin Li // CHECK-BE: extractelement <2 x float> [[TMP2]], i32 0
94*67e74705SXin Li }
95*67e74705SXin Li
// Reads lane 0 of a signed 1 x i64 vector through vdupd_lane_s64.
// Default-prefix run: expects %src to be bitcast to an intermediate type and
// back to <1 x i64> before the extractelement.
// BE-prefix run: only an extractelement of lane 0 is matched; no
// shufflevector pattern is required for this single-lane vector.
int64_t test_vdupd_lane_s64(int64x1_t src) {
  return vdupd_lane_s64(src, 0);
  // CHECK-LABEL: @test_vdupd_lane_s64
  // CHECK: [[TMP1:%.*]] = bitcast <1 x i64> %src to [[TYPE:.*]]
  // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <1 x i64>
  // CHECK: extractelement <1 x i64> [[TMP2]], i32 0

  // CHECK-BE-LABEL: @test_vdupd_lane_s64
  // CHECK-BE: extractelement <1 x i64> {{.*}}, i32 0
}

// Reads lane 0 of an unsigned 1 x i64 vector through vdupd_lane_u64.
// Default-prefix run: expects %src to be bitcast to an intermediate type and
// back to <1 x i64> before the extractelement.
// BE-prefix run: only an extractelement of lane 0 is matched; no
// shufflevector pattern is required for this single-lane vector.
uint64_t test_vdupd_lane_u64(uint64x1_t src) {
  return vdupd_lane_u64(src, 0);
  // CHECK-LABEL: @test_vdupd_lane_u64
  // CHECK: [[TMP1:%.*]] = bitcast <1 x i64> %src to [[TYPE:.*]]
  // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <1 x i64>
  // CHECK: extractelement <1 x i64> [[TMP2]], i32 0

  // CHECK-BE-LABEL: @test_vdupd_lane_u64
  // CHECK-BE: extractelement <1 x i64> {{.*}}, i32 0
}

test_vdupd_lane_f64(float64x1_t src)118*67e74705SXin Li float64_t test_vdupd_lane_f64(float64x1_t src) {
119*67e74705SXin Li return vdupd_lane_f64(src, 0);
120*67e74705SXin Li // CHECK-LABEL: @test_vdupd_lane_f64
121*67e74705SXin Li // CHECK: [[TMP1:%.*]] = bitcast <1 x double> %src to [[TYPE:.*]]
122*67e74705SXin Li // CHECK: [[TMP2:%.*]] = bitcast [[TYPE]] [[TMP1]] to <1 x double>
123*67e74705SXin Li // CHECK: extractelement <1 x double> [[TMP2]], i32 0
124*67e74705SXin Li
125*67e74705SXin Li // CHECK-BE-LABEL: @test_vdupd_lane_f64
126*67e74705SXin Li // CHECK-BE: extractelement <1 x double> {{.*}}, i32 0
127*67e74705SXin Li }
128