// RUN: %clang_cc1 -triple thumbv7-apple-darwin \
// RUN:   -target-abi apcs-gnu \
// RUN:   -target-cpu cortex-a8 \
// RUN:   -mfloat-abi soft \
// RUN:   -target-feature +soft-float-abi \
// RUN:   -ffreestanding \
// RUN:   -emit-llvm -w -o - %s | opt -S -mem2reg | FileCheck %s

#include <arm_neon.h>

// Check that the vget_low/vget_high intrinsics generate a single shuffle
// without any bitcasting.
low_s8(int8x16_t a)13*67e74705SXin Li int8x8_t low_s8(int8x16_t a) {
14*67e74705SXin Li // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
15*67e74705SXin Li return vget_low_s8(a);
16*67e74705SXin Li }
17*67e74705SXin Li
low_u8(uint8x16_t a)18*67e74705SXin Li uint8x8_t low_u8 (uint8x16_t a) {
19*67e74705SXin Li // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
20*67e74705SXin Li return vget_low_u8(a);
21*67e74705SXin Li }
22*67e74705SXin Li
low_s16(int16x8_t a)23*67e74705SXin Li int16x4_t low_s16( int16x8_t a) {
24*67e74705SXin Li // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
25*67e74705SXin Li return vget_low_s16(a);
26*67e74705SXin Li }
27*67e74705SXin Li
low_u16(uint16x8_t a)28*67e74705SXin Li uint16x4_t low_u16(uint16x8_t a) {
29*67e74705SXin Li // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
30*67e74705SXin Li return vget_low_u16(a);
31*67e74705SXin Li }
32*67e74705SXin Li
low_s32(int32x4_t a)33*67e74705SXin Li int32x2_t low_s32( int32x4_t a) {
34*67e74705SXin Li // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 0, i32 1>
35*67e74705SXin Li return vget_low_s32(a);
36*67e74705SXin Li }
37*67e74705SXin Li
low_u32(uint32x4_t a)38*67e74705SXin Li uint32x2_t low_u32(uint32x4_t a) {
39*67e74705SXin Li // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 0, i32 1>
40*67e74705SXin Li return vget_low_u32(a);
41*67e74705SXin Li }
42*67e74705SXin Li
low_s64(int64x2_t a)43*67e74705SXin Li int64x1_t low_s64( int64x2_t a) {
44*67e74705SXin Li // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> zeroinitializer
45*67e74705SXin Li return vget_low_s64(a);
46*67e74705SXin Li }
47*67e74705SXin Li
low_u64(uint64x2_t a)48*67e74705SXin Li uint64x1_t low_u64(uint64x2_t a) {
49*67e74705SXin Li // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> zeroinitializer
50*67e74705SXin Li return vget_low_u64(a);
51*67e74705SXin Li }
52*67e74705SXin Li
low_p8(poly8x16_t a)53*67e74705SXin Li poly8x8_t low_p8 (poly8x16_t a) {
54*67e74705SXin Li // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 0, i32 1, i32 2, i32 3, i32 4, i32 5, i32 6, i32 7>
55*67e74705SXin Li return vget_low_p8(a);
56*67e74705SXin Li }
57*67e74705SXin Li
low_p16(poly16x8_t a)58*67e74705SXin Li poly16x4_t low_p16(poly16x8_t a) {
59*67e74705SXin Li // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 0, i32 1, i32 2, i32 3>
60*67e74705SXin Li return vget_low_p16(a);
61*67e74705SXin Li }
62*67e74705SXin Li
low_f32(float32x4_t a)63*67e74705SXin Li float32x2_t low_f32(float32x4_t a) {
64*67e74705SXin Li // CHECK: shufflevector <4 x float> %a, <4 x float> %a, <2 x i32> <i32 0, i32 1>
65*67e74705SXin Li return vget_low_f32(a);
66*67e74705SXin Li }
67*67e74705SXin Li
68*67e74705SXin Li
high_s8(int8x16_t a)69*67e74705SXin Li int8x8_t high_s8(int8x16_t a) {
70*67e74705SXin Li // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
71*67e74705SXin Li return vget_high_s8(a);
72*67e74705SXin Li }
73*67e74705SXin Li
high_u8(uint8x16_t a)74*67e74705SXin Li uint8x8_t high_u8 (uint8x16_t a) {
75*67e74705SXin Li // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
76*67e74705SXin Li return vget_high_u8(a);
77*67e74705SXin Li }
78*67e74705SXin Li
high_s16(int16x8_t a)79*67e74705SXin Li int16x4_t high_s16( int16x8_t a) {
80*67e74705SXin Li // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
81*67e74705SXin Li return vget_high_s16(a);
82*67e74705SXin Li }
83*67e74705SXin Li
high_u16(uint16x8_t a)84*67e74705SXin Li uint16x4_t high_u16(uint16x8_t a) {
85*67e74705SXin Li // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
86*67e74705SXin Li return vget_high_u16(a);
87*67e74705SXin Li }
88*67e74705SXin Li
high_s32(int32x4_t a)89*67e74705SXin Li int32x2_t high_s32( int32x4_t a) {
90*67e74705SXin Li // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 2, i32 3>
91*67e74705SXin Li return vget_high_s32(a);
92*67e74705SXin Li }
93*67e74705SXin Li
high_u32(uint32x4_t a)94*67e74705SXin Li uint32x2_t high_u32(uint32x4_t a) {
95*67e74705SXin Li // CHECK: shufflevector <4 x i32> %a, <4 x i32> %a, <2 x i32> <i32 2, i32 3>
96*67e74705SXin Li return vget_high_u32(a);
97*67e74705SXin Li }
98*67e74705SXin Li
high_s64(int64x2_t a)99*67e74705SXin Li int64x1_t high_s64( int64x2_t a) {
100*67e74705SXin Li // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> <i32 1>
101*67e74705SXin Li return vget_high_s64(a);
102*67e74705SXin Li }
103*67e74705SXin Li
high_u64(uint64x2_t a)104*67e74705SXin Li uint64x1_t high_u64(uint64x2_t a) {
105*67e74705SXin Li // CHECK: shufflevector <2 x i64> %a, <2 x i64> %a, <1 x i32> <i32 1>
106*67e74705SXin Li return vget_high_u64(a);
107*67e74705SXin Li }
108*67e74705SXin Li
high_p8(poly8x16_t a)109*67e74705SXin Li poly8x8_t high_p8 (poly8x16_t a) {
110*67e74705SXin Li // CHECK: shufflevector <16 x i8> %a, <16 x i8> %a, <8 x i32> <i32 8, i32 9, i32 10, i32 11, i32 12, i32 13, i32 14, i32 15>
111*67e74705SXin Li return vget_high_p8(a);
112*67e74705SXin Li }
113*67e74705SXin Li
high_p16(poly16x8_t a)114*67e74705SXin Li poly16x4_t high_p16(poly16x8_t a) {
115*67e74705SXin Li // CHECK: shufflevector <8 x i16> %a, <8 x i16> %a, <4 x i32> <i32 4, i32 5, i32 6, i32 7>
116*67e74705SXin Li return vget_high_p16(a);
117*67e74705SXin Li }
118*67e74705SXin Li
high_f32(float32x4_t a)119*67e74705SXin Li float32x2_t high_f32(float32x4_t a) {
120*67e74705SXin Li // CHECK: shufflevector <4 x float> %a, <4 x float> %a, <2 x i32> <i32 2, i32 3>
121*67e74705SXin Li return vget_high_f32(a);
122*67e74705SXin Li }
123*67e74705SXin Li
124