; RUN: llc -mtriple=arm-eabi -mattr=+neon -fast-isel=0 -O0 %s -o - | FileCheck %s

; Code generation test for the @llvm.arm.neon.vst3.* intrinsics on ARM with
; NEON enabled. Each function loads one vector from %B and passes it three
; times to the intrinsic, then FileCheck verifies the emitted store
; instruction(s). The run uses -O0, so the patterns below deliberately avoid
; matching specific register numbers.

; 64-bit vector of i8 with an alignment operand of 32.
define void @vst3i8(i8* %A, <8 x i8>* %B) nounwind {
;CHECK-LABEL: vst3i8:
;Check the alignment value.  Max for this instruction is 64 bits:
;This test runs at -O0 so do not check for specific register numbers.
;CHECK: vst3.8 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}:64]
  %tmp1 = load <8 x i8>, <8 x i8>* %B
  call void @llvm.arm.neon.vst3.p0i8.v8i8(i8* %A, <8 x i8> %tmp1, <8 x i8> %tmp1, <8 x i8> %tmp1, i32 32)
  ret void
}

; 64-bit vector of i16; only the instruction mnemonic is verified.
define void @vst3i16(i16* %A, <4 x i16>* %B) nounwind {
;CHECK-LABEL: vst3i16:
;CHECK: vst3.16
  %tmp0 = bitcast i16* %A to i8*
  %tmp1 = load <4 x i16>, <4 x i16>* %B
  call void @llvm.arm.neon.vst3.p0i8.v4i16(i8* %tmp0, <4 x i16> %tmp1, <4 x i16> %tmp1, <4 x i16> %tmp1, i32 1)
  ret void
}

; 64-bit vector of i32; only the instruction mnemonic is verified.
define void @vst3i32(i32* %A, <2 x i32>* %B) nounwind {
;CHECK-LABEL: vst3i32:
;CHECK: vst3.32
  %tmp0 = bitcast i32* %A to i8*
  %tmp1 = load <2 x i32>, <2 x i32>* %B
  call void @llvm.arm.neon.vst3.p0i8.v2i32(i8* %tmp0, <2 x i32> %tmp1, <2 x i32> %tmp1, <2 x i32> %tmp1, i32 1)
  ret void
}

;Check for a post-increment updating store.
; The pointer is advanced by 6 x i32 after the store and written back to %ptr;
; the expected instruction carries the writeback marker "!".
define void @vst3i32_update(i32** %ptr, <2 x i32>* %B) nounwind {
;CHECK-LABEL: vst3i32_update:
;CHECK: vst3.32 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}]!
  %A = load i32*, i32** %ptr
  %tmp0 = bitcast i32* %A to i8*
  %tmp1 = load <2 x i32>, <2 x i32>* %B
  call void @llvm.arm.neon.vst3.p0i8.v2i32(i8* %tmp0, <2 x i32> %tmp1, <2 x i32> %tmp1, <2 x i32> %tmp1, i32 1)
  %tmp2 = getelementptr i32, i32* %A, i32 6
  store i32* %tmp2, i32** %ptr
  ret void
}

; 64-bit vector of float; expected to use the 32-bit element form.
define void @vst3f(float* %A, <2 x float>* %B) nounwind {
;CHECK-LABEL: vst3f:
;CHECK: vst3.32
  %tmp0 = bitcast float* %A to i8*
  %tmp1 = load <2 x float>, <2 x float>* %B
  call void @llvm.arm.neon.vst3.p0i8.v2f32(i8* %tmp0, <2 x float> %tmp1, <2 x float> %tmp1, <2 x float> %tmp1, i32 1)
  ret void
}

; Single-element i64 vectors: the expected output is a three-register vst1.64
; rather than a vst3 instruction.
define void @vst3i64(i64* %A, <1 x i64>* %B) nounwind {
;CHECK-LABEL: vst3i64:
;Check the alignment value.  Max for this instruction is 64 bits:
;This test runs at -O0 so do not check for specific register numbers.
;CHECK: vst1.64 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}:64]
  %tmp0 = bitcast i64* %A to i8*
  %tmp1 = load <1 x i64>, <1 x i64>* %B
  call void @llvm.arm.neon.vst3.p0i8.v1i64(i8* %tmp0, <1 x i64> %tmp1, <1 x i64> %tmp1, <1 x i64> %tmp1, i32 16)
  ret void
}

; Post-increment variant of the i64 case: the pointer is advanced by 3 x i64
; and stored back to %ptr; the expected vst1.64 carries the writeback marker.
define void @vst3i64_update(i64** %ptr, <1 x i64>* %B) nounwind {
;CHECK-LABEL: vst3i64_update:
;CHECK: vst1.64 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}]!
  %A = load i64*, i64** %ptr
  %tmp0 = bitcast i64* %A to i8*
  %tmp1 = load <1 x i64>, <1 x i64>* %B
  call void @llvm.arm.neon.vst3.p0i8.v1i64(i8* %tmp0, <1 x i64> %tmp1, <1 x i64> %tmp1, <1 x i64> %tmp1, i32 1)
  %tmp2 = getelementptr i64, i64* %A, i32 3
  store i64* %tmp2, i64** %ptr
  ret void
}

; 128-bit vector of i8: two vst3.8 instructions are expected, the first one
; with address writeback.
define void @vst3Qi8(i8* %A, <16 x i8>* %B) nounwind {
;CHECK-LABEL: vst3Qi8:
;Check the alignment value.  Max for this instruction is 64 bits:
;This test runs at -O0 so do not check for specific register numbers.
;CHECK: vst3.8 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}:64]!
;CHECK: vst3.8 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}:64]
  %tmp1 = load <16 x i8>, <16 x i8>* %B
  call void @llvm.arm.neon.vst3.p0i8.v16i8(i8* %A, <16 x i8> %tmp1, <16 x i8> %tmp1, <16 x i8> %tmp1, i32 32)
  ret void
}

; 128-bit vector of i16: two vst3.16 instructions are expected.
define void @vst3Qi16(i16* %A, <8 x i16>* %B) nounwind {
;CHECK-LABEL: vst3Qi16:
;CHECK: vst3.16
;CHECK: vst3.16
  %tmp0 = bitcast i16* %A to i8*
  %tmp1 = load <8 x i16>, <8 x i16>* %B
  call void @llvm.arm.neon.vst3.p0i8.v8i16(i8* %tmp0, <8 x i16> %tmp1, <8 x i16> %tmp1, <8 x i16> %tmp1, i32 1)
  ret void
}

;Check for a post-increment updating store.
; The pointer is advanced by 24 x i16 after the store and written back to
; %ptr; both expected vst3.16 instructions carry the writeback marker.
define void @vst3Qi16_update(i16** %ptr, <8 x i16>* %B) nounwind {
;CHECK-LABEL: vst3Qi16_update:
;CHECK: vst3.16 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}]!
;CHECK: vst3.16 {d{{.*}}, d{{.*}}, d{{.*}}}, [r{{.*}}]!
  %A = load i16*, i16** %ptr
  %tmp0 = bitcast i16* %A to i8*
  %tmp1 = load <8 x i16>, <8 x i16>* %B
  call void @llvm.arm.neon.vst3.p0i8.v8i16(i8* %tmp0, <8 x i16> %tmp1, <8 x i16> %tmp1, <8 x i16> %tmp1, i32 1)
  %tmp2 = getelementptr i16, i16* %A, i32 24
  store i16* %tmp2, i16** %ptr
  ret void
}

; 128-bit vector of i32: two vst3.32 instructions are expected.
define void @vst3Qi32(i32* %A, <4 x i32>* %B) nounwind {
;CHECK-LABEL: vst3Qi32:
;CHECK: vst3.32
;CHECK: vst3.32
  %tmp0 = bitcast i32* %A to i8*
  %tmp1 = load <4 x i32>, <4 x i32>* %B
  call void @llvm.arm.neon.vst3.p0i8.v4i32(i8* %tmp0, <4 x i32> %tmp1, <4 x i32> %tmp1, <4 x i32> %tmp1, i32 1)
  ret void
}

; 128-bit vector of float: two vst3.32 instructions are expected.
define void @vst3Qf(float* %A, <4 x float>* %B) nounwind {
;CHECK-LABEL: vst3Qf:
;CHECK: vst3.32
;CHECK: vst3.32
  %tmp0 = bitcast float* %A to i8*
  %tmp1 = load <4 x float>, <4 x float>* %B
  call void @llvm.arm.neon.vst3.p0i8.v4f32(i8* %tmp0, <4 x float> %tmp1, <4 x float> %tmp1, <4 x float> %tmp1, i32 1)
  ret void
}

; Intrinsic declarations for the 64-bit vector forms.
declare void @llvm.arm.neon.vst3.p0i8.v8i8(i8*, <8 x i8>, <8 x i8>, <8 x i8>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v4i16(i8*, <4 x i16>, <4 x i16>, <4 x i16>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v2i32(i8*, <2 x i32>, <2 x i32>, <2 x i32>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v2f32(i8*, <2 x float>, <2 x float>, <2 x float>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v1i64(i8*, <1 x i64>, <1 x i64>, <1 x i64>, i32) nounwind

; Intrinsic declarations for the 128-bit vector forms.
declare void @llvm.arm.neon.vst3.p0i8.v16i8(i8*, <16 x i8>, <16 x i8>, <16 x i8>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v8i16(i8*, <8 x i16>, <8 x i16>, <8 x i16>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v4i32(i8*, <4 x i32>, <4 x i32>, <4 x i32>, i32) nounwind
declare void @llvm.arm.neon.vst3.p0i8.v4f32(i8*, <4 x float>, <4 x float>, <4 x float>, i32) nounwind