; RUN: llc -mtriple=arm-eabi -mattr=+neon %s -o - | FileCheck %s

; Codegen test for NEON multiply-subtract selection on ARM.
;
; Every function below computes "accumulator - (x * y)" with a separate
; multiply and subtract in the IR; the FileCheck lines expect llc to emit a
; single vmls / vmlsl instruction for that pair.
;
; Layout:
;   * vmls<ty>      - 64-bit vectors, operands loaded from memory.
;   * vmlsQ<ty>     - 128-bit vectors, operands loaded from memory.
;   * vmlsl{s,u}<n> - widening form: both multiplicands are sign- or
;                     zero-extended to twice their element width first.
;   * test_vmlsl_lane{s,u}<n> - widening form where one multiplicand is a
;                     splat of element 1, passed in registers (arm_aapcs_vfpcc).

;------------------------------------------------------------------------------
; 64-bit vectors: A - (B * C)
;------------------------------------------------------------------------------

define <8 x i8> @vmlsi8(<8 x i8>* %A, <8 x i8>* %B, <8 x i8>* %C) nounwind {
;CHECK-LABEL: vmlsi8:
;CHECK: vmls.i8
  %tmp1 = load <8 x i8>, <8 x i8>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = load <8 x i8>, <8 x i8>* %C
  %tmp4 = mul <8 x i8> %tmp2, %tmp3
  %tmp5 = sub <8 x i8> %tmp1, %tmp4
  ret <8 x i8> %tmp5
}

define <4 x i16> @vmlsi16(<4 x i16>* %A, <4 x i16>* %B, <4 x i16>* %C) nounwind {
;CHECK-LABEL: vmlsi16:
;CHECK: vmls.i16
  %tmp1 = load <4 x i16>, <4 x i16>* %A
  %tmp2 = load <4 x i16>, <4 x i16>* %B
  %tmp3 = load <4 x i16>, <4 x i16>* %C
  %tmp4 = mul <4 x i16> %tmp2, %tmp3
  %tmp5 = sub <4 x i16> %tmp1, %tmp4
  ret <4 x i16> %tmp5
}

define <2 x i32> @vmlsi32(<2 x i32>* %A, <2 x i32>* %B, <2 x i32>* %C) nounwind {
;CHECK-LABEL: vmlsi32:
;CHECK: vmls.i32
  %tmp1 = load <2 x i32>, <2 x i32>* %A
  %tmp2 = load <2 x i32>, <2 x i32>* %B
  %tmp3 = load <2 x i32>, <2 x i32>* %C
  %tmp4 = mul <2 x i32> %tmp2, %tmp3
  %tmp5 = sub <2 x i32> %tmp1, %tmp4
  ret <2 x i32> %tmp5
}

; Floating-point variant: fmul + fsub is expected to select vmls.f32.
define <2 x float> @vmlsf32(<2 x float>* %A, <2 x float>* %B, <2 x float>* %C) nounwind {
;CHECK-LABEL: vmlsf32:
;CHECK: vmls.f32
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp2 = load <2 x float>, <2 x float>* %B
  %tmp3 = load <2 x float>, <2 x float>* %C
  %tmp4 = fmul <2 x float> %tmp2, %tmp3
  %tmp5 = fsub <2 x float> %tmp1, %tmp4
  ret <2 x float> %tmp5
}

;------------------------------------------------------------------------------
; 128-bit vectors: A - (B * C)
;------------------------------------------------------------------------------

define <16 x i8> @vmlsQi8(<16 x i8>* %A, <16 x i8>* %B, <16 x i8>* %C) nounwind {
;CHECK-LABEL: vmlsQi8:
;CHECK: vmls.i8
  %tmp1 = load <16 x i8>, <16 x i8>* %A
  %tmp2 = load <16 x i8>, <16 x i8>* %B
  %tmp3 = load <16 x i8>, <16 x i8>* %C
  %tmp4 = mul <16 x i8> %tmp2, %tmp3
  %tmp5 = sub <16 x i8> %tmp1, %tmp4
  ret <16 x i8> %tmp5
}

define <8 x i16> @vmlsQi16(<8 x i16>* %A, <8 x i16>* %B, <8 x i16>* %C) nounwind {
;CHECK-LABEL: vmlsQi16:
;CHECK: vmls.i16
  %tmp1 = load <8 x i16>, <8 x i16>* %A
  %tmp2 = load <8 x i16>, <8 x i16>* %B
  %tmp3 = load <8 x i16>, <8 x i16>* %C
  %tmp4 = mul <8 x i16> %tmp2, %tmp3
  %tmp5 = sub <8 x i16> %tmp1, %tmp4
  ret <8 x i16> %tmp5
}

define <4 x i32> @vmlsQi32(<4 x i32>* %A, <4 x i32>* %B, <4 x i32>* %C) nounwind {
;CHECK-LABEL: vmlsQi32:
;CHECK: vmls.i32
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp2 = load <4 x i32>, <4 x i32>* %B
  %tmp3 = load <4 x i32>, <4 x i32>* %C
  %tmp4 = mul <4 x i32> %tmp2, %tmp3
  %tmp5 = sub <4 x i32> %tmp1, %tmp4
  ret <4 x i32> %tmp5
}

; Floating-point variant: fmul + fsub is expected to select vmls.f32.
define <4 x float> @vmlsQf32(<4 x float>* %A, <4 x float>* %B, <4 x float>* %C) nounwind {
;CHECK-LABEL: vmlsQf32:
;CHECK: vmls.f32
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = load <4 x float>, <4 x float>* %C
  %tmp4 = fmul <4 x float> %tmp2, %tmp3
  %tmp5 = fsub <4 x float> %tmp1, %tmp4
  ret <4 x float> %tmp5
}

;------------------------------------------------------------------------------
; Widening, signed: A - (sext(B) * sext(C))
;------------------------------------------------------------------------------

define <8 x i16> @vmlsls8(<8 x i16>* %A, <8 x i8>* %B, <8 x i8>* %C) nounwind {
;CHECK-LABEL: vmlsls8:
;CHECK: vmlsl.s8
  %tmp1 = load <8 x i16>, <8 x i16>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = load <8 x i8>, <8 x i8>* %C
  %tmp4 = sext <8 x i8> %tmp2 to <8 x i16>
  %tmp5 = sext <8 x i8> %tmp3 to <8 x i16>
  %tmp6 = mul <8 x i16> %tmp4, %tmp5
  %tmp7 = sub <8 x i16> %tmp1, %tmp6
  ret <8 x i16> %tmp7
}

define <4 x i32> @vmlsls16(<4 x i32>* %A, <4 x i16>* %B, <4 x i16>* %C) nounwind {
;CHECK-LABEL: vmlsls16:
;CHECK: vmlsl.s16
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp2 = load <4 x i16>, <4 x i16>* %B
  %tmp3 = load <4 x i16>, <4 x i16>* %C
  %tmp4 = sext <4 x i16> %tmp2 to <4 x i32>
  %tmp5 = sext <4 x i16> %tmp3 to <4 x i32>
  %tmp6 = mul <4 x i32> %tmp4, %tmp5
  %tmp7 = sub <4 x i32> %tmp1, %tmp6
  ret <4 x i32> %tmp7
}

define <2 x i64> @vmlsls32(<2 x i64>* %A, <2 x i32>* %B, <2 x i32>* %C) nounwind {
;CHECK-LABEL: vmlsls32:
;CHECK: vmlsl.s32
  %tmp1 = load <2 x i64>, <2 x i64>* %A
  %tmp2 = load <2 x i32>, <2 x i32>* %B
  %tmp3 = load <2 x i32>, <2 x i32>* %C
  %tmp4 = sext <2 x i32> %tmp2 to <2 x i64>
  %tmp5 = sext <2 x i32> %tmp3 to <2 x i64>
  %tmp6 = mul <2 x i64> %tmp4, %tmp5
  %tmp7 = sub <2 x i64> %tmp1, %tmp6
  ret <2 x i64> %tmp7
}

;------------------------------------------------------------------------------
; Widening, unsigned: A - (zext(B) * zext(C))
;------------------------------------------------------------------------------

define <8 x i16> @vmlslu8(<8 x i16>* %A, <8 x i8>* %B, <8 x i8>* %C) nounwind {
;CHECK-LABEL: vmlslu8:
;CHECK: vmlsl.u8
  %tmp1 = load <8 x i16>, <8 x i16>* %A
  %tmp2 = load <8 x i8>, <8 x i8>* %B
  %tmp3 = load <8 x i8>, <8 x i8>* %C
  %tmp4 = zext <8 x i8> %tmp2 to <8 x i16>
  %tmp5 = zext <8 x i8> %tmp3 to <8 x i16>
  %tmp6 = mul <8 x i16> %tmp4, %tmp5
  %tmp7 = sub <8 x i16> %tmp1, %tmp6
  ret <8 x i16> %tmp7
}

define <4 x i32> @vmlslu16(<4 x i32>* %A, <4 x i16>* %B, <4 x i16>* %C) nounwind {
;CHECK-LABEL: vmlslu16:
;CHECK: vmlsl.u16
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp2 = load <4 x i16>, <4 x i16>* %B
  %tmp3 = load <4 x i16>, <4 x i16>* %C
  %tmp4 = zext <4 x i16> %tmp2 to <4 x i32>
  %tmp5 = zext <4 x i16> %tmp3 to <4 x i32>
  %tmp6 = mul <4 x i32> %tmp4, %tmp5
  %tmp7 = sub <4 x i32> %tmp1, %tmp6
  ret <4 x i32> %tmp7
}

define <2 x i64> @vmlslu32(<2 x i64>* %A, <2 x i32>* %B, <2 x i32>* %C) nounwind {
;CHECK-LABEL: vmlslu32:
;CHECK: vmlsl.u32
  %tmp1 = load <2 x i64>, <2 x i64>* %A
  %tmp2 = load <2 x i32>, <2 x i32>* %B
  %tmp3 = load <2 x i32>, <2 x i32>* %C
  %tmp4 = zext <2 x i32> %tmp2 to <2 x i64>
  %tmp5 = zext <2 x i32> %tmp3 to <2 x i64>
  %tmp6 = mul <2 x i64> %tmp4, %tmp5
  %tmp7 = sub <2 x i64> %tmp1, %tmp6
  ret <2 x i64> %tmp7
}

;------------------------------------------------------------------------------
; Widening by lane: arg0 - (ext(arg1) * ext(splat(arg2[1])))
;
; Arguments arrive in registers (arm_aapcs_vfpcc), so the exact operands are
; checked: accumulator in q0, first multiplicand in d2, and the splatted
; element folded into the instruction as the lane operand d3[1].
; Each function is anchored with a label check (function name plus colon), the
; same way as the tests above, so a match cannot leak across functions.
;------------------------------------------------------------------------------

define arm_aapcs_vfpcc <4 x i32> @test_vmlsl_lanes16(<4 x i32> %arg0_int32x4_t, <4 x i16> %arg1_int16x4_t, <4 x i16> %arg2_int16x4_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_lanes16:
; CHECK: vmlsl.s16 q0, d2, d3[1]
  ; Broadcast element 1 of arg2 to all four lanes.
  %0 = shufflevector <4 x i16> %arg2_int16x4_t, <4 x i16> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %1 = sext <4 x i16> %arg1_int16x4_t to <4 x i32>
  %2 = sext <4 x i16> %0 to <4 x i32>
  %3 = mul <4 x i32> %1, %2
  %4 = sub <4 x i32> %arg0_int32x4_t, %3
  ret <4 x i32> %4
}

define arm_aapcs_vfpcc <2 x i64> @test_vmlsl_lanes32(<2 x i64> %arg0_int64x2_t, <2 x i32> %arg1_int32x2_t, <2 x i32> %arg2_int32x2_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_lanes32:
; CHECK: vmlsl.s32 q0, d2, d3[1]
  ; Broadcast element 1 of arg2 to both lanes.
  %0 = shufflevector <2 x i32> %arg2_int32x2_t, <2 x i32> undef, <2 x i32> <i32 1, i32 1>
  %1 = sext <2 x i32> %arg1_int32x2_t to <2 x i64>
  %2 = sext <2 x i32> %0 to <2 x i64>
  %3 = mul <2 x i64> %1, %2
  %4 = sub <2 x i64> %arg0_int64x2_t, %3
  ret <2 x i64> %4
}

define arm_aapcs_vfpcc <4 x i32> @test_vmlsl_laneu16(<4 x i32> %arg0_uint32x4_t, <4 x i16> %arg1_uint16x4_t, <4 x i16> %arg2_uint16x4_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_laneu16:
; CHECK: vmlsl.u16 q0, d2, d3[1]
  ; Broadcast element 1 of arg2 to all four lanes.
  %0 = shufflevector <4 x i16> %arg2_uint16x4_t, <4 x i16> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %1 = zext <4 x i16> %arg1_uint16x4_t to <4 x i32>
  %2 = zext <4 x i16> %0 to <4 x i32>
  %3 = mul <4 x i32> %1, %2
  %4 = sub <4 x i32> %arg0_uint32x4_t, %3
  ret <4 x i32> %4
}

define arm_aapcs_vfpcc <2 x i64> @test_vmlsl_laneu32(<2 x i64> %arg0_uint64x2_t, <2 x i32> %arg1_uint32x2_t, <2 x i32> %arg2_uint32x2_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_laneu32:
; CHECK: vmlsl.u32 q0, d2, d3[1]
  ; Broadcast element 1 of arg2 to both lanes.
  %0 = shufflevector <2 x i32> %arg2_uint32x2_t, <2 x i32> undef, <2 x i32> <i32 1, i32 1>
  %1 = zext <2 x i32> %arg1_uint32x2_t to <2 x i64>
  %2 = zext <2 x i32> %0 to <2 x i64>
  %3 = mul <2 x i64> %1, %2
  %4 = sub <2 x i64> %arg0_uint64x2_t, %3
  ret <2 x i64> %4
}