; xref: /aosp_15_r20/external/llvm/test/CodeGen/ARM/vmls.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
; RUN: llc -mtriple=arm-eabi -mattr=+neon %s -o - | FileCheck %s
2*9880d681SAndroid Build Coastguard Worker
; vmlsi8: integer multiply-subtract on 64-bit <8 x i8> vectors.
; Loads the three operands, computes *A - (*B * *C), and expects the
; mul feeding the sub to be selected as vmls.i8.
define <8 x i8> @vmlsi8(<8 x i8>* %A, <8 x i8>* %B, <8 x i8>* %C) nounwind {
;CHECK-LABEL: vmlsi8:
;CHECK: vmls.i8
	%tmp1 = load <8 x i8>, <8 x i8>* %A
	%tmp2 = load <8 x i8>, <8 x i8>* %B
	%tmp3 = load <8 x i8>, <8 x i8>* %C
	; product of the two multiplicands
	%tmp4 = mul <8 x i8> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = sub <8 x i8> %tmp1, %tmp4
	ret <8 x i8> %tmp5
}
13*9880d681SAndroid Build Coastguard Worker
; vmlsi16: integer multiply-subtract on 64-bit <4 x i16> vectors.
; Computes *A - (*B * *C) and expects vmls.i16 in the output.
define <4 x i16> @vmlsi16(<4 x i16>* %A, <4 x i16>* %B, <4 x i16>* %C) nounwind {
;CHECK-LABEL: vmlsi16:
;CHECK: vmls.i16
	%tmp1 = load <4 x i16>, <4 x i16>* %A
	%tmp2 = load <4 x i16>, <4 x i16>* %B
	%tmp3 = load <4 x i16>, <4 x i16>* %C
	; product of the two multiplicands
	%tmp4 = mul <4 x i16> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = sub <4 x i16> %tmp1, %tmp4
	ret <4 x i16> %tmp5
}
24*9880d681SAndroid Build Coastguard Worker
; vmlsi32: integer multiply-subtract on 64-bit <2 x i32> vectors.
; Computes *A - (*B * *C) and expects vmls.i32 in the output.
define <2 x i32> @vmlsi32(<2 x i32>* %A, <2 x i32>* %B, <2 x i32>* %C) nounwind {
;CHECK-LABEL: vmlsi32:
;CHECK: vmls.i32
	%tmp1 = load <2 x i32>, <2 x i32>* %A
	%tmp2 = load <2 x i32>, <2 x i32>* %B
	%tmp3 = load <2 x i32>, <2 x i32>* %C
	; product of the two multiplicands
	%tmp4 = mul <2 x i32> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = sub <2 x i32> %tmp1, %tmp4
	ret <2 x i32> %tmp5
}
35*9880d681SAndroid Build Coastguard Worker
; vmlsf32: floating-point multiply-subtract on 64-bit <2 x float> vectors.
; Computes *A - (*B * *C) with fmul/fsub and expects vmls.f32 in the output.
define <2 x float> @vmlsf32(<2 x float>* %A, <2 x float>* %B, <2 x float>* %C) nounwind {
;CHECK-LABEL: vmlsf32:
;CHECK: vmls.f32
	%tmp1 = load <2 x float>, <2 x float>* %A
	%tmp2 = load <2 x float>, <2 x float>* %B
	%tmp3 = load <2 x float>, <2 x float>* %C
	; product of the two multiplicands
	%tmp4 = fmul <2 x float> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = fsub <2 x float> %tmp1, %tmp4
	ret <2 x float> %tmp5
}
46*9880d681SAndroid Build Coastguard Worker
; vmlsQi8: integer multiply-subtract on 128-bit <16 x i8> vectors.
; Computes *A - (*B * *C) and expects vmls.i8 in the output.
define <16 x i8> @vmlsQi8(<16 x i8>* %A, <16 x i8>* %B, <16 x i8>* %C) nounwind {
;CHECK-LABEL: vmlsQi8:
;CHECK: vmls.i8
	%tmp1 = load <16 x i8>, <16 x i8>* %A
	%tmp2 = load <16 x i8>, <16 x i8>* %B
	%tmp3 = load <16 x i8>, <16 x i8>* %C
	; product of the two multiplicands
	%tmp4 = mul <16 x i8> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = sub <16 x i8> %tmp1, %tmp4
	ret <16 x i8> %tmp5
}
57*9880d681SAndroid Build Coastguard Worker
; vmlsQi16: integer multiply-subtract on 128-bit <8 x i16> vectors.
; Computes *A - (*B * *C) and expects vmls.i16 in the output.
define <8 x i16> @vmlsQi16(<8 x i16>* %A, <8 x i16>* %B, <8 x i16>* %C) nounwind {
;CHECK-LABEL: vmlsQi16:
;CHECK: vmls.i16
	%tmp1 = load <8 x i16>, <8 x i16>* %A
	%tmp2 = load <8 x i16>, <8 x i16>* %B
	%tmp3 = load <8 x i16>, <8 x i16>* %C
	; product of the two multiplicands
	%tmp4 = mul <8 x i16> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = sub <8 x i16> %tmp1, %tmp4
	ret <8 x i16> %tmp5
}
68*9880d681SAndroid Build Coastguard Worker
; vmlsQi32: integer multiply-subtract on 128-bit <4 x i32> vectors.
; Computes *A - (*B * *C) and expects vmls.i32 in the output.
define <4 x i32> @vmlsQi32(<4 x i32>* %A, <4 x i32>* %B, <4 x i32>* %C) nounwind {
;CHECK-LABEL: vmlsQi32:
;CHECK: vmls.i32
	%tmp1 = load <4 x i32>, <4 x i32>* %A
	%tmp2 = load <4 x i32>, <4 x i32>* %B
	%tmp3 = load <4 x i32>, <4 x i32>* %C
	; product of the two multiplicands
	%tmp4 = mul <4 x i32> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = sub <4 x i32> %tmp1, %tmp4
	ret <4 x i32> %tmp5
}
79*9880d681SAndroid Build Coastguard Worker
; vmlsQf32: floating-point multiply-subtract on 128-bit <4 x float> vectors.
; Computes *A - (*B * *C) with fmul/fsub and expects vmls.f32 in the output.
define <4 x float> @vmlsQf32(<4 x float>* %A, <4 x float>* %B, <4 x float>* %C) nounwind {
;CHECK-LABEL: vmlsQf32:
;CHECK: vmls.f32
	%tmp1 = load <4 x float>, <4 x float>* %A
	%tmp2 = load <4 x float>, <4 x float>* %B
	%tmp3 = load <4 x float>, <4 x float>* %C
	; product of the two multiplicands
	%tmp4 = fmul <4 x float> %tmp2, %tmp3
	; subtract the product from the accumulator loaded from %A
	%tmp5 = fsub <4 x float> %tmp1, %tmp4
	ret <4 x float> %tmp5
}
90*9880d681SAndroid Build Coastguard Worker
; vmlsls8: signed widening multiply-subtract, <8 x i8> operands into an
; <8 x i16> accumulator. Both multiplicands are sign-extended before the
; mul; the mul + sub pair is expected to be selected as vmlsl.s8.
define <8 x i16> @vmlsls8(<8 x i16>* %A, <8 x i8>* %B, <8 x i8>* %C) nounwind {
;CHECK-LABEL: vmlsls8:
;CHECK: vmlsl.s8
	%tmp1 = load <8 x i16>, <8 x i16>* %A
	%tmp2 = load <8 x i8>, <8 x i8>* %B
	%tmp3 = load <8 x i8>, <8 x i8>* %C
	; widen both narrow operands with sign extension
	%tmp4 = sext <8 x i8> %tmp2 to <8 x i16>
	%tmp5 = sext <8 x i8> %tmp3 to <8 x i16>
	%tmp6 = mul <8 x i16> %tmp4, %tmp5
	; subtract the widened product from the accumulator loaded from %A
	%tmp7 = sub <8 x i16> %tmp1, %tmp6
	ret <8 x i16> %tmp7
}
103*9880d681SAndroid Build Coastguard Worker
; vmlsls16: signed widening multiply-subtract, <4 x i16> operands into a
; <4 x i32> accumulator. Both multiplicands are sign-extended before the
; mul; the mul + sub pair is expected to be selected as vmlsl.s16.
define <4 x i32> @vmlsls16(<4 x i32>* %A, <4 x i16>* %B, <4 x i16>* %C) nounwind {
;CHECK-LABEL: vmlsls16:
;CHECK: vmlsl.s16
	%tmp1 = load <4 x i32>, <4 x i32>* %A
	%tmp2 = load <4 x i16>, <4 x i16>* %B
	%tmp3 = load <4 x i16>, <4 x i16>* %C
	; widen both narrow operands with sign extension
	%tmp4 = sext <4 x i16> %tmp2 to <4 x i32>
	%tmp5 = sext <4 x i16> %tmp3 to <4 x i32>
	%tmp6 = mul <4 x i32> %tmp4, %tmp5
	; subtract the widened product from the accumulator loaded from %A
	%tmp7 = sub <4 x i32> %tmp1, %tmp6
	ret <4 x i32> %tmp7
}
116*9880d681SAndroid Build Coastguard Worker
; vmlsls32: signed widening multiply-subtract, <2 x i32> operands into a
; <2 x i64> accumulator. Both multiplicands are sign-extended before the
; mul; the mul + sub pair is expected to be selected as vmlsl.s32.
define <2 x i64> @vmlsls32(<2 x i64>* %A, <2 x i32>* %B, <2 x i32>* %C) nounwind {
;CHECK-LABEL: vmlsls32:
;CHECK: vmlsl.s32
	%tmp1 = load <2 x i64>, <2 x i64>* %A
	%tmp2 = load <2 x i32>, <2 x i32>* %B
	%tmp3 = load <2 x i32>, <2 x i32>* %C
	; widen both narrow operands with sign extension
	%tmp4 = sext <2 x i32> %tmp2 to <2 x i64>
	%tmp5 = sext <2 x i32> %tmp3 to <2 x i64>
	%tmp6 = mul <2 x i64> %tmp4, %tmp5
	; subtract the widened product from the accumulator loaded from %A
	%tmp7 = sub <2 x i64> %tmp1, %tmp6
	ret <2 x i64> %tmp7
}
129*9880d681SAndroid Build Coastguard Worker
; vmlslu8: unsigned widening multiply-subtract, <8 x i8> operands into an
; <8 x i16> accumulator. Both multiplicands are zero-extended before the
; mul; the mul + sub pair is expected to be selected as vmlsl.u8.
define <8 x i16> @vmlslu8(<8 x i16>* %A, <8 x i8>* %B, <8 x i8>* %C) nounwind {
;CHECK-LABEL: vmlslu8:
;CHECK: vmlsl.u8
	%tmp1 = load <8 x i16>, <8 x i16>* %A
	%tmp2 = load <8 x i8>, <8 x i8>* %B
	%tmp3 = load <8 x i8>, <8 x i8>* %C
	; widen both narrow operands with zero extension
	%tmp4 = zext <8 x i8> %tmp2 to <8 x i16>
	%tmp5 = zext <8 x i8> %tmp3 to <8 x i16>
	%tmp6 = mul <8 x i16> %tmp4, %tmp5
	; subtract the widened product from the accumulator loaded from %A
	%tmp7 = sub <8 x i16> %tmp1, %tmp6
	ret <8 x i16> %tmp7
}
142*9880d681SAndroid Build Coastguard Worker
; vmlslu16: unsigned widening multiply-subtract, <4 x i16> operands into a
; <4 x i32> accumulator. Both multiplicands are zero-extended before the
; mul; the mul + sub pair is expected to be selected as vmlsl.u16.
define <4 x i32> @vmlslu16(<4 x i32>* %A, <4 x i16>* %B, <4 x i16>* %C) nounwind {
;CHECK-LABEL: vmlslu16:
;CHECK: vmlsl.u16
	%tmp1 = load <4 x i32>, <4 x i32>* %A
	%tmp2 = load <4 x i16>, <4 x i16>* %B
	%tmp3 = load <4 x i16>, <4 x i16>* %C
	; widen both narrow operands with zero extension
	%tmp4 = zext <4 x i16> %tmp2 to <4 x i32>
	%tmp5 = zext <4 x i16> %tmp3 to <4 x i32>
	%tmp6 = mul <4 x i32> %tmp4, %tmp5
	; subtract the widened product from the accumulator loaded from %A
	%tmp7 = sub <4 x i32> %tmp1, %tmp6
	ret <4 x i32> %tmp7
}
155*9880d681SAndroid Build Coastguard Worker
; vmlslu32: unsigned widening multiply-subtract, <2 x i32> operands into a
; <2 x i64> accumulator. Both multiplicands are zero-extended before the
; mul; the mul + sub pair is expected to be selected as vmlsl.u32.
define <2 x i64> @vmlslu32(<2 x i64>* %A, <2 x i32>* %B, <2 x i32>* %C) nounwind {
;CHECK-LABEL: vmlslu32:
;CHECK: vmlsl.u32
	%tmp1 = load <2 x i64>, <2 x i64>* %A
	%tmp2 = load <2 x i32>, <2 x i32>* %B
	%tmp3 = load <2 x i32>, <2 x i32>* %C
	; widen both narrow operands with zero extension
	%tmp4 = zext <2 x i32> %tmp2 to <2 x i64>
	%tmp5 = zext <2 x i32> %tmp3 to <2 x i64>
	%tmp6 = mul <2 x i64> %tmp4, %tmp5
	; subtract the widened product from the accumulator loaded from %A
	%tmp7 = sub <2 x i64> %tmp1, %tmp6
	ret <2 x i64> %tmp7
}
168*9880d681SAndroid Build Coastguard Worker
; test_vmlsl_lanes16: signed widening multiply-subtract by a single lane.
; The second multiplicand is lane 1 of %arg2_int16x4_t splatted across all
; four elements; both operands are sign-extended to <4 x i32>, multiplied,
; and subtracted from %arg0_int32x4_t. The expected output is the by-lane
; form of vmlsl.s16 using q0, d2 and d3[1].
define arm_aapcs_vfpcc <4 x i32> @test_vmlsl_lanes16(<4 x i32> %arg0_int32x4_t, <4 x i16> %arg1_int16x4_t, <4 x i16> %arg2_int16x4_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_lanes16:
; CHECK: vmlsl.s16 q0, d2, d3[1]
  ; splat lane 1 of the second multiplicand
  %0 = shufflevector <4 x i16> %arg2_int16x4_t, <4 x i16> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %1 = sext <4 x i16> %arg1_int16x4_t to <4 x i32>
  %2 = sext <4 x i16> %0 to <4 x i32>
  %3 = mul <4 x i32> %1, %2
  ; subtract the widened product from the accumulator argument
  %4 = sub <4 x i32> %arg0_int32x4_t, %3
  ret <4 x i32> %4
}
180*9880d681SAndroid Build Coastguard Worker
; test_vmlsl_lanes32: signed widening multiply-subtract by a single lane.
; The second multiplicand is lane 1 of %arg2_int32x2_t splatted across both
; elements; both operands are sign-extended to <2 x i64>, multiplied, and
; subtracted from %arg0_int64x2_t. The expected output is the by-lane form
; of vmlsl.s32 using q0, d2 and d3[1].
define arm_aapcs_vfpcc <2 x i64> @test_vmlsl_lanes32(<2 x i64> %arg0_int64x2_t, <2 x i32> %arg1_int32x2_t, <2 x i32> %arg2_int32x2_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_lanes32:
; CHECK: vmlsl.s32 q0, d2, d3[1]
  ; splat lane 1 of the second multiplicand
  %0 = shufflevector <2 x i32> %arg2_int32x2_t, <2 x i32> undef, <2 x i32> <i32 1, i32 1>
  %1 = sext <2 x i32> %arg1_int32x2_t to <2 x i64>
  %2 = sext <2 x i32> %0 to <2 x i64>
  %3 = mul <2 x i64> %1, %2
  ; subtract the widened product from the accumulator argument
  %4 = sub <2 x i64> %arg0_int64x2_t, %3
  ret <2 x i64> %4
}
192*9880d681SAndroid Build Coastguard Worker
; test_vmlsl_laneu16: unsigned widening multiply-subtract by a single lane.
; The second multiplicand is lane 1 of %arg2_uint16x4_t splatted across all
; four elements; both operands are zero-extended to <4 x i32>, multiplied,
; and subtracted from %arg0_uint32x4_t. The expected output is the by-lane
; form of vmlsl.u16 using q0, d2 and d3[1].
define arm_aapcs_vfpcc <4 x i32> @test_vmlsl_laneu16(<4 x i32> %arg0_uint32x4_t, <4 x i16> %arg1_uint16x4_t, <4 x i16> %arg2_uint16x4_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_laneu16:
; CHECK: vmlsl.u16 q0, d2, d3[1]
  ; splat lane 1 of the second multiplicand
  %0 = shufflevector <4 x i16> %arg2_uint16x4_t, <4 x i16> undef, <4 x i32> <i32 1, i32 1, i32 1, i32 1>
  %1 = zext <4 x i16> %arg1_uint16x4_t to <4 x i32>
  %2 = zext <4 x i16> %0 to <4 x i32>
  %3 = mul <4 x i32> %1, %2
  ; subtract the widened product from the accumulator argument
  %4 = sub <4 x i32> %arg0_uint32x4_t, %3
  ret <4 x i32> %4
}
204*9880d681SAndroid Build Coastguard Worker
; test_vmlsl_laneu32: unsigned widening multiply-subtract by a single lane.
; The second multiplicand is lane 1 of %arg2_uint32x2_t splatted across both
; elements; both operands are zero-extended to <2 x i64>, multiplied, and
; subtracted from %arg0_uint64x2_t. The expected output is the by-lane form
; of vmlsl.u32 using q0, d2 and d3[1].
define arm_aapcs_vfpcc <2 x i64> @test_vmlsl_laneu32(<2 x i64> %arg0_uint64x2_t, <2 x i32> %arg1_uint32x2_t, <2 x i32> %arg2_uint32x2_t) nounwind readnone {
entry:
; CHECK-LABEL: test_vmlsl_laneu32:
; CHECK: vmlsl.u32 q0, d2, d3[1]
  ; splat lane 1 of the second multiplicand
  %0 = shufflevector <2 x i32> %arg2_uint32x2_t, <2 x i32> undef, <2 x i32> <i32 1, i32 1>
  %1 = zext <2 x i32> %arg1_uint32x2_t to <2 x i64>
  %2 = zext <2 x i32> %0 to <2 x i64>
  %3 = mul <2 x i64> %1, %2
  ; subtract the widened product from the accumulator argument
  %4 = sub <2 x i64> %arg0_uint64x2_t, %3
  ret <2 x i64> %4
}
216