; xref: /aosp_15_r20/external/llvm/test/CodeGen/X86/fma-intrinsics-phi-213-to-231.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx2,+fma | FileCheck %s

; fmaddsubpd_loop_128: loop whose <2 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmaddsub.pd on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmaddsubpd_loop_128:
; CHECK:   vfmaddsub231pd %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmaddsubpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmaddsub.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; fmsubaddpd_loop_128: loop whose <2 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmsubadd.pd on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmsubaddpd_loop_128:
; CHECK:   vfmsubadd231pd %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmsubaddpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmsubadd.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; fmaddpd_loop_128: loop whose <2 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmadd.pd on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmaddpd_loop_128:
; CHECK:   vfmadd231pd %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmaddpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmadd.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; fmsubpd_loop_128: loop whose <2 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmsub.pd on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmsubpd_loop_128:
; CHECK:   vfmsub231pd %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmsubpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmsub.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; fnmaddpd_loop_128: loop whose <2 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfnmadd.pd on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fnmaddpd_loop_128:
; CHECK:   vfnmadd231pd %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fnmaddpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfnmadd.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; fnmsubpd_loop_128: loop whose <2 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfnmsub.pd on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fnmsubpd_loop_128:
; CHECK:   vfnmsub231pd %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fnmsubpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfnmsub.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; Declarations of the x86 FMA intrinsics on <2 x double> that the
; *pd_loop_128 functions in this file call. Each takes three <2 x double>
; operands and returns a <2 x double>.
declare <2 x double> @llvm.x86.fma.vfmaddsub.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfmsubadd.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfmadd.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfmsub.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfnmadd.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfnmsub.pd(<2 x double>, <2 x double>, <2 x double>)


; fmaddsubps_loop_128: loop whose <4 x float> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmaddsub.ps on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmaddsubps_loop_128:
; CHECK:   vfmaddsub231ps %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmaddsubps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmaddsub.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; fmsubaddps_loop_128: loop whose <4 x float> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmsubadd.ps on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmsubaddps_loop_128:
; CHECK:   vfmsubadd231ps %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmsubaddps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmsubadd.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; fmaddps_loop_128: loop whose <4 x float> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmadd.ps on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmaddps_loop_128:
; CHECK:   vfmadd231ps %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmaddps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; fmsubps_loop_128: loop whose <4 x float> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmsub.ps on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fmsubps_loop_128:
; CHECK:   vfmsub231ps %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmsubps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmsub.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; fnmaddps_loop_128: loop whose <4 x float> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfnmadd.ps on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fnmaddps_loop_128:
; CHECK:   vfnmadd231ps %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fnmaddps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfnmadd.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; fnmsubps_loop_128: loop whose <4 x float> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfnmsub.ps on every iteration
; and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %xmm2, then a vmovaps %xmm2 -> %xmm0 directly followed by retq.
; CHECK-LABEL: fnmsubps_loop_128:
; CHECK:   vfnmsub231ps %xmm1, %xmm0, %xmm2
; CHECK:   vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fnmsubps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfnmsub.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; Declarations of the x86 FMA intrinsics on <4 x float> that the
; *ps_loop_128 functions in this file call. Each takes three <4 x float>
; operands and returns a <4 x float>.
declare <4 x float> @llvm.x86.fma.vfmaddsub.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfmsubadd.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfmsub.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfnmadd.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfnmsub.ps(<4 x float>, <4 x float>, <4 x float>)

; fmaddsubpd_loop_256: loop whose <4 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmaddsub.pd.256 on every
; iteration and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %ymm2, then a vmovaps %ymm2 -> %ymm0 directly followed by retq.
; CHECK-LABEL: fmaddsubpd_loop_256:
; CHECK:   vfmaddsub231pd %ymm1, %ymm0, %ymm2
; CHECK:   vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmaddsubpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmaddsub.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; fmsubaddpd_loop_256: loop whose <4 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmsubadd.pd.256 on every
; iteration and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %ymm2, then a vmovaps %ymm2 -> %ymm0 directly followed by retq.
; CHECK-LABEL: fmsubaddpd_loop_256:
; CHECK:   vfmsubadd231pd %ymm1, %ymm0, %ymm2
; CHECK:   vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmsubaddpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmsubadd.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; fmaddpd_loop_256: loop whose <4 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmadd.pd.256 on every
; iteration and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %ymm2, then a vmovaps %ymm2 -> %ymm0 directly followed by retq.
; CHECK-LABEL: fmaddpd_loop_256:
; CHECK:   vfmadd231pd %ymm1, %ymm0, %ymm2
; CHECK:   vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmaddpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmadd.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; fmsubpd_loop_256: loop whose <4 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfmsub.pd.256 on every
; iteration and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %ymm2, then a vmovaps %ymm2 -> %ymm0 directly followed by retq.
; CHECK-LABEL: fmsubpd_loop_256:
; CHECK:   vfmsub231pd %ymm1, %ymm0, %ymm2
; CHECK:   vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmsubpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmsub.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; fnmaddpd_loop_256: loop whose <4 x double> accumulator phi (%c.addr.0) is
; passed as the third operand of @llvm.x86.fma.vfnmadd.pd.256 on every
; iteration and returned once %i.0 is no longer (signed) less than %iter.
; Expected output per the directives below: the 231 form of the instruction
; writing %ymm2, then a vmovaps %ymm2 -> %ymm0 directly followed by retq.
; CHECK-LABEL: fnmaddpd_loop_256:
; CHECK:   vfnmadd231pd %ymm1, %ymm0, %ymm2
; CHECK:   vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fnmaddpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  ; Accumulator: %c on entry, the previous intrinsic result on the back edge.
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Induction variable: 0 on entry, %inc on the back edge.
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  ; Empty block; only forwards to %for.inc.
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfnmadd.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

460*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fnmsubpd_loop_256:
461*9880d681SAndroid Build Coastguard Worker; CHECK:   vfnmsub231pd %ymm1, %ymm0, %ymm2
462*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
463*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfnmsub.pd.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfnmsub231pd %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
464*9880d681SAndroid Build Coastguard Workerdefine <4 x double> @fnmsubpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
465*9880d681SAndroid Build Coastguard Workerentry:
466*9880d681SAndroid Build Coastguard Worker  br label %for.cond
467*9880d681SAndroid Build Coastguard Worker
468*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
469*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
470*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
471*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
472*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
473*9880d681SAndroid Build Coastguard Worker
474*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
475*9880d681SAndroid Build Coastguard Worker  br label %for.inc
476*9880d681SAndroid Build Coastguard Worker
477*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
478*9880d681SAndroid Build Coastguard Worker  %0 = call <4 x double> @llvm.x86.fma.vfnmsub.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
479*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
480*9880d681SAndroid Build Coastguard Worker  br label %for.cond
481*9880d681SAndroid Build Coastguard Worker
482*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
483*9880d681SAndroid Build Coastguard Worker  ret <4 x double> %c.addr.0
484*9880d681SAndroid Build Coastguard Worker}
485*9880d681SAndroid Build Coastguard Worker
; Declarations of the x86 FMA intrinsics on <4 x double>. Each takes three
; <4 x double> operands and returns a <4 x double>.
; NOTE(review): vfmaddsub, vfmsubadd and vfmadd are presumably called by the
; *_loop_256 functions defined earlier in the file - confirm against those definitions.
486*9880d681SAndroid Build Coastguard Workerdeclare <4 x double> @llvm.x86.fma.vfmaddsub.pd.256(<4 x double>, <4 x double>, <4 x double>)
487*9880d681SAndroid Build Coastguard Workerdeclare <4 x double> @llvm.x86.fma.vfmsubadd.pd.256(<4 x double>, <4 x double>, <4 x double>)
488*9880d681SAndroid Build Coastguard Workerdeclare <4 x double> @llvm.x86.fma.vfmadd.pd.256(<4 x double>, <4 x double>, <4 x double>)
489*9880d681SAndroid Build Coastguard Workerdeclare <4 x double> @llvm.x86.fma.vfmsub.pd.256(<4 x double>, <4 x double>, <4 x double>)
490*9880d681SAndroid Build Coastguard Workerdeclare <4 x double> @llvm.x86.fma.vfnmadd.pd.256(<4 x double>, <4 x double>, <4 x double>)
491*9880d681SAndroid Build Coastguard Workerdeclare <4 x double> @llvm.x86.fma.vfnmsub.pd.256(<4 x double>, <4 x double>, <4 x double>)
492*9880d681SAndroid Build Coastguard Worker
493*9880d681SAndroid Build Coastguard Worker
494*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fmaddsubps_loop_256:
495*9880d681SAndroid Build Coastguard Worker; CHECK:   vfmaddsub231ps %ymm1, %ymm0, %ymm2
496*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
497*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfmaddsub.ps.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfmaddsub231ps %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
498*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fmaddsubps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
499*9880d681SAndroid Build Coastguard Workerentry:
500*9880d681SAndroid Build Coastguard Worker  br label %for.cond
501*9880d681SAndroid Build Coastguard Worker
502*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
503*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
504*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
505*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
506*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
507*9880d681SAndroid Build Coastguard Worker
508*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
509*9880d681SAndroid Build Coastguard Worker  br label %for.inc
510*9880d681SAndroid Build Coastguard Worker
511*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
512*9880d681SAndroid Build Coastguard Worker  %0 = call <8 x float> @llvm.x86.fma.vfmaddsub.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
513*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
514*9880d681SAndroid Build Coastguard Worker  br label %for.cond
515*9880d681SAndroid Build Coastguard Worker
516*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
517*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %c.addr.0
518*9880d681SAndroid Build Coastguard Worker}
519*9880d681SAndroid Build Coastguard Worker
520*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fmsubaddps_loop_256:
521*9880d681SAndroid Build Coastguard Worker; CHECK:   vfmsubadd231ps %ymm1, %ymm0, %ymm2
522*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
523*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfmsubadd.ps.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfmsubadd231ps %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
524*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fmsubaddps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
525*9880d681SAndroid Build Coastguard Workerentry:
526*9880d681SAndroid Build Coastguard Worker  br label %for.cond
527*9880d681SAndroid Build Coastguard Worker
528*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
529*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
530*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
531*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
532*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
533*9880d681SAndroid Build Coastguard Worker
534*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
535*9880d681SAndroid Build Coastguard Worker  br label %for.inc
536*9880d681SAndroid Build Coastguard Worker
537*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
538*9880d681SAndroid Build Coastguard Worker  %0 = call <8 x float> @llvm.x86.fma.vfmsubadd.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
539*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
540*9880d681SAndroid Build Coastguard Worker  br label %for.cond
541*9880d681SAndroid Build Coastguard Worker
542*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
543*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %c.addr.0
544*9880d681SAndroid Build Coastguard Worker}
545*9880d681SAndroid Build Coastguard Worker
546*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fmaddps_loop_256:
547*9880d681SAndroid Build Coastguard Worker; CHECK:   vfmadd231ps %ymm1, %ymm0, %ymm2
548*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
549*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfmadd.ps.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfmadd231ps %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
550*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fmaddps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
551*9880d681SAndroid Build Coastguard Workerentry:
552*9880d681SAndroid Build Coastguard Worker  br label %for.cond
553*9880d681SAndroid Build Coastguard Worker
554*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
555*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
556*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
557*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
558*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
559*9880d681SAndroid Build Coastguard Worker
560*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
561*9880d681SAndroid Build Coastguard Worker  br label %for.inc
562*9880d681SAndroid Build Coastguard Worker
563*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
564*9880d681SAndroid Build Coastguard Worker  %0 = call <8 x float> @llvm.x86.fma.vfmadd.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
565*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
566*9880d681SAndroid Build Coastguard Worker  br label %for.cond
567*9880d681SAndroid Build Coastguard Worker
568*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
569*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %c.addr.0
570*9880d681SAndroid Build Coastguard Worker}
571*9880d681SAndroid Build Coastguard Worker
572*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fmsubps_loop_256:
573*9880d681SAndroid Build Coastguard Worker; CHECK:   vfmsub231ps %ymm1, %ymm0, %ymm2
574*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
575*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfmsub.ps.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfmsub231ps %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
576*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fmsubps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
577*9880d681SAndroid Build Coastguard Workerentry:
578*9880d681SAndroid Build Coastguard Worker  br label %for.cond
579*9880d681SAndroid Build Coastguard Worker
580*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
581*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
582*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
583*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
584*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
585*9880d681SAndroid Build Coastguard Worker
586*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
587*9880d681SAndroid Build Coastguard Worker  br label %for.inc
588*9880d681SAndroid Build Coastguard Worker
589*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
590*9880d681SAndroid Build Coastguard Worker  %0 = call <8 x float> @llvm.x86.fma.vfmsub.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
591*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
592*9880d681SAndroid Build Coastguard Worker  br label %for.cond
593*9880d681SAndroid Build Coastguard Worker
594*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
595*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %c.addr.0
596*9880d681SAndroid Build Coastguard Worker}
597*9880d681SAndroid Build Coastguard Worker
598*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fnmaddps_loop_256:
599*9880d681SAndroid Build Coastguard Worker; CHECK:   vfnmadd231ps %ymm1, %ymm0, %ymm2
600*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
601*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfnmadd.ps.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfnmadd231ps %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
602*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fnmaddps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
603*9880d681SAndroid Build Coastguard Workerentry:
604*9880d681SAndroid Build Coastguard Worker  br label %for.cond
605*9880d681SAndroid Build Coastguard Worker
606*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
607*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
608*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
609*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
610*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
611*9880d681SAndroid Build Coastguard Worker
612*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
613*9880d681SAndroid Build Coastguard Worker  br label %for.inc
614*9880d681SAndroid Build Coastguard Worker
615*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
616*9880d681SAndroid Build Coastguard Worker  %0 = call <8 x float> @llvm.x86.fma.vfnmadd.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
617*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
618*9880d681SAndroid Build Coastguard Worker  br label %for.cond
619*9880d681SAndroid Build Coastguard Worker
620*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
621*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %c.addr.0
622*9880d681SAndroid Build Coastguard Worker}
623*9880d681SAndroid Build Coastguard Worker
624*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fnmsubps_loop_256:
625*9880d681SAndroid Build Coastguard Worker; CHECK:   vfnmsub231ps %ymm1, %ymm0, %ymm2
626*9880d681SAndroid Build Coastguard Worker; CHECK:   vmovaps %ymm2, %ymm0
627*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq
; Test input: calls @llvm.x86.fma.vfnmsub.ps.256 once per loop iteration with a
; loop-carried third operand.
;   %iter  - loop bound; the call executes while the counter is (signed) less than %iter.
;   %a, %b - forwarded unchanged as the first and second intrinsic operands.
;   %c     - initial accumulator; returned unchanged if the loop body never executes.
; Returns the accumulator phi %c.addr.0. The FileCheck directives directly above
; expect vfnmsub231ps %ymm1, %ymm0, %ymm2, then vmovaps %ymm2, %ymm0 and retq.
628*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fnmsubps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
629*9880d681SAndroid Build Coastguard Workerentry:
630*9880d681SAndroid Build Coastguard Worker  br label %for.cond
631*9880d681SAndroid Build Coastguard Worker
632*9880d681SAndroid Build Coastguard Workerfor.cond:
  ; Accumulator: %c when arriving from entry, the previous intrinsic result (%0)
  ; when arriving from for.inc.
633*9880d681SAndroid Build Coastguard Worker  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  ; Loop counter: starts at 0 and takes %inc on the back edge.
634*9880d681SAndroid Build Coastguard Worker  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  ; Signed comparison; control leaves for for.end once %i.0 is no longer below %iter.
635*9880d681SAndroid Build Coastguard Worker  %cmp = icmp slt i32 %i.0, %iter
636*9880d681SAndroid Build Coastguard Worker  br i1 %cmp, label %for.body, label %for.end
637*9880d681SAndroid Build Coastguard Worker
638*9880d681SAndroid Build Coastguard Workerfor.body:
  ; Holds no computation; it only forwards to for.inc.
639*9880d681SAndroid Build Coastguard Worker  br label %for.inc
640*9880d681SAndroid Build Coastguard Worker
641*9880d681SAndroid Build Coastguard Workerfor.inc:
  ; The accumulator phi is the third operand, so each result feeds the next
  ; iteration through the phi in for.cond.
642*9880d681SAndroid Build Coastguard Worker  %0 = call <8 x float> @llvm.x86.fma.vfnmsub.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
643*9880d681SAndroid Build Coastguard Worker  %inc = add nsw i32 %i.0, 1
644*9880d681SAndroid Build Coastguard Worker  br label %for.cond
645*9880d681SAndroid Build Coastguard Worker
646*9880d681SAndroid Build Coastguard Workerfor.end:
  ; The returned value is the phi, not %0 directly.
647*9880d681SAndroid Build Coastguard Worker  ret <8 x float> %c.addr.0
648*9880d681SAndroid Build Coastguard Worker}
649*9880d681SAndroid Build Coastguard Worker
; Declarations of the x86 FMA intrinsics on <8 x float> that are called by the
; six *ps_loop_256 functions above. Each takes three <8 x float> operands and
; returns an <8 x float>.
650*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmaddsub.ps.256(<8 x float>, <8 x float>, <8 x float>)
651*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmsubadd.ps.256(<8 x float>, <8 x float>, <8 x float>)
652*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmadd.ps.256(<8 x float>, <8 x float>, <8 x float>)
653*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmsub.ps.256(<8 x float>, <8 x float>, <8 x float>)
654*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfnmadd.ps.256(<8 x float>, <8 x float>, <8 x float>)
655*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfnmsub.ps.256(<8 x float>, <8 x float>, <8 x float>)
656