; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx2,+fma | FileCheck %s

; 128-bit double-precision fmaddsub in a counted loop.
; The loop-carried phi %c.addr.0 starts as %c, is passed as the third operand
; of the intrinsic on every iteration, and is the value returned at for.end.
; The FileCheck directives require the 231 instruction form with %xmm2 as the
; last operand, a later vmovaps of %xmm2 into %xmm0, and retq on the very next
; line after that move.
; CHECK-LABEL: fmaddsubpd_loop_128:
; CHECK: vfmaddsub231pd %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmaddsubpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmaddsub.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; 128-bit double-precision variants (fmsubadd, fmadd, fmsub, fnmadd, fnmsub).
; Every function has the same shape: a loop counted by %i.0 against %iter in
; which the loop-carried phi %c.addr.0 (initially %c) is passed as the third
; operand of the FMA intrinsic and is returned at for.end. The FileCheck
; directives for each function require the 231 instruction form with %xmm2 as
; the last operand, a later vmovaps of %xmm2 into %xmm0, and retq on the line
; right after that move.

; CHECK-LABEL: fmsubaddpd_loop_128:
; CHECK: vfmsubadd231pd %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmsubaddpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmsubadd.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; CHECK-LABEL: fmaddpd_loop_128:
; CHECK: vfmadd231pd %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmaddpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmadd.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; CHECK-LABEL: fmsubpd_loop_128:
; CHECK: vfmsub231pd %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fmsubpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfmsub.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; CHECK-LABEL: fnmaddpd_loop_128:
; CHECK: vfnmadd231pd %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fnmaddpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfnmadd.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; CHECK-LABEL: fnmsubpd_loop_128:
; CHECK: vfnmsub231pd %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <2 x double> @fnmsubpd_loop_128(i32 %iter, <2 x double> %a, <2 x double> %b, <2 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <2 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <2 x double> @llvm.x86.fma.vfnmsub.pd(<2 x double> %a, <2 x double> %b, <2 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <2 x double> %c.addr.0
}

; Declarations of the 128-bit double-precision FMA intrinsics called in this file.
declare <2 x double> @llvm.x86.fma.vfmaddsub.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfmsubadd.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfmadd.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfmsub.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfnmadd.pd(<2 x double>, <2 x double>, <2 x double>)
declare <2 x double> @llvm.x86.fma.vfnmsub.pd(<2 x double>, <2 x double>, <2 x double>)


; 128-bit single-precision variants.
; Same shape for every function in this section: a loop counted by %i.0
; against %iter in which the loop-carried phi %c.addr.0 (initially %c) is the
; third operand of the FMA intrinsic and is returned at for.end. The FileCheck
; directives require the 231 instruction form with %xmm2 as the last operand,
; a later vmovaps of %xmm2 into %xmm0, and retq on the line right after it.

; CHECK-LABEL: fmaddsubps_loop_128:
; CHECK: vfmaddsub231ps %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmaddsubps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmaddsub.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; CHECK-LABEL: fmsubaddps_loop_128:
; CHECK: vfmsubadd231ps %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmsubaddps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmsubadd.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; CHECK-LABEL: fmaddps_loop_128:
; CHECK: vfmadd231ps %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmaddps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; CHECK-LABEL: fmsubps_loop_128:
; CHECK: vfmsub231ps %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fmsubps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfmsub.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; CHECK-LABEL: fnmaddps_loop_128:
; CHECK: vfnmadd231ps %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fnmaddps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfnmadd.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; CHECK-LABEL: fnmsubps_loop_128:
; CHECK: vfnmsub231ps %xmm1, %xmm0, %xmm2
; CHECK: vmovaps %xmm2, %xmm0
; CHECK-NEXT: retq
define <4 x float> @fnmsubps_loop_128(i32 %iter, <4 x float> %a, <4 x float> %b, <4 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x float> @llvm.x86.fma.vfnmsub.ps(<4 x float> %a, <4 x float> %b, <4 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x float> %c.addr.0
}

; Declarations of the 128-bit single-precision FMA intrinsics called above.
declare <4 x float> @llvm.x86.fma.vfmaddsub.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfmsubadd.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfmadd.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfmsub.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfnmadd.ps(<4 x float>, <4 x float>, <4 x float>)
declare <4 x float> @llvm.x86.fma.vfnmsub.ps(<4 x float>, <4 x float>, <4 x float>)

; 256-bit double-precision variants: same loop shape as above, using
; <4 x double> values, the .pd.256 intrinsics, and %ymm registers in the
; expected output.

; CHECK-LABEL: fmaddsubpd_loop_256:
; CHECK: vfmaddsub231pd %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmaddsubpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmaddsub.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; CHECK-LABEL: fmsubaddpd_loop_256:
; CHECK: vfmsubadd231pd %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmsubaddpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmsubadd.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; CHECK-LABEL: fmaddpd_loop_256:
; CHECK: vfmadd231pd %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmaddpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmadd.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; CHECK-LABEL: fmsubpd_loop_256:
; CHECK: vfmsub231pd %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fmsubpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfmsub.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; CHECK-LABEL: fnmaddpd_loop_256:
; CHECK: vfnmadd231pd %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fnmaddpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfnmadd.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; CHECK-LABEL: fnmsubpd_loop_256:
; CHECK: vfnmsub231pd %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <4 x double> @fnmsubpd_loop_256(i32 %iter, <4 x double> %a, <4 x double> %b, <4 x double> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <4 x double> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <4 x double> @llvm.x86.fma.vfnmsub.pd.256(<4 x double> %a, <4 x double> %b, <4 x double> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <4 x double> %c.addr.0
}

; Declarations of the 256-bit double-precision FMA intrinsics called above.
declare <4 x double> @llvm.x86.fma.vfmaddsub.pd.256(<4 x double>, <4 x double>, <4 x double>)
declare <4 x double> @llvm.x86.fma.vfmsubadd.pd.256(<4 x double>, <4 x double>, <4 x double>)
declare <4 x double> @llvm.x86.fma.vfmadd.pd.256(<4 x double>, <4 x double>, <4 x double>)
declare <4 x double> @llvm.x86.fma.vfmsub.pd.256(<4 x double>, <4 x double>, <4 x double>)
declare <4 x double> @llvm.x86.fma.vfnmadd.pd.256(<4 x double>, <4 x double>, <4 x double>)
declare <4 x double> @llvm.x86.fma.vfnmsub.pd.256(<4 x double>, <4 x double>, <4 x double>)


; 256-bit single-precision variants: same loop shape, using <8 x float>
; values, the .ps.256 intrinsics, and %ymm registers in the expected output.

; CHECK-LABEL: fmaddsubps_loop_256:
; CHECK: vfmaddsub231ps %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
define <8 x float> @fmaddsubps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) {
entry:
  br label %for.cond

for.cond:
  %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ]
  %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ]
  %cmp = icmp slt i32 %i.0, %iter
  br i1 %cmp, label %for.body, label %for.end

for.body:
  br label %for.inc

for.inc:
  %0 = call <8 x float> @llvm.x86.fma.vfmaddsub.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0)
  %inc = add nsw i32 %i.0, 1
  br label %for.cond

for.end:
  ret <8 x float> %c.addr.0
}

; CHECK-LABEL: fmsubaddps_loop_256:
; CHECK: vfmsubadd231ps %ymm1, %ymm0, %ymm2
; CHECK: vmovaps %ymm2, %ymm0
; CHECK-NEXT: retq
Build Coastguard Workerdefine <8 x float> @fmsubaddps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) { 525*9880d681SAndroid Build Coastguard Workerentry: 526*9880d681SAndroid Build Coastguard Worker br label %for.cond 527*9880d681SAndroid Build Coastguard Worker 528*9880d681SAndroid Build Coastguard Workerfor.cond: 529*9880d681SAndroid Build Coastguard Worker %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ] 530*9880d681SAndroid Build Coastguard Worker %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ] 531*9880d681SAndroid Build Coastguard Worker %cmp = icmp slt i32 %i.0, %iter 532*9880d681SAndroid Build Coastguard Worker br i1 %cmp, label %for.body, label %for.end 533*9880d681SAndroid Build Coastguard Worker 534*9880d681SAndroid Build Coastguard Workerfor.body: 535*9880d681SAndroid Build Coastguard Worker br label %for.inc 536*9880d681SAndroid Build Coastguard Worker 537*9880d681SAndroid Build Coastguard Workerfor.inc: 538*9880d681SAndroid Build Coastguard Worker %0 = call <8 x float> @llvm.x86.fma.vfmsubadd.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0) 539*9880d681SAndroid Build Coastguard Worker %inc = add nsw i32 %i.0, 1 540*9880d681SAndroid Build Coastguard Worker br label %for.cond 541*9880d681SAndroid Build Coastguard Worker 542*9880d681SAndroid Build Coastguard Workerfor.end: 543*9880d681SAndroid Build Coastguard Worker ret <8 x float> %c.addr.0 544*9880d681SAndroid Build Coastguard Worker} 545*9880d681SAndroid Build Coastguard Worker 546*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fmaddps_loop_256: 547*9880d681SAndroid Build Coastguard Worker; CHECK: vfmadd231ps %ymm1, %ymm0, %ymm2 548*9880d681SAndroid Build Coastguard Worker; CHECK: vmovaps %ymm2, %ymm0 549*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq 550*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fmaddps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) { 551*9880d681SAndroid Build Coastguard 
Workerentry: 552*9880d681SAndroid Build Coastguard Worker br label %for.cond 553*9880d681SAndroid Build Coastguard Worker 554*9880d681SAndroid Build Coastguard Workerfor.cond: 555*9880d681SAndroid Build Coastguard Worker %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ] 556*9880d681SAndroid Build Coastguard Worker %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ] 557*9880d681SAndroid Build Coastguard Worker %cmp = icmp slt i32 %i.0, %iter 558*9880d681SAndroid Build Coastguard Worker br i1 %cmp, label %for.body, label %for.end 559*9880d681SAndroid Build Coastguard Worker 560*9880d681SAndroid Build Coastguard Workerfor.body: 561*9880d681SAndroid Build Coastguard Worker br label %for.inc 562*9880d681SAndroid Build Coastguard Worker 563*9880d681SAndroid Build Coastguard Workerfor.inc: 564*9880d681SAndroid Build Coastguard Worker %0 = call <8 x float> @llvm.x86.fma.vfmadd.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0) 565*9880d681SAndroid Build Coastguard Worker %inc = add nsw i32 %i.0, 1 566*9880d681SAndroid Build Coastguard Worker br label %for.cond 567*9880d681SAndroid Build Coastguard Worker 568*9880d681SAndroid Build Coastguard Workerfor.end: 569*9880d681SAndroid Build Coastguard Worker ret <8 x float> %c.addr.0 570*9880d681SAndroid Build Coastguard Worker} 571*9880d681SAndroid Build Coastguard Worker 572*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fmsubps_loop_256: 573*9880d681SAndroid Build Coastguard Worker; CHECK: vfmsub231ps %ymm1, %ymm0, %ymm2 574*9880d681SAndroid Build Coastguard Worker; CHECK: vmovaps %ymm2, %ymm0 575*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq 576*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fmsubps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) { 577*9880d681SAndroid Build Coastguard Workerentry: 578*9880d681SAndroid Build Coastguard Worker br label %for.cond 579*9880d681SAndroid Build Coastguard Worker 580*9880d681SAndroid Build Coastguard 
Workerfor.cond: 581*9880d681SAndroid Build Coastguard Worker %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ] 582*9880d681SAndroid Build Coastguard Worker %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ] 583*9880d681SAndroid Build Coastguard Worker %cmp = icmp slt i32 %i.0, %iter 584*9880d681SAndroid Build Coastguard Worker br i1 %cmp, label %for.body, label %for.end 585*9880d681SAndroid Build Coastguard Worker 586*9880d681SAndroid Build Coastguard Workerfor.body: 587*9880d681SAndroid Build Coastguard Worker br label %for.inc 588*9880d681SAndroid Build Coastguard Worker 589*9880d681SAndroid Build Coastguard Workerfor.inc: 590*9880d681SAndroid Build Coastguard Worker %0 = call <8 x float> @llvm.x86.fma.vfmsub.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0) 591*9880d681SAndroid Build Coastguard Worker %inc = add nsw i32 %i.0, 1 592*9880d681SAndroid Build Coastguard Worker br label %for.cond 593*9880d681SAndroid Build Coastguard Worker 594*9880d681SAndroid Build Coastguard Workerfor.end: 595*9880d681SAndroid Build Coastguard Worker ret <8 x float> %c.addr.0 596*9880d681SAndroid Build Coastguard Worker} 597*9880d681SAndroid Build Coastguard Worker 598*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fnmaddps_loop_256: 599*9880d681SAndroid Build Coastguard Worker; CHECK: vfnmadd231ps %ymm1, %ymm0, %ymm2 600*9880d681SAndroid Build Coastguard Worker; CHECK: vmovaps %ymm2, %ymm0 601*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq 602*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fnmaddps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) { 603*9880d681SAndroid Build Coastguard Workerentry: 604*9880d681SAndroid Build Coastguard Worker br label %for.cond 605*9880d681SAndroid Build Coastguard Worker 606*9880d681SAndroid Build Coastguard Workerfor.cond: 607*9880d681SAndroid Build Coastguard Worker %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ] 608*9880d681SAndroid Build Coastguard Worker 
%i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ] 609*9880d681SAndroid Build Coastguard Worker %cmp = icmp slt i32 %i.0, %iter 610*9880d681SAndroid Build Coastguard Worker br i1 %cmp, label %for.body, label %for.end 611*9880d681SAndroid Build Coastguard Worker 612*9880d681SAndroid Build Coastguard Workerfor.body: 613*9880d681SAndroid Build Coastguard Worker br label %for.inc 614*9880d681SAndroid Build Coastguard Worker 615*9880d681SAndroid Build Coastguard Workerfor.inc: 616*9880d681SAndroid Build Coastguard Worker %0 = call <8 x float> @llvm.x86.fma.vfnmadd.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0) 617*9880d681SAndroid Build Coastguard Worker %inc = add nsw i32 %i.0, 1 618*9880d681SAndroid Build Coastguard Worker br label %for.cond 619*9880d681SAndroid Build Coastguard Worker 620*9880d681SAndroid Build Coastguard Workerfor.end: 621*9880d681SAndroid Build Coastguard Worker ret <8 x float> %c.addr.0 622*9880d681SAndroid Build Coastguard Worker} 623*9880d681SAndroid Build Coastguard Worker 624*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: fnmsubps_loop_256: 625*9880d681SAndroid Build Coastguard Worker; CHECK: vfnmsub231ps %ymm1, %ymm0, %ymm2 626*9880d681SAndroid Build Coastguard Worker; CHECK: vmovaps %ymm2, %ymm0 627*9880d681SAndroid Build Coastguard Worker; CHECK-NEXT: retq 628*9880d681SAndroid Build Coastguard Workerdefine <8 x float> @fnmsubps_loop_256(i32 %iter, <8 x float> %a, <8 x float> %b, <8 x float> %c) { 629*9880d681SAndroid Build Coastguard Workerentry: 630*9880d681SAndroid Build Coastguard Worker br label %for.cond 631*9880d681SAndroid Build Coastguard Worker 632*9880d681SAndroid Build Coastguard Workerfor.cond: 633*9880d681SAndroid Build Coastguard Worker %c.addr.0 = phi <8 x float> [ %c, %entry ], [ %0, %for.inc ] 634*9880d681SAndroid Build Coastguard Worker %i.0 = phi i32 [ 0, %entry ], [ %inc, %for.inc ] 635*9880d681SAndroid Build Coastguard Worker %cmp = icmp slt i32 %i.0, %iter 636*9880d681SAndroid Build Coastguard 
Worker br i1 %cmp, label %for.body, label %for.end 637*9880d681SAndroid Build Coastguard Worker 638*9880d681SAndroid Build Coastguard Workerfor.body: 639*9880d681SAndroid Build Coastguard Worker br label %for.inc 640*9880d681SAndroid Build Coastguard Worker 641*9880d681SAndroid Build Coastguard Workerfor.inc: 642*9880d681SAndroid Build Coastguard Worker %0 = call <8 x float> @llvm.x86.fma.vfnmsub.ps.256(<8 x float> %a, <8 x float> %b, <8 x float> %c.addr.0) 643*9880d681SAndroid Build Coastguard Worker %inc = add nsw i32 %i.0, 1 644*9880d681SAndroid Build Coastguard Worker br label %for.cond 645*9880d681SAndroid Build Coastguard Worker 646*9880d681SAndroid Build Coastguard Workerfor.end: 647*9880d681SAndroid Build Coastguard Worker ret <8 x float> %c.addr.0 648*9880d681SAndroid Build Coastguard Worker} 649*9880d681SAndroid Build Coastguard Worker 650*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmaddsub.ps.256(<8 x float>, <8 x float>, <8 x float>) 651*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmsubadd.ps.256(<8 x float>, <8 x float>, <8 x float>) 652*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmadd.ps.256(<8 x float>, <8 x float>, <8 x float>) 653*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfmsub.ps.256(<8 x float>, <8 x float>, <8 x float>) 654*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfnmadd.ps.256(<8 x float>, <8 x float>, <8 x float>) 655*9880d681SAndroid Build Coastguard Workerdeclare <8 x float> @llvm.x86.fma.vfnmsub.ps.256(<8 x float>, <8 x float>, <8 x float>) 656