; RUN: llc < %s -verify-machineinstrs -mtriple=aarch64-none-linux-gnu -mattr=+neon -fp-contract=fast | FileCheck %s

; Tests selection of the AArch64 NEON vector fmla/fmls instructions for the
; <2 x float>, <4 x float> and <2 x double> types.
;
; Every function is anchored with its own label directive so that each
; pattern is matched inside the function it belongs to, rather than relying
; on the global order of matches across the whole output.

; First set of tests: a separate fmul feeding an fadd/fsub. The RUN line passes
; -fp-contract=fast, and the pair is expected to be selected as one fmla/fmls.

define <2 x float> @fmla2xfloat(<2 x float> %A, <2 x float> %B, <2 x float> %C) {
; CHECK-LABEL: fmla2xfloat:
; CHECK: fmla {{v[0-9]+}}.2s, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
  %tmp1 = fmul <2 x float> %A, %B
  %tmp2 = fadd <2 x float> %C, %tmp1
  ret <2 x float> %tmp2
}

define <4 x float> @fmla4xfloat(<4 x float> %A, <4 x float> %B, <4 x float> %C) {
; CHECK-LABEL: fmla4xfloat:
; CHECK: fmla {{v[0-9]+}}.4s, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
  %tmp1 = fmul <4 x float> %A, %B
  %tmp2 = fadd <4 x float> %C, %tmp1
  ret <4 x float> %tmp2
}

define <2 x double> @fmla2xdouble(<2 x double> %A, <2 x double> %B, <2 x double> %C) {
; CHECK-LABEL: fmla2xdouble:
; CHECK: fmla {{v[0-9]+}}.2d, {{v[0-9]+}}.2d, {{v[0-9]+}}.2d
  %tmp1 = fmul <2 x double> %A, %B
  %tmp2 = fadd <2 x double> %C, %tmp1
  ret <2 x double> %tmp2
}


define <2 x float> @fmls2xfloat(<2 x float> %A, <2 x float> %B, <2 x float> %C) {
; CHECK-LABEL: fmls2xfloat:
; CHECK: fmls {{v[0-9]+}}.2s, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
  %tmp1 = fmul <2 x float> %A, %B
  %tmp2 = fsub <2 x float> %C, %tmp1
  ret <2 x float> %tmp2
}

define <4 x float> @fmls4xfloat(<4 x float> %A, <4 x float> %B, <4 x float> %C) {
; CHECK-LABEL: fmls4xfloat:
; CHECK: fmls {{v[0-9]+}}.4s, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
  %tmp1 = fmul <4 x float> %A, %B
  %tmp2 = fsub <4 x float> %C, %tmp1
  ret <4 x float> %tmp2
}

define <2 x double> @fmls2xdouble(<2 x double> %A, <2 x double> %B, <2 x double> %C) {
; CHECK-LABEL: fmls2xdouble:
; CHECK: fmls {{v[0-9]+}}.2d, {{v[0-9]+}}.2d, {{v[0-9]+}}.2d
  %tmp1 = fmul <2 x double> %A, %B
  %tmp2 = fsub <2 x double> %C, %tmp1
  ret <2 x double> %tmp2
}


; Another set of tests for when the llvm.fma intrinsic is used directly.
; The fmls variants negate the first multiplicand (fsub from -0.0) before the
; call and expect the negation to be absorbed into an fmls.

declare <2 x float> @llvm.fma.v2f32(<2 x float>, <2 x float>, <2 x float>)
declare <4 x float> @llvm.fma.v4f32(<4 x float>, <4 x float>, <4 x float>)
declare <2 x double> @llvm.fma.v2f64(<2 x double>, <2 x double>, <2 x double>)

define <2 x float> @fmla2xfloat_fused(<2 x float> %A, <2 x float> %B, <2 x float> %C) {
; CHECK-LABEL: fmla2xfloat_fused:
; CHECK: fmla {{v[0-9]+}}.2s, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
  %val = call <2 x float> @llvm.fma.v2f32(<2 x float> %A, <2 x float> %B, <2 x float> %C)
  ret <2 x float> %val
}

define <4 x float> @fmla4xfloat_fused(<4 x float> %A, <4 x float> %B, <4 x float> %C) {
; CHECK-LABEL: fmla4xfloat_fused:
; CHECK: fmla {{v[0-9]+}}.4s, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
  %val = call <4 x float> @llvm.fma.v4f32(<4 x float> %A, <4 x float> %B, <4 x float> %C)
  ret <4 x float> %val
}

define <2 x double> @fmla2xdouble_fused(<2 x double> %A, <2 x double> %B, <2 x double> %C) {
; CHECK-LABEL: fmla2xdouble_fused:
; CHECK: fmla {{v[0-9]+}}.2d, {{v[0-9]+}}.2d, {{v[0-9]+}}.2d
  %val = call <2 x double> @llvm.fma.v2f64(<2 x double> %A, <2 x double> %B, <2 x double> %C)
  ret <2 x double> %val
}

define <2 x float> @fmls2xfloat_fused(<2 x float> %A, <2 x float> %B, <2 x float> %C) {
; CHECK-LABEL: fmls2xfloat_fused:
; CHECK: fmls {{v[0-9]+}}.2s, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
  %negA = fsub <2 x float> <float -0.0, float -0.0>, %A
  %val = call <2 x float> @llvm.fma.v2f32(<2 x float> %negA, <2 x float> %B, <2 x float> %C)
  ret <2 x float> %val
}

define <4 x float> @fmls4xfloat_fused(<4 x float> %A, <4 x float> %B, <4 x float> %C) {
; CHECK-LABEL: fmls4xfloat_fused:
; CHECK: fmls {{v[0-9]+}}.4s, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
  %negA = fsub <4 x float> <float -0.0, float -0.0, float -0.0, float -0.0>, %A
  %val = call <4 x float> @llvm.fma.v4f32(<4 x float> %negA, <4 x float> %B, <4 x float> %C)
  ret <4 x float> %val
}

define <2 x double> @fmls2xdouble_fused(<2 x double> %A, <2 x double> %B, <2 x double> %C) {
; CHECK-LABEL: fmls2xdouble_fused:
; CHECK: fmls {{v[0-9]+}}.2d, {{v[0-9]+}}.2d, {{v[0-9]+}}.2d
  %negA = fsub <2 x double> <double -0.0, double -0.0>, %A
  %val = call <2 x double> @llvm.fma.v2f64(<2 x double> %negA, <2 x double> %B, <2 x double> %C)
  ret <2 x double> %val
}

; Tests for the llvm.fmuladd intrinsic, which is expected to be selected as
; fmla here.

declare <2 x float> @llvm.fmuladd.v2f32(<2 x float>, <2 x float>, <2 x float>)
declare <4 x float> @llvm.fmuladd.v4f32(<4 x float>, <4 x float>, <4 x float>)
declare <2 x double> @llvm.fmuladd.v2f64(<2 x double>, <2 x double>, <2 x double>)

define <2 x float> @fmuladd2xfloat(<2 x float> %A, <2 x float> %B, <2 x float> %C) {
; CHECK-LABEL: fmuladd2xfloat:
; CHECK: fmla {{v[0-9]+}}.2s, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
  %val = call <2 x float> @llvm.fmuladd.v2f32(<2 x float> %A, <2 x float> %B, <2 x float> %C)
  ret <2 x float> %val
}

define <4 x float> @fmuladd4xfloat_fused(<4 x float> %A, <4 x float> %B, <4 x float> %C) {
; CHECK-LABEL: fmuladd4xfloat_fused:
; CHECK: fmla {{v[0-9]+}}.4s, {{v[0-9]+}}.4s, {{v[0-9]+}}.4s
  %val = call <4 x float> @llvm.fmuladd.v4f32(<4 x float> %A, <4 x float> %B, <4 x float> %C)
  ret <4 x float> %val
}

define <2 x double> @fmuladd2xdouble_fused(<2 x double> %A, <2 x double> %B, <2 x double> %C) {
; CHECK-LABEL: fmuladd2xdouble_fused:
; CHECK: fmla {{v[0-9]+}}.2d, {{v[0-9]+}}.2d, {{v[0-9]+}}.2d
  %val = call <2 x double> @llvm.fmuladd.v2f64(<2 x double> %A, <2 x double> %B, <2 x double> %C)
  ret <2 x double> %val
}


; Another set of tests that check the single-use requirement on the multiply:
; here the fmul result (%tmp1) has two uses, so it must not be folded into an
; fmla/fmls.

define <2 x float> @fmla2xfloati_su(<2 x float> %A, <2 x float> %B, <2 x float> %C) {
; CHECK-LABEL: fmla2xfloati_su:
; CHECK-NOT: fmla {{v[0-9]+}}.2s, {{v[0-9]+}}.2s, {{v[0-9]+}}.2s
  %tmp1 = fmul <2 x float> %A, %B
  %tmp2 = fadd <2 x float> %C, %tmp1
  %tmp3 = fadd <2 x float> %tmp2, %tmp1
  ret <2 x float> %tmp3
}

define <2 x double> @fmls2xdouble_su(<2 x double> %A, <2 x double> %B, <2 x double> %C) {
; CHECK-LABEL: fmls2xdouble_su:
; CHECK-NOT: fmls {{v[0-9]+}}.2d, {{v[0-9]+}}.2d, {{v[0-9]+}}.2d
  %tmp1 = fmul <2 x double> %A, %B
  %tmp2 = fsub <2 x double> %C, %tmp1
  %tmp3 = fsub <2 x double> %tmp2, %tmp1
  ret <2 x double> %tmp3
}