; RUN: llc < %s -march=arm64 -aarch64-neon-syntax=apple | FileCheck %s

; Instruction-selection tests for the AArch64 NEON reciprocal and reciprocal
; square-root intrinsics. Each function feeds its operands to one intrinsic
; and the directive lines inside the function name the instruction that llc
; is expected to print (Apple NEON syntax, as requested on the llc command
; line above).

; frecps on <2 x float>: both operands are loaded from memory.
define <2 x float> @frecps_2s(<2 x float>* %A, <2 x float>* %B) nounwind {
;CHECK-LABEL: frecps_2s:
;CHECK: frecps.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp2 = load <2 x float>, <2 x float>* %B
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frecps.v2f32(<2 x float> %tmp1, <2 x float> %tmp2)
  ret <2 x float> %tmp3
}

; frecps on <4 x float>.
define <4 x float> @frecps_4s(<4 x float>* %A, <4 x float>* %B) nounwind {
;CHECK-LABEL: frecps_4s:
;CHECK: frecps.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frecps.v4f32(<4 x float> %tmp1, <4 x float> %tmp2)
  ret <4 x float> %tmp3
}

; frecps on <2 x double>.
define <2 x double> @frecps_2d(<2 x double>* %A, <2 x double>* %B) nounwind {
;CHECK-LABEL: frecps_2d:
;CHECK: frecps.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp2 = load <2 x double>, <2 x double>* %B
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frecps.v2f64(<2 x double> %tmp1, <2 x double> %tmp2)
  ret <2 x double> %tmp3
}

declare <2 x float> @llvm.aarch64.neon.frecps.v2f32(<2 x float>, <2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frecps.v4f32(<4 x float>, <4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frecps.v2f64(<2 x double>, <2 x double>) nounwind readnone


; frsqrts on <2 x float>: both operands are loaded from memory.
define <2 x float> @frsqrts_2s(<2 x float>* %A, <2 x float>* %B) nounwind {
;CHECK-LABEL: frsqrts_2s:
;CHECK: frsqrts.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp2 = load <2 x float>, <2 x float>* %B
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frsqrts.v2f32(<2 x float> %tmp1, <2 x float> %tmp2)
  ret <2 x float> %tmp3
}

; frsqrts on <4 x float>.
define <4 x float> @frsqrts_4s(<4 x float>* %A, <4 x float>* %B) nounwind {
;CHECK-LABEL: frsqrts_4s:
;CHECK: frsqrts.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frsqrts.v4f32(<4 x float> %tmp1, <4 x float> %tmp2)
  ret <4 x float> %tmp3
}

; frsqrts on <2 x double>.
define <2 x double> @frsqrts_2d(<2 x double>* %A, <2 x double>* %B) nounwind {
;CHECK-LABEL: frsqrts_2d:
;CHECK: frsqrts.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp2 = load <2 x double>, <2 x double>* %B
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frsqrts.v2f64(<2 x double> %tmp1, <2 x double> %tmp2)
  ret <2 x double> %tmp3
}

declare <2 x float> @llvm.aarch64.neon.frsqrts.v2f32(<2 x float>, <2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frsqrts.v4f32(<4 x float>, <4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frsqrts.v2f64(<2 x double>, <2 x double>) nounwind readnone

; frecpe on <2 x float>: single operand loaded from memory.
define <2 x float> @frecpe_2s(<2 x float>* %A) nounwind {
;CHECK-LABEL: frecpe_2s:
;CHECK: frecpe.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frecpe.v2f32(<2 x float> %tmp1)
  ret <2 x float> %tmp3
}
; frecpe on <4 x float>: single operand loaded from memory.
define <4 x float> @frecpe_4s(<4 x float>* %A) nounwind {
;CHECK-LABEL: frecpe_4s:
;CHECK: frecpe.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frecpe.v4f32(<4 x float> %tmp1)
  ret <4 x float> %tmp3
}

; frecpe on <2 x double>.
define <2 x double> @frecpe_2d(<2 x double>* %A) nounwind {
;CHECK-LABEL: frecpe_2d:
;CHECK: frecpe.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frecpe.v2f64(<2 x double> %tmp1)
  ret <2 x double> %tmp3
}

; Scalar frecpe on float: the result is expected in s0, the source may be
; any s register.
define float @frecpe_s(float* %A) nounwind {
;CHECK-LABEL: frecpe_s:
;CHECK: frecpe s0, {{s[0-9]+}}
  %tmp1 = load float, float* %A
  %tmp3 = call float @llvm.aarch64.neon.frecpe.f32(float %tmp1)
  ret float %tmp3
}

; Scalar frecpe on double: the result is expected in d0, the source may be
; any d register.
define double @frecpe_d(double* %A) nounwind {
;CHECK-LABEL: frecpe_d:
;CHECK: frecpe d0, {{d[0-9]+}}
  %tmp1 = load double, double* %A
  %tmp3 = call double @llvm.aarch64.neon.frecpe.f64(double %tmp1)
  ret double %tmp3
}

declare <2 x float> @llvm.aarch64.neon.frecpe.v2f32(<2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frecpe.v4f32(<4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frecpe.v2f64(<2 x double>) nounwind readnone
declare float @llvm.aarch64.neon.frecpe.f32(float) nounwind readnone
declare double @llvm.aarch64.neon.frecpe.f64(double) nounwind readnone

; Scalar frecpx on float (only scalar forms of this intrinsic are tested here).
define float @frecpx_s(float* %A) nounwind {
;CHECK-LABEL: frecpx_s:
;CHECK: frecpx s0, {{s[0-9]+}}
  %tmp1 = load float, float* %A
  %tmp3 = call float @llvm.aarch64.neon.frecpx.f32(float %tmp1)
  ret float %tmp3
}

; Scalar frecpx on double.
define double @frecpx_d(double* %A) nounwind {
;CHECK-LABEL: frecpx_d:
;CHECK: frecpx d0, {{d[0-9]+}}
  %tmp1 = load double, double* %A
  %tmp3 = call double @llvm.aarch64.neon.frecpx.f64(double %tmp1)
  ret double %tmp3
}

declare float @llvm.aarch64.neon.frecpx.f32(float) nounwind readnone
declare double @llvm.aarch64.neon.frecpx.f64(double) nounwind readnone

; frsqrte on <2 x float>: single operand loaded from memory.
define <2 x float> @frsqrte_2s(<2 x float>* %A) nounwind {
;CHECK-LABEL: frsqrte_2s:
;CHECK: frsqrte.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frsqrte.v2f32(<2 x float> %tmp1)
  ret <2 x float> %tmp3
}

; frsqrte on <4 x float>.
define <4 x float> @frsqrte_4s(<4 x float>* %A) nounwind {
;CHECK-LABEL: frsqrte_4s:
;CHECK: frsqrte.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frsqrte.v4f32(<4 x float> %tmp1)
  ret <4 x float> %tmp3
}

; frsqrte on <2 x double>.
define <2 x double> @frsqrte_2d(<2 x double>* %A) nounwind {
;CHECK-LABEL: frsqrte_2d:
;CHECK: frsqrte.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frsqrte.v2f64(<2 x double> %tmp1)
  ret <2 x double> %tmp3
}

; Scalar frsqrte on float: result expected in s0.
define float @frsqrte_s(float* %A) nounwind {
;CHECK-LABEL: frsqrte_s:
;CHECK: frsqrte s0, {{s[0-9]+}}
  %tmp1 = load float, float* %A
  %tmp3 = call float @llvm.aarch64.neon.frsqrte.f32(float %tmp1)
  ret float %tmp3
}

; Scalar frsqrte on double: result expected in d0.
define double @frsqrte_d(double* %A) nounwind {
;CHECK-LABEL: frsqrte_d:
;CHECK: frsqrte d0, {{d[0-9]+}}
  %tmp1 = load double, double* %A
  %tmp3 = call double @llvm.aarch64.neon.frsqrte.f64(double %tmp1)
  ret double %tmp3
}

declare <2 x float> @llvm.aarch64.neon.frsqrte.v2f32(<2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frsqrte.v4f32(<4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frsqrte.v2f64(<2 x double>) nounwind readnone
declare float @llvm.aarch64.neon.frsqrte.f32(float) nounwind readnone
declare double @llvm.aarch64.neon.frsqrte.f64(double) nounwind readnone

; urecpe on <2 x i32>: integer-vector operand loaded from memory.
define <2 x i32> @urecpe_2s(<2 x i32>* %A) nounwind {
;CHECK-LABEL: urecpe_2s:
;CHECK: urecpe.2s
  %tmp1 = load <2 x i32>, <2 x i32>* %A
  %tmp3 = call <2 x i32> @llvm.aarch64.neon.urecpe.v2i32(<2 x i32> %tmp1)
  ret <2 x i32> %tmp3
}

; urecpe on <4 x i32>.
define <4 x i32> @urecpe_4s(<4 x i32>* %A) nounwind {
;CHECK-LABEL: urecpe_4s:
;CHECK: urecpe.4s
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp3 = call <4 x i32> @llvm.aarch64.neon.urecpe.v4i32(<4 x i32> %tmp1)
  ret <4 x i32> %tmp3
}

declare <2 x i32> @llvm.aarch64.neon.urecpe.v2i32(<2 x i32>) nounwind readnone
declare <4 x i32> @llvm.aarch64.neon.urecpe.v4i32(<4 x i32>) nounwind readnone

; ursqrte on <2 x i32>: integer-vector operand loaded from memory.
define <2 x i32> @ursqrte_2s(<2 x i32>* %A) nounwind {
;CHECK-LABEL: ursqrte_2s:
;CHECK: ursqrte.2s
  %tmp1 = load <2 x i32>, <2 x i32>* %A
  %tmp3 = call <2 x i32> @llvm.aarch64.neon.ursqrte.v2i32(<2 x i32> %tmp1)
  ret <2 x i32> %tmp3
}

; ursqrte on <4 x i32>.
define <4 x i32> @ursqrte_4s(<4 x i32>* %A) nounwind {
;CHECK-LABEL: ursqrte_4s:
;CHECK: ursqrte.4s
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp3 = call <4 x i32> @llvm.aarch64.neon.ursqrte.v4i32(<4 x i32> %tmp1)
  ret <4 x i32> %tmp3
}

declare <2 x i32> @llvm.aarch64.neon.ursqrte.v2i32(<2 x i32>) nounwind readnone
declare <4 x i32> @llvm.aarch64.neon.ursqrte.v4i32(<4 x i32>) nounwind readnone

; Scalar frsqrts on float with both operands passed as arguments: the
; instruction is expected to operate on s0 and s1 in place and be followed
; immediately by the return.
define float @f1(float %a, float %b) nounwind readnone optsize ssp {
; CHECK-LABEL: f1:
; CHECK: frsqrts s0, s0, s1
; CHECK-NEXT: ret
  %vrsqrtss.i = tail call float @llvm.aarch64.neon.frsqrts.f32(float %a, float %b) nounwind
  ret float %vrsqrtss.i
}

; Scalar frsqrts on double with both operands passed as arguments: the
; instruction is expected to operate on d0 and d1 in place and be followed
; immediately by the return.
define double @f2(double %a, double %b) nounwind readnone optsize ssp {
; CHECK-LABEL: f2:
; CHECK: frsqrts d0, d0, d1
; CHECK-NEXT: ret
  %vrsqrtsd.i = tail call double @llvm.aarch64.neon.frsqrts.f64(double %a, double %b) nounwind
  ret double %vrsqrtsd.i
}

declare double @llvm.aarch64.neon.frsqrts.f64(double, double) nounwind readnone
declare float @llvm.aarch64.neon.frsqrts.f32(float, float) nounwind readnone