; xref: /aosp_15_r20/external/llvm/test/CodeGen/AArch64/arm64-vsqrt.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
; RUN: llc < %s -march=arm64 -aarch64-neon-syntax=apple | FileCheck %s

; Loads two <2 x float> operands from %A and %B and passes them to
; @llvm.aarch64.neon.frecps.v2f32; the generated code is expected to
; contain an frecps.2s instruction.
define <2 x float> @frecps_2s(<2 x float>* %A, <2 x float>* %B) nounwind {
; CHECK-LABEL: frecps_2s:
; CHECK: frecps.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp2 = load <2 x float>, <2 x float>* %B
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frecps.v2f32(<2 x float> %tmp1, <2 x float> %tmp2)
  ret <2 x float> %tmp3
}

; Loads two <4 x float> operands from %A and %B and passes them to
; @llvm.aarch64.neon.frecps.v4f32; the generated code is expected to
; contain an frecps.4s instruction.
define <4 x float> @frecps_4s(<4 x float>* %A, <4 x float>* %B) nounwind {
; CHECK-LABEL: frecps_4s:
; CHECK: frecps.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frecps.v4f32(<4 x float> %tmp1, <4 x float> %tmp2)
  ret <4 x float> %tmp3
}

; Loads two <2 x double> operands from %A and %B and passes them to
; @llvm.aarch64.neon.frecps.v2f64; the generated code is expected to
; contain an frecps.2d instruction.
define <2 x double> @frecps_2d(<2 x double>* %A, <2 x double>* %B) nounwind {
; CHECK-LABEL: frecps_2d:
; CHECK: frecps.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp2 = load <2 x double>, <2 x double>* %B
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frecps.v2f64(<2 x double> %tmp1, <2 x double> %tmp2)
  ret <2 x double> %tmp3
}

; Declarations of the two-operand frecps intrinsics called by the
; frecps_2s, frecps_4s and frecps_2d tests.
declare <2 x float> @llvm.aarch64.neon.frecps.v2f32(<2 x float>, <2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frecps.v4f32(<4 x float>, <4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frecps.v2f64(<2 x double>, <2 x double>) nounwind readnone


; Loads two <2 x float> operands from %A and %B and passes them to
; @llvm.aarch64.neon.frsqrts.v2f32; the generated code is expected to
; contain an frsqrts.2s instruction.
define <2 x float> @frsqrts_2s(<2 x float>* %A, <2 x float>* %B) nounwind {
; CHECK-LABEL: frsqrts_2s:
; CHECK: frsqrts.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp2 = load <2 x float>, <2 x float>* %B
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frsqrts.v2f32(<2 x float> %tmp1, <2 x float> %tmp2)
  ret <2 x float> %tmp3
}

; Loads two <4 x float> operands from %A and %B and passes them to
; @llvm.aarch64.neon.frsqrts.v4f32; the generated code is expected to
; contain an frsqrts.4s instruction.
define <4 x float> @frsqrts_4s(<4 x float>* %A, <4 x float>* %B) nounwind {
; CHECK-LABEL: frsqrts_4s:
; CHECK: frsqrts.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp2 = load <4 x float>, <4 x float>* %B
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frsqrts.v4f32(<4 x float> %tmp1, <4 x float> %tmp2)
  ret <4 x float> %tmp3
}

; Loads two <2 x double> operands from %A and %B and passes them to
; @llvm.aarch64.neon.frsqrts.v2f64; the generated code is expected to
; contain an frsqrts.2d instruction.
define <2 x double> @frsqrts_2d(<2 x double>* %A, <2 x double>* %B) nounwind {
; CHECK-LABEL: frsqrts_2d:
; CHECK: frsqrts.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp2 = load <2 x double>, <2 x double>* %B
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frsqrts.v2f64(<2 x double> %tmp1, <2 x double> %tmp2)
  ret <2 x double> %tmp3
}

; Declarations of the two-operand vector frsqrts intrinsics called by the
; frsqrts_2s, frsqrts_4s and frsqrts_2d tests.
declare <2 x float> @llvm.aarch64.neon.frsqrts.v2f32(<2 x float>, <2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frsqrts.v4f32(<4 x float>, <4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frsqrts.v2f64(<2 x double>, <2 x double>) nounwind readnone

; Loads a <2 x float> from %A and passes it to
; @llvm.aarch64.neon.frecpe.v2f32; the generated code is expected to
; contain an frecpe.2s instruction.
define <2 x float> @frecpe_2s(<2 x float>* %A) nounwind {
; CHECK-LABEL: frecpe_2s:
; CHECK: frecpe.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frecpe.v2f32(<2 x float> %tmp1)
  ret <2 x float> %tmp3
}

; Loads a <4 x float> from %A and passes it to
; @llvm.aarch64.neon.frecpe.v4f32; the generated code is expected to
; contain an frecpe.4s instruction.
define <4 x float> @frecpe_4s(<4 x float>* %A) nounwind {
; CHECK-LABEL: frecpe_4s:
; CHECK: frecpe.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frecpe.v4f32(<4 x float> %tmp1)
  ret <4 x float> %tmp3
}

; Loads a <2 x double> from %A and passes it to
; @llvm.aarch64.neon.frecpe.v2f64; the generated code is expected to
; contain an frecpe.2d instruction.
define <2 x double> @frecpe_2d(<2 x double>* %A) nounwind {
; CHECK-LABEL: frecpe_2d:
; CHECK: frecpe.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frecpe.v2f64(<2 x double> %tmp1)
  ret <2 x double> %tmp3
}

; Scalar float variant: loads a float from %A and passes it to
; @llvm.aarch64.neon.frecpe.f32. The expected instruction is frecpe with
; destination s0 and any s-register as its source.
define float @frecpe_s(float* %A) nounwind {
; CHECK-LABEL: frecpe_s:
; CHECK: frecpe s0, {{s[0-9]+}}
  %tmp1 = load float, float* %A
  %tmp3 = call float @llvm.aarch64.neon.frecpe.f32(float %tmp1)
  ret float %tmp3
}

; Scalar double variant: loads a double from %A and passes it to
; @llvm.aarch64.neon.frecpe.f64. The expected instruction is frecpe with
; destination d0 and any d-register as its source.
define double @frecpe_d(double* %A) nounwind {
; CHECK-LABEL: frecpe_d:
; CHECK: frecpe d0, {{d[0-9]+}}
  %tmp1 = load double, double* %A
  %tmp3 = call double @llvm.aarch64.neon.frecpe.f64(double %tmp1)
  ret double %tmp3
}

; Declarations of the one-operand frecpe intrinsics (vector and scalar)
; called by the frecpe_* tests.
declare <2 x float> @llvm.aarch64.neon.frecpe.v2f32(<2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frecpe.v4f32(<4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frecpe.v2f64(<2 x double>) nounwind readnone
declare float @llvm.aarch64.neon.frecpe.f32(float) nounwind readnone
declare double @llvm.aarch64.neon.frecpe.f64(double) nounwind readnone

; Scalar float variant: loads a float from %A and passes it to
; @llvm.aarch64.neon.frecpx.f32. The expected instruction is frecpx with
; destination s0 and any s-register as its source.
define float @frecpx_s(float* %A) nounwind {
; CHECK-LABEL: frecpx_s:
; CHECK: frecpx s0, {{s[0-9]+}}
  %tmp1 = load float, float* %A
  %tmp3 = call float @llvm.aarch64.neon.frecpx.f32(float %tmp1)
  ret float %tmp3
}

; Scalar double variant: loads a double from %A and passes it to
; @llvm.aarch64.neon.frecpx.f64. The expected instruction is frecpx with
; destination d0 and any d-register as its source.
define double @frecpx_d(double* %A) nounwind {
; CHECK-LABEL: frecpx_d:
; CHECK: frecpx d0, {{d[0-9]+}}
  %tmp1 = load double, double* %A
  %tmp3 = call double @llvm.aarch64.neon.frecpx.f64(double %tmp1)
  ret double %tmp3
}

; Declarations of the scalar frecpx intrinsics called by frecpx_s and
; frecpx_d.
declare float @llvm.aarch64.neon.frecpx.f32(float) nounwind readnone
declare double @llvm.aarch64.neon.frecpx.f64(double) nounwind readnone

; Loads a <2 x float> from %A and passes it to
; @llvm.aarch64.neon.frsqrte.v2f32; the generated code is expected to
; contain an frsqrte.2s instruction.
define <2 x float> @frsqrte_2s(<2 x float>* %A) nounwind {
; CHECK-LABEL: frsqrte_2s:
; CHECK: frsqrte.2s
  %tmp1 = load <2 x float>, <2 x float>* %A
  %tmp3 = call <2 x float> @llvm.aarch64.neon.frsqrte.v2f32(<2 x float> %tmp1)
  ret <2 x float> %tmp3
}

; Loads a <4 x float> from %A and passes it to
; @llvm.aarch64.neon.frsqrte.v4f32; the generated code is expected to
; contain an frsqrte.4s instruction.
define <4 x float> @frsqrte_4s(<4 x float>* %A) nounwind {
; CHECK-LABEL: frsqrte_4s:
; CHECK: frsqrte.4s
  %tmp1 = load <4 x float>, <4 x float>* %A
  %tmp3 = call <4 x float> @llvm.aarch64.neon.frsqrte.v4f32(<4 x float> %tmp1)
  ret <4 x float> %tmp3
}

; Loads a <2 x double> from %A and passes it to
; @llvm.aarch64.neon.frsqrte.v2f64; the generated code is expected to
; contain an frsqrte.2d instruction.
define <2 x double> @frsqrte_2d(<2 x double>* %A) nounwind {
; CHECK-LABEL: frsqrte_2d:
; CHECK: frsqrte.2d
  %tmp1 = load <2 x double>, <2 x double>* %A
  %tmp3 = call <2 x double> @llvm.aarch64.neon.frsqrte.v2f64(<2 x double> %tmp1)
  ret <2 x double> %tmp3
}

; Scalar float variant: loads a float from %A and passes it to
; @llvm.aarch64.neon.frsqrte.f32. The expected instruction is frsqrte with
; destination s0 and any s-register as its source.
define float @frsqrte_s(float* %A) nounwind {
; CHECK-LABEL: frsqrte_s:
; CHECK: frsqrte s0, {{s[0-9]+}}
  %tmp1 = load float, float* %A
  %tmp3 = call float @llvm.aarch64.neon.frsqrte.f32(float %tmp1)
  ret float %tmp3
}

; Scalar double variant: loads a double from %A and passes it to
; @llvm.aarch64.neon.frsqrte.f64. The expected instruction is frsqrte with
; destination d0 and any d-register as its source.
define double @frsqrte_d(double* %A) nounwind {
; CHECK-LABEL: frsqrte_d:
; CHECK: frsqrte d0, {{d[0-9]+}}
  %tmp1 = load double, double* %A
  %tmp3 = call double @llvm.aarch64.neon.frsqrte.f64(double %tmp1)
  ret double %tmp3
}

; Declarations of the one-operand frsqrte intrinsics (vector and scalar)
; called by the frsqrte_* tests.
declare <2 x float> @llvm.aarch64.neon.frsqrte.v2f32(<2 x float>) nounwind readnone
declare <4 x float> @llvm.aarch64.neon.frsqrte.v4f32(<4 x float>) nounwind readnone
declare <2 x double> @llvm.aarch64.neon.frsqrte.v2f64(<2 x double>) nounwind readnone
declare float @llvm.aarch64.neon.frsqrte.f32(float) nounwind readnone
declare double @llvm.aarch64.neon.frsqrte.f64(double) nounwind readnone

; Integer variant: loads a <2 x i32> from %A and passes it to
; @llvm.aarch64.neon.urecpe.v2i32; the generated code is expected to
; contain a urecpe.2s instruction.
define <2 x i32> @urecpe_2s(<2 x i32>* %A) nounwind {
; CHECK-LABEL: urecpe_2s:
; CHECK: urecpe.2s
  %tmp1 = load <2 x i32>, <2 x i32>* %A
  %tmp3 = call <2 x i32> @llvm.aarch64.neon.urecpe.v2i32(<2 x i32> %tmp1)
  ret <2 x i32> %tmp3
}

; Integer variant: loads a <4 x i32> from %A and passes it to
; @llvm.aarch64.neon.urecpe.v4i32; the generated code is expected to
; contain a urecpe.4s instruction.
define <4 x i32> @urecpe_4s(<4 x i32>* %A) nounwind {
; CHECK-LABEL: urecpe_4s:
; CHECK: urecpe.4s
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp3 = call <4 x i32> @llvm.aarch64.neon.urecpe.v4i32(<4 x i32> %tmp1)
  ret <4 x i32> %tmp3
}

; Declarations of the urecpe intrinsics called by urecpe_2s and urecpe_4s.
declare <2 x i32> @llvm.aarch64.neon.urecpe.v2i32(<2 x i32>) nounwind readnone
declare <4 x i32> @llvm.aarch64.neon.urecpe.v4i32(<4 x i32>) nounwind readnone

; Integer variant: loads a <2 x i32> from %A and passes it to
; @llvm.aarch64.neon.ursqrte.v2i32; the generated code is expected to
; contain a ursqrte.2s instruction.
define <2 x i32> @ursqrte_2s(<2 x i32>* %A) nounwind {
; CHECK-LABEL: ursqrte_2s:
; CHECK: ursqrte.2s
  %tmp1 = load <2 x i32>, <2 x i32>* %A
  %tmp3 = call <2 x i32> @llvm.aarch64.neon.ursqrte.v2i32(<2 x i32> %tmp1)
  ret <2 x i32> %tmp3
}

; Integer variant: loads a <4 x i32> from %A and passes it to
; @llvm.aarch64.neon.ursqrte.v4i32; the generated code is expected to
; contain a ursqrte.4s instruction.
define <4 x i32> @ursqrte_4s(<4 x i32>* %A) nounwind {
; CHECK-LABEL: ursqrte_4s:
; CHECK: ursqrte.4s
  %tmp1 = load <4 x i32>, <4 x i32>* %A
  %tmp3 = call <4 x i32> @llvm.aarch64.neon.ursqrte.v4i32(<4 x i32> %tmp1)
  ret <4 x i32> %tmp3
}

; Declarations of the ursqrte intrinsics called by ursqrte_2s and
; ursqrte_4s.
declare <2 x i32> @llvm.aarch64.neon.ursqrte.v2i32(<2 x i32>) nounwind readnone
declare <4 x i32> @llvm.aarch64.neon.ursqrte.v4i32(<4 x i32>) nounwind readnone

; Scalar float frsqrts taking its operands directly as arguments (no
; loads). The intrinsic call is expected to become a single
; "frsqrts s0, s0, s1" with the function's ret on the very next line.
define float @f1(float %a, float %b) nounwind readnone optsize ssp {
; CHECK-LABEL: f1:
; CHECK: frsqrts s0, s0, s1
; CHECK-NEXT: ret
  %vrsqrtss.i = tail call float @llvm.aarch64.neon.frsqrts.f32(float %a, float %b) nounwind
  ret float %vrsqrtss.i
}

; Scalar double frsqrts taking its operands directly as arguments (no
; loads). The intrinsic call is expected to become a single
; "frsqrts d0, d0, d1" with the function's ret on the very next line.
define double @f2(double %a, double %b) nounwind readnone optsize ssp {
; CHECK-LABEL: f2:
; CHECK: frsqrts d0, d0, d1
; CHECK-NEXT: ret
  %vrsqrtsd.i = tail call double @llvm.aarch64.neon.frsqrts.f64(double %a, double %b) nounwind
  ret double %vrsqrtsd.i
}

; Declarations of the scalar frsqrts intrinsics called by f1 (float) and
; f2 (double).
declare double @llvm.aarch64.neon.frsqrts.f64(double, double) nounwind readnone
declare float @llvm.aarch64.neon.frsqrts.f32(float, float) nounwind readnone