xref: /aosp_15_r20/external/llvm/test/CodeGen/AMDGPU/mad-sub.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
2*9880d681SAndroid Build Coastguard Worker
; Intrinsics used by the tests in this file. Both declarations carry attribute
; group #0 (nounwind readnone, defined at the end of the file).
;   - llvm.amdgcn.workitem.id.x returns an i32 that every test uses as the
;     element index for its loads and its store.
;   - llvm.fabs.f32 is used by the tests that apply an absolute value to one
;     of the operands before the multiply/subtract.
3*9880d681SAndroid Build Coastguard Workerdeclare i32 @llvm.amdgcn.workitem.id.x() #0
4*9880d681SAndroid Build Coastguard Workerdeclare float @llvm.fabs.f32(float) #0
5*9880d681SAndroid Build Coastguard Worker
; mad_sub_f32: out[tid] = ptr[tid] * ptr[tid + 1] - ptr[tid + 2]  (f32)
;
; The check lines below expect three dword loads (captured as REGA, REGB and
; REGC in that order), then a single v_mad_f32 whose third source operand is
; the negated REGC, then a store of the mad result. In other words the
; fmul + fsub pair is expected to fold into one multiply-add with a neg
; source modifier on the addend.
6*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}mad_sub_f32:
7*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGA:v[0-9]+]]
8*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGB:v[0-9]+]]
9*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGC:v[0-9]+]]
10*9880d681SAndroid Build Coastguard Worker; SI: v_mad_f32 [[RESULT:v[0-9]+]], [[REGA]], [[REGB]], -[[REGC]]
11*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[RESULT]]
12*9880d681SAndroid Build Coastguard Workerdefine void @mad_sub_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
13*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
14*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive inputs and of the output element.
15*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
16*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
17*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
18*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
19*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
20*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
; NOTE(review): the loads are volatile, presumably so that they are emitted in
; source order and REGA/REGB/REGC bind to a/b/c respectively -- confirm.
21*9880d681SAndroid Build Coastguard Worker  %a = load volatile float, float addrspace(1)* %gep0, align 4
22*9880d681SAndroid Build Coastguard Worker  %b = load volatile float, float addrspace(1)* %gep1, align 4
23*9880d681SAndroid Build Coastguard Worker  %c = load volatile float, float addrspace(1)* %gep2, align 4
; Pattern under test: (a * b) - c.
24*9880d681SAndroid Build Coastguard Worker  %mul = fmul float %a, %b
25*9880d681SAndroid Build Coastguard Worker  %sub = fsub float %mul, %c
26*9880d681SAndroid Build Coastguard Worker  store float %sub, float addrspace(1)* %outgep, align 4
27*9880d681SAndroid Build Coastguard Worker  ret void
28*9880d681SAndroid Build Coastguard Worker}
29*9880d681SAndroid Build Coastguard Worker
; mad_sub_inv_f32: out[tid] = ptr[tid + 2] - ptr[tid] * ptr[tid + 1]  (f32)
;
; Same setup as a plain multiply-subtract, but with the fsub operands swapped
; (c - a*b). The check lines expect a single v_mad_f32 in which the negation
; is applied to the first multiplicand (REGA) and REGC is used unmodified as
; the addend.
30*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}mad_sub_inv_f32:
31*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGA:v[0-9]+]]
32*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGB:v[0-9]+]]
33*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGC:v[0-9]+]]
34*9880d681SAndroid Build Coastguard Worker; SI: v_mad_f32 [[RESULT:v[0-9]+]], -[[REGA]], [[REGB]], [[REGC]]
35*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[RESULT]]
36*9880d681SAndroid Build Coastguard Workerdefine void @mad_sub_inv_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
37*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
38*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive inputs and of the output element.
39*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
40*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
41*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
42*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
43*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
44*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
; NOTE(review): volatile presumably pins the load order so the REGA/REGB/REGC
; captures line up with a/b/c -- confirm.
45*9880d681SAndroid Build Coastguard Worker  %a = load volatile float, float addrspace(1)* %gep0, align 4
46*9880d681SAndroid Build Coastguard Worker  %b = load volatile float, float addrspace(1)* %gep1, align 4
47*9880d681SAndroid Build Coastguard Worker  %c = load volatile float, float addrspace(1)* %gep2, align 4
; Pattern under test: c - (a * b).
48*9880d681SAndroid Build Coastguard Worker  %mul = fmul float %a, %b
49*9880d681SAndroid Build Coastguard Worker  %sub = fsub float %c, %mul
50*9880d681SAndroid Build Coastguard Worker  store float %sub, float addrspace(1)* %outgep, align 4
51*9880d681SAndroid Build Coastguard Worker  ret void
52*9880d681SAndroid Build Coastguard Worker}
53*9880d681SAndroid Build Coastguard Worker
; mad_sub_f64: out[tid] = ptr[tid] * ptr[tid + 1] - ptr[tid + 2]  (f64)
;
; Double-precision variant of the multiply-subtract pattern. Unlike the f32
; tests, the check lines here expect two separate instructions: a v_mul_f64
; followed by a v_add_f64. The checks do not pin the operands, so how the
; subtraction is expressed on the add is not verified by this test.
54*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}mad_sub_f64:
55*9880d681SAndroid Build Coastguard Worker; SI: v_mul_f64
56*9880d681SAndroid Build Coastguard Worker; SI: v_add_f64
57*9880d681SAndroid Build Coastguard Workerdefine void @mad_sub_f64(double addrspace(1)* noalias nocapture %out, double addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
58*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
59*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive double inputs and of the output element.
60*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr double, double addrspace(1)* %ptr, i64 %tid.ext
61*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
62*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr double, double addrspace(1)* %ptr, i64 %add1
63*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
64*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr double, double addrspace(1)* %ptr, i64 %add2
65*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr double, double addrspace(1)* %out, i64 %tid.ext
66*9880d681SAndroid Build Coastguard Worker  %a = load volatile double, double addrspace(1)* %gep0, align 8
67*9880d681SAndroid Build Coastguard Worker  %b = load volatile double, double addrspace(1)* %gep1, align 8
68*9880d681SAndroid Build Coastguard Worker  %c = load volatile double, double addrspace(1)* %gep2, align 8
; Pattern under test: (a * b) - c on doubles.
69*9880d681SAndroid Build Coastguard Worker  %mul = fmul double %a, %b
70*9880d681SAndroid Build Coastguard Worker  %sub = fsub double %mul, %c
71*9880d681SAndroid Build Coastguard Worker  store double %sub, double addrspace(1)* %outgep, align 8
72*9880d681SAndroid Build Coastguard Worker  ret void
73*9880d681SAndroid Build Coastguard Worker}
74*9880d681SAndroid Build Coastguard Worker
; mad_sub_fabs_f32: out[tid] = ptr[tid] * ptr[tid + 1] - |ptr[tid + 2]|  (f32)
;
; Multiply-subtract where the subtrahend first goes through llvm.fabs.f32.
; The check lines expect a single v_mad_f32 whose third source operand carries
; both modifiers at once: negated absolute value of REGC.
75*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}mad_sub_fabs_f32:
76*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGA:v[0-9]+]]
77*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGB:v[0-9]+]]
78*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGC:v[0-9]+]]
79*9880d681SAndroid Build Coastguard Worker; SI: v_mad_f32 [[RESULT:v[0-9]+]], [[REGA]], [[REGB]], -|[[REGC]]|
80*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[RESULT]]
81*9880d681SAndroid Build Coastguard Workerdefine void @mad_sub_fabs_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
82*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
83*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive inputs and of the output element.
84*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
85*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
86*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
87*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
88*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
89*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
90*9880d681SAndroid Build Coastguard Worker  %a = load volatile float, float addrspace(1)* %gep0, align 4
91*9880d681SAndroid Build Coastguard Worker  %b = load volatile float, float addrspace(1)* %gep1, align 4
92*9880d681SAndroid Build Coastguard Worker  %c = load volatile float, float addrspace(1)* %gep2, align 4
; Pattern under test: (a * b) - fabs(c).
93*9880d681SAndroid Build Coastguard Worker  %c.abs = call float @llvm.fabs.f32(float %c) #0
94*9880d681SAndroid Build Coastguard Worker  %mul = fmul float %a, %b
95*9880d681SAndroid Build Coastguard Worker  %sub = fsub float %mul, %c.abs
96*9880d681SAndroid Build Coastguard Worker  store float %sub, float addrspace(1)* %outgep, align 4
97*9880d681SAndroid Build Coastguard Worker  ret void
98*9880d681SAndroid Build Coastguard Worker}
99*9880d681SAndroid Build Coastguard Worker
; mad_sub_fabs_inv_f32: out[tid] = |ptr[tid + 2]| - ptr[tid] * ptr[tid + 1]  (f32)
;
; Swapped-operand form of the fabs multiply-subtract: fabs(c) - a*b. The check
; lines expect a single v_mad_f32 with the negation on the first multiplicand
; (REGA) and the absolute-value modifier on the addend (REGC).
100*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}mad_sub_fabs_inv_f32:
101*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGA:v[0-9]+]]
102*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGB:v[0-9]+]]
103*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGC:v[0-9]+]]
104*9880d681SAndroid Build Coastguard Worker; SI: v_mad_f32 [[RESULT:v[0-9]+]], -[[REGA]], [[REGB]], |[[REGC]]|
105*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[RESULT]]
106*9880d681SAndroid Build Coastguard Workerdefine void @mad_sub_fabs_inv_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
107*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
108*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive inputs and of the output element.
109*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
110*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
111*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
112*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
113*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
114*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
115*9880d681SAndroid Build Coastguard Worker  %a = load volatile float, float addrspace(1)* %gep0, align 4
116*9880d681SAndroid Build Coastguard Worker  %b = load volatile float, float addrspace(1)* %gep1, align 4
117*9880d681SAndroid Build Coastguard Worker  %c = load volatile float, float addrspace(1)* %gep2, align 4
; Pattern under test: fabs(c) - (a * b).
118*9880d681SAndroid Build Coastguard Worker  %c.abs = call float @llvm.fabs.f32(float %c) #0
119*9880d681SAndroid Build Coastguard Worker  %mul = fmul float %a, %b
120*9880d681SAndroid Build Coastguard Worker  %sub = fsub float %c.abs, %mul
121*9880d681SAndroid Build Coastguard Worker  store float %sub, float addrspace(1)* %outgep, align 4
122*9880d681SAndroid Build Coastguard Worker  ret void
123*9880d681SAndroid Build Coastguard Worker}
124*9880d681SAndroid Build Coastguard Worker
; neg_neg_mad_f32: out[tid] = (-ptr[tid]) * (-ptr[tid + 1]) + ptr[tid + 2]  (f32)
;
; Both multiplicands are negated (written as fsub -0.0, x) before the multiply,
; and the product is then added to c. The check line expects a v_mac_f32_e32
; whose three operands are plain VGPRs, i.e. no neg modifier appears on any
; operand, so the two negations are expected to cancel.
125*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}neg_neg_mad_f32:
126*9880d681SAndroid Build Coastguard Worker; SI: v_mac_f32_e32 {{v[0-9]+}}, {{v[0-9]+}}, {{v[0-9]+}}
127*9880d681SAndroid Build Coastguard Workerdefine void @neg_neg_mad_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
128*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
129*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive inputs and of the output element.
130*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
131*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
132*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
133*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
134*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
135*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
136*9880d681SAndroid Build Coastguard Worker  %a = load volatile float, float addrspace(1)* %gep0, align 4
137*9880d681SAndroid Build Coastguard Worker  %b = load volatile float, float addrspace(1)* %gep1, align 4
138*9880d681SAndroid Build Coastguard Worker  %c = load volatile float, float addrspace(1)* %gep2, align 4
; Negate both multiplicands: -0.0 - x.
139*9880d681SAndroid Build Coastguard Worker  %nega = fsub float -0.000000e+00, %a
140*9880d681SAndroid Build Coastguard Worker  %negb = fsub float -0.000000e+00, %b
141*9880d681SAndroid Build Coastguard Worker  %mul = fmul float %nega, %negb
; Despite its name, %sub holds the result of an fadd here, not an fsub.
142*9880d681SAndroid Build Coastguard Worker  %sub = fadd float %mul, %c
143*9880d681SAndroid Build Coastguard Worker  store float %sub, float addrspace(1)* %outgep, align 4
144*9880d681SAndroid Build Coastguard Worker  ret void
145*9880d681SAndroid Build Coastguard Worker}
146*9880d681SAndroid Build Coastguard Worker
; mad_fabs_sub_f32: out[tid] = ptr[tid] * |ptr[tid + 1]| - ptr[tid + 2]  (f32)
;
; Multiply-subtract where the second multiplicand goes through llvm.fabs.f32.
; The check lines expect a single v_mad_f32 with the absolute-value modifier
; on the second source (REGB) and the negation on the addend (REGC).
147*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}mad_fabs_sub_f32:
148*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGA:v[0-9]+]]
149*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGB:v[0-9]+]]
150*9880d681SAndroid Build Coastguard Worker; SI: buffer_load_dword [[REGC:v[0-9]+]]
151*9880d681SAndroid Build Coastguard Worker; SI: v_mad_f32 [[RESULT:v[0-9]+]], [[REGA]], |[[REGB]]|, -[[REGC]]
152*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[RESULT]]
153*9880d681SAndroid Build Coastguard Workerdefine void @mad_fabs_sub_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
; Element index: the work-item id, sign-extended to i64 for the GEPs.
154*9880d681SAndroid Build Coastguard Worker  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
155*9880d681SAndroid Build Coastguard Worker  %tid.ext = sext i32 %tid to i64
; Addresses of the three consecutive inputs and of the output element.
156*9880d681SAndroid Build Coastguard Worker  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
157*9880d681SAndroid Build Coastguard Worker  %add1 = add i64 %tid.ext, 1
158*9880d681SAndroid Build Coastguard Worker  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
159*9880d681SAndroid Build Coastguard Worker  %add2 = add i64 %tid.ext, 2
160*9880d681SAndroid Build Coastguard Worker  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
161*9880d681SAndroid Build Coastguard Worker  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
162*9880d681SAndroid Build Coastguard Worker  %a = load volatile float, float addrspace(1)* %gep0, align 4
163*9880d681SAndroid Build Coastguard Worker  %b = load volatile float, float addrspace(1)* %gep1, align 4
164*9880d681SAndroid Build Coastguard Worker  %c = load volatile float, float addrspace(1)* %gep2, align 4
; Pattern under test: (a * fabs(b)) - c.
165*9880d681SAndroid Build Coastguard Worker  %b.abs = call float @llvm.fabs.f32(float %b) #0
166*9880d681SAndroid Build Coastguard Worker  %mul = fmul float %a, %b.abs
167*9880d681SAndroid Build Coastguard Worker  %sub = fsub float %mul, %c
168*9880d681SAndroid Build Coastguard Worker  store float %sub, float addrspace(1)* %outgep, align 4
169*9880d681SAndroid Build Coastguard Worker  ret void
170*9880d681SAndroid Build Coastguard Worker}
171*9880d681SAndroid Build Coastguard Worker
; fsub_c_fadd_a_a: out[tid] = out[tid + 1] - (out[tid] + out[tid])  (f32)
;
; The IR computes r2 - (r1 + r1). The check lines expect the two loads (R1 at
; offset 0, R2 at "offset:4"; written as DAG checks, so they may match in
; either order), followed by a v_mac_f32_e32 that accumulates -2.0 * R1 into
; R2, and finally a store of R2. That is, a + a is expected to be treated as
; 2.0 * a and folded, together with the subtraction, into one multiply-
; accumulate.
;
; Note: the %in argument is never used; both loads and the store go through
; %out.
172*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}fsub_c_fadd_a_a:
173*9880d681SAndroid Build Coastguard Worker; SI-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
174*9880d681SAndroid Build Coastguard Worker; SI-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
175*9880d681SAndroid Build Coastguard Worker; SI: v_mac_f32_e32 [[R2]], -2.0, [[R1]]
176*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[R2]]
177*9880d681SAndroid Build Coastguard Workerdefine void @fsub_c_fadd_a_a(float addrspace(1)* %out, float addrspace(1)* %in) {
178*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
; %gep.0 and %gep.out are the same address (out + tid); %gep.1 is one float
; past it.
179*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
180*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
181*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
182*9880d681SAndroid Build Coastguard Worker
183*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
184*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
185*9880d681SAndroid Build Coastguard Worker
; Pattern under test: r2 - (r1 + r1).
186*9880d681SAndroid Build Coastguard Worker  %add = fadd float %r1, %r1
187*9880d681SAndroid Build Coastguard Worker  %r3 = fsub float %r2, %add
188*9880d681SAndroid Build Coastguard Worker
189*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
190*9880d681SAndroid Build Coastguard Worker  ret void
191*9880d681SAndroid Build Coastguard Worker}
192*9880d681SAndroid Build Coastguard Worker
; fsub_fadd_a_a_c: out[tid] = (out[tid] + out[tid]) - out[tid + 1]  (f32)
;
; The IR computes (r1 + r1) - r2. The check lines expect the two loads (R1 at
; offset 0, R2 at "offset:4"; written as DAG checks, so they may match in
; either order), followed by a single v_mad_f32 computing 2.0 * R1 with the
; negated R2 as addend, and a store of that result.
;
; Note: the %in argument is never used; both loads and the store go through
; %out.
193*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}fsub_fadd_a_a_c:
194*9880d681SAndroid Build Coastguard Worker; SI-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
195*9880d681SAndroid Build Coastguard Worker; SI-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
196*9880d681SAndroid Build Coastguard Worker; SI: v_mad_f32 [[RESULT:v[0-9]+]], 2.0, [[R1]], -[[R2]]
197*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[RESULT]]
198*9880d681SAndroid Build Coastguard Workerdefine void @fsub_fadd_a_a_c(float addrspace(1)* %out, float addrspace(1)* %in) {
199*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
; %gep.0 and %gep.out are the same address (out + tid); %gep.1 is one float
; past it.
200*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
201*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
202*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
203*9880d681SAndroid Build Coastguard Worker
204*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
205*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
206*9880d681SAndroid Build Coastguard Worker
; Pattern under test: (r1 + r1) - r2.
207*9880d681SAndroid Build Coastguard Worker  %add = fadd float %r1, %r1
208*9880d681SAndroid Build Coastguard Worker  %r3 = fsub float %add, %r2
209*9880d681SAndroid Build Coastguard Worker
210*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
211*9880d681SAndroid Build Coastguard Worker  ret void
212*9880d681SAndroid Build Coastguard Worker}
213*9880d681SAndroid Build Coastguard Worker
; Attribute groups referenced above.
;   #0 is attached to the intrinsic declarations and to their call sites in
;      the mad_* / neg_neg_* tests.
;   #1 is attached to the mad_* / neg_neg_* function definitions. The two
;      fsub_* functions reference no attribute group; their intrinsic calls
;      spell out nounwind readnone inline instead.
214*9880d681SAndroid Build Coastguard Workerattributes #0 = { nounwind readnone }
215*9880d681SAndroid Build Coastguard Workerattributes #1 = { nounwind }
216