xref: /aosp_15_r20/external/llvm/test/CodeGen/AMDGPU/fmuladd.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck %s
2*9880d681SAndroid Build Coastguard Worker
3*9880d681SAndroid Build Coastguard Workerdeclare float @llvm.fmuladd.f32(float, float, float)
4*9880d681SAndroid Build Coastguard Workerdeclare double @llvm.fmuladd.f64(double, double, double)
5*9880d681SAndroid Build Coastguard Workerdeclare i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
6*9880d681SAndroid Build Coastguard Workerdeclare float @llvm.fabs.f32(float) nounwind readnone
7*9880d681SAndroid Build Coastguard Worker
8*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_f32:
9*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 {{v[0-9]+, v[0-9]+, v[0-9]+}}
10*9880d681SAndroid Build Coastguard Worker
11*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_f32(float addrspace(1)* %out, float addrspace(1)* %in1,
12*9880d681SAndroid Build Coastguard Worker                         float addrspace(1)* %in2, float addrspace(1)* %in3) {
13*9880d681SAndroid Build Coastguard Worker   %r0 = load float, float addrspace(1)* %in1
14*9880d681SAndroid Build Coastguard Worker   %r1 = load float, float addrspace(1)* %in2
15*9880d681SAndroid Build Coastguard Worker   %r2 = load float, float addrspace(1)* %in3
16*9880d681SAndroid Build Coastguard Worker   %r3 = tail call float @llvm.fmuladd.f32(float %r0, float %r1, float %r2)
17*9880d681SAndroid Build Coastguard Worker   store float %r3, float addrspace(1)* %out
18*9880d681SAndroid Build Coastguard Worker   ret void
19*9880d681SAndroid Build Coastguard Worker}
20*9880d681SAndroid Build Coastguard Worker
21*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_f64:
22*9880d681SAndroid Build Coastguard Worker; CHECK: v_fma_f64 {{v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\], v\[[0-9]+:[0-9]+\]}}
23*9880d681SAndroid Build Coastguard Worker
24*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_f64(double addrspace(1)* %out, double addrspace(1)* %in1,
25*9880d681SAndroid Build Coastguard Worker                         double addrspace(1)* %in2, double addrspace(1)* %in3) {
26*9880d681SAndroid Build Coastguard Worker   %r0 = load double, double addrspace(1)* %in1
27*9880d681SAndroid Build Coastguard Worker   %r1 = load double, double addrspace(1)* %in2
28*9880d681SAndroid Build Coastguard Worker   %r2 = load double, double addrspace(1)* %in3
29*9880d681SAndroid Build Coastguard Worker   %r3 = tail call double @llvm.fmuladd.f64(double %r0, double %r1, double %r2)
30*9880d681SAndroid Build Coastguard Worker   store double %r3, double addrspace(1)* %out
31*9880d681SAndroid Build Coastguard Worker   ret void
32*9880d681SAndroid Build Coastguard Worker}
33*9880d681SAndroid Build Coastguard Worker
34*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_2.0_a_b_f32
35*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
36*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
37*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], 2.0, [[R1]]
38*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
39*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_2.0_a_b_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
40*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
41*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
42*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
43*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
44*9880d681SAndroid Build Coastguard Worker
45*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
46*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
47*9880d681SAndroid Build Coastguard Worker
48*9880d681SAndroid Build Coastguard Worker  %r3 = tail call float @llvm.fmuladd.f32(float 2.0, float %r1, float %r2)
49*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
50*9880d681SAndroid Build Coastguard Worker  ret void
51*9880d681SAndroid Build Coastguard Worker}
52*9880d681SAndroid Build Coastguard Worker
53*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_a_2.0_b_f32
54*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
55*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
56*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], 2.0, [[R1]]
57*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
58*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_a_2.0_b_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
59*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
60*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
61*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
62*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
63*9880d681SAndroid Build Coastguard Worker
64*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
65*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
66*9880d681SAndroid Build Coastguard Worker
67*9880d681SAndroid Build Coastguard Worker  %r3 = tail call float @llvm.fmuladd.f32(float %r1, float 2.0, float %r2)
68*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
69*9880d681SAndroid Build Coastguard Worker  ret void
70*9880d681SAndroid Build Coastguard Worker}
71*9880d681SAndroid Build Coastguard Worker
72*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fadd_a_a_b_f32:
73*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
74*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
75*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], 2.0, [[R1]]
76*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
77*9880d681SAndroid Build Coastguard Workerdefine void @fadd_a_a_b_f32(float addrspace(1)* %out,
78*9880d681SAndroid Build Coastguard Worker                            float addrspace(1)* %in1,
79*9880d681SAndroid Build Coastguard Worker                            float addrspace(1)* %in2) {
80*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
81*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
82*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
83*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
84*9880d681SAndroid Build Coastguard Worker
85*9880d681SAndroid Build Coastguard Worker  %r0 = load volatile float, float addrspace(1)* %gep.0
86*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.1
87*9880d681SAndroid Build Coastguard Worker
88*9880d681SAndroid Build Coastguard Worker  %add.0 = fadd float %r0, %r0
89*9880d681SAndroid Build Coastguard Worker  %add.1 = fadd float %add.0, %r1
90*9880d681SAndroid Build Coastguard Worker  store float %add.1, float addrspace(1)* %out
91*9880d681SAndroid Build Coastguard Worker  ret void
92*9880d681SAndroid Build Coastguard Worker}
93*9880d681SAndroid Build Coastguard Worker
94*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fadd_b_a_a_f32:
95*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
96*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
97*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], 2.0, [[R1]]
98*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
99*9880d681SAndroid Build Coastguard Workerdefine void @fadd_b_a_a_f32(float addrspace(1)* %out,
100*9880d681SAndroid Build Coastguard Worker                            float addrspace(1)* %in1,
101*9880d681SAndroid Build Coastguard Worker                            float addrspace(1)* %in2) {
102*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
103*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
104*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
105*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
106*9880d681SAndroid Build Coastguard Worker
107*9880d681SAndroid Build Coastguard Worker  %r0 = load volatile float, float addrspace(1)* %gep.0
108*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.1
109*9880d681SAndroid Build Coastguard Worker
110*9880d681SAndroid Build Coastguard Worker  %add.0 = fadd float %r0, %r0
111*9880d681SAndroid Build Coastguard Worker  %add.1 = fadd float %r1, %add.0
112*9880d681SAndroid Build Coastguard Worker  store float %add.1, float addrspace(1)* %out
113*9880d681SAndroid Build Coastguard Worker  ret void
114*9880d681SAndroid Build Coastguard Worker}
115*9880d681SAndroid Build Coastguard Worker
116*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_neg_2.0_a_b_f32
117*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
118*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
119*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], -2.0, [[R1]]
120*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
121*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_neg_2.0_a_b_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
122*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
123*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
124*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
125*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
126*9880d681SAndroid Build Coastguard Worker
127*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
128*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
129*9880d681SAndroid Build Coastguard Worker
130*9880d681SAndroid Build Coastguard Worker  %r3 = tail call float @llvm.fmuladd.f32(float -2.0, float %r1, float %r2)
131*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
132*9880d681SAndroid Build Coastguard Worker  ret void
133*9880d681SAndroid Build Coastguard Worker}
134*9880d681SAndroid Build Coastguard Worker
135*9880d681SAndroid Build Coastguard Worker
136*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_neg_2.0_neg_a_b_f32
137*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
138*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
139*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], 2.0, [[R1]]
140*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
141*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_neg_2.0_neg_a_b_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
142*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
143*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
144*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
145*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
146*9880d681SAndroid Build Coastguard Worker
147*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
148*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
149*9880d681SAndroid Build Coastguard Worker
150*9880d681SAndroid Build Coastguard Worker  %r1.fneg = fsub float -0.000000e+00, %r1
151*9880d681SAndroid Build Coastguard Worker
152*9880d681SAndroid Build Coastguard Worker  %r3 = tail call float @llvm.fmuladd.f32(float -2.0, float %r1.fneg, float %r2)
153*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
154*9880d681SAndroid Build Coastguard Worker  ret void
155*9880d681SAndroid Build Coastguard Worker}
156*9880d681SAndroid Build Coastguard Worker
157*9880d681SAndroid Build Coastguard Worker
158*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_2.0_neg_a_b_f32
159*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
160*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
161*9880d681SAndroid Build Coastguard Worker; CHECK: v_mac_f32_e32 [[R2]], -2.0, [[R1]]
162*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[R2]]
163*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_2.0_neg_a_b_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
164*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
165*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
166*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
167*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
168*9880d681SAndroid Build Coastguard Worker
169*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
170*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
171*9880d681SAndroid Build Coastguard Worker
172*9880d681SAndroid Build Coastguard Worker  %r1.fneg = fsub float -0.000000e+00, %r1
173*9880d681SAndroid Build Coastguard Worker
174*9880d681SAndroid Build Coastguard Worker  %r3 = tail call float @llvm.fmuladd.f32(float 2.0, float %r1.fneg, float %r2)
175*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
176*9880d681SAndroid Build Coastguard Worker  ret void
177*9880d681SAndroid Build Coastguard Worker}
178*9880d681SAndroid Build Coastguard Worker
179*9880d681SAndroid Build Coastguard Worker
180*9880d681SAndroid Build Coastguard Worker; CHECK-LABEL: {{^}}fmuladd_2.0_a_neg_b_f32
181*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
182*9880d681SAndroid Build Coastguard Worker; CHECK-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
183*9880d681SAndroid Build Coastguard Worker; CHECK: v_mad_f32 [[RESULT:v[0-9]+]], 2.0, [[R1]], -[[R2]]
184*9880d681SAndroid Build Coastguard Worker; CHECK: buffer_store_dword [[RESULT]]
185*9880d681SAndroid Build Coastguard Workerdefine void @fmuladd_2.0_a_neg_b_f32(float addrspace(1)* %out, float addrspace(1)* %in) {
186*9880d681SAndroid Build Coastguard Worker  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
187*9880d681SAndroid Build Coastguard Worker  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
188*9880d681SAndroid Build Coastguard Worker  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
189*9880d681SAndroid Build Coastguard Worker  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid
190*9880d681SAndroid Build Coastguard Worker
191*9880d681SAndroid Build Coastguard Worker  %r1 = load volatile float, float addrspace(1)* %gep.0
192*9880d681SAndroid Build Coastguard Worker  %r2 = load volatile float, float addrspace(1)* %gep.1
193*9880d681SAndroid Build Coastguard Worker
194*9880d681SAndroid Build Coastguard Worker  %r2.fneg = fsub float -0.000000e+00, %r2
195*9880d681SAndroid Build Coastguard Worker
196*9880d681SAndroid Build Coastguard Worker  %r3 = tail call float @llvm.fmuladd.f32(float 2.0, float %r1, float %r2.fneg)
197*9880d681SAndroid Build Coastguard Worker  store float %r3, float addrspace(1)* %gep.out
198*9880d681SAndroid Build Coastguard Worker  ret void
199*9880d681SAndroid Build Coastguard Worker}
200