xref: /aosp_15_r20/external/llvm/test/CodeGen/NVPTX/arithmetic-fp-sm20.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -march=nvptx -mcpu=sm_20 -fp-contract=fast | FileCheck %s
2*9880d681SAndroid Build Coastguard Worker; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 -fp-contract=fast | FileCheck %s
3*9880d681SAndroid Build Coastguard Worker
4*9880d681SAndroid Build Coastguard Worker;; These tests should run for all targets
5*9880d681SAndroid Build Coastguard Worker
6*9880d681SAndroid Build Coastguard Worker;;===-- Basic instruction selection tests ---------------------------------===;;
7*9880d681SAndroid Build Coastguard Worker
8*9880d681SAndroid Build Coastguard Worker
9*9880d681SAndroid Build Coastguard Worker;;; f64
10*9880d681SAndroid Build Coastguard Worker
11*9880d681SAndroid Build Coastguard Workerdefine double @fadd_f64(double %a, double %b) {
12*9880d681SAndroid Build Coastguard Worker; CHECK: add.f64 %fd{{[0-9]+}}, %fd{{[0-9]+}}, %fd{{[0-9]+}}
13*9880d681SAndroid Build Coastguard Worker; CHECK: ret
14*9880d681SAndroid Build Coastguard Worker  %ret = fadd double %a, %b
15*9880d681SAndroid Build Coastguard Worker  ret double %ret
16*9880d681SAndroid Build Coastguard Worker}
17*9880d681SAndroid Build Coastguard Worker
18*9880d681SAndroid Build Coastguard Workerdefine double @fsub_f64(double %a, double %b) {
19*9880d681SAndroid Build Coastguard Worker; CHECK: sub.f64 %fd{{[0-9]+}}, %fd{{[0-9]+}}, %fd{{[0-9]+}}
20*9880d681SAndroid Build Coastguard Worker; CHECK: ret
21*9880d681SAndroid Build Coastguard Worker  %ret = fsub double %a, %b
22*9880d681SAndroid Build Coastguard Worker  ret double %ret
23*9880d681SAndroid Build Coastguard Worker}
24*9880d681SAndroid Build Coastguard Worker
25*9880d681SAndroid Build Coastguard Workerdefine double @fmul_f64(double %a, double %b) {
26*9880d681SAndroid Build Coastguard Worker; CHECK: mul.f64 %fd{{[0-9]+}}, %fd{{[0-9]+}}, %fd{{[0-9]+}}
27*9880d681SAndroid Build Coastguard Worker; CHECK: ret
28*9880d681SAndroid Build Coastguard Worker  %ret = fmul double %a, %b
29*9880d681SAndroid Build Coastguard Worker  ret double %ret
30*9880d681SAndroid Build Coastguard Worker}
31*9880d681SAndroid Build Coastguard Worker
32*9880d681SAndroid Build Coastguard Workerdefine double @fdiv_f64(double %a, double %b) {
33*9880d681SAndroid Build Coastguard Worker; CHECK: div.rn.f64 %fd{{[0-9]+}}, %fd{{[0-9]+}}, %fd{{[0-9]+}}
34*9880d681SAndroid Build Coastguard Worker; CHECK: ret
35*9880d681SAndroid Build Coastguard Worker  %ret = fdiv double %a, %b
36*9880d681SAndroid Build Coastguard Worker  ret double %ret
37*9880d681SAndroid Build Coastguard Worker}
38*9880d681SAndroid Build Coastguard Worker
39*9880d681SAndroid Build Coastguard Worker;; PTX does not have a floating-point rem instruction
40*9880d681SAndroid Build Coastguard Worker
41*9880d681SAndroid Build Coastguard Worker
42*9880d681SAndroid Build Coastguard Worker;;; f32
43*9880d681SAndroid Build Coastguard Worker
44*9880d681SAndroid Build Coastguard Workerdefine float @fadd_f32(float %a, float %b) {
45*9880d681SAndroid Build Coastguard Worker; CHECK: add.f32 %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}}
46*9880d681SAndroid Build Coastguard Worker; CHECK: ret
47*9880d681SAndroid Build Coastguard Worker  %ret = fadd float %a, %b
48*9880d681SAndroid Build Coastguard Worker  ret float %ret
49*9880d681SAndroid Build Coastguard Worker}
50*9880d681SAndroid Build Coastguard Worker
51*9880d681SAndroid Build Coastguard Workerdefine float @fsub_f32(float %a, float %b) {
52*9880d681SAndroid Build Coastguard Worker; CHECK: sub.f32 %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}}
53*9880d681SAndroid Build Coastguard Worker; CHECK: ret
54*9880d681SAndroid Build Coastguard Worker  %ret = fsub float %a, %b
55*9880d681SAndroid Build Coastguard Worker  ret float %ret
56*9880d681SAndroid Build Coastguard Worker}
57*9880d681SAndroid Build Coastguard Worker
58*9880d681SAndroid Build Coastguard Workerdefine float @fmul_f32(float %a, float %b) {
59*9880d681SAndroid Build Coastguard Worker; CHECK: mul.f32 %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}}
60*9880d681SAndroid Build Coastguard Worker; CHECK: ret
61*9880d681SAndroid Build Coastguard Worker  %ret = fmul float %a, %b
62*9880d681SAndroid Build Coastguard Worker  ret float %ret
63*9880d681SAndroid Build Coastguard Worker}
64*9880d681SAndroid Build Coastguard Worker
65*9880d681SAndroid Build Coastguard Workerdefine float @fdiv_f32(float %a, float %b) {
66*9880d681SAndroid Build Coastguard Worker; CHECK: div.rn.f32 %f{{[0-9]+}}, %f{{[0-9]+}}, %f{{[0-9]+}}
67*9880d681SAndroid Build Coastguard Worker; CHECK: ret
68*9880d681SAndroid Build Coastguard Worker  %ret = fdiv float %a, %b
69*9880d681SAndroid Build Coastguard Worker  ret float %ret
70*9880d681SAndroid Build Coastguard Worker}
71*9880d681SAndroid Build Coastguard Worker
72*9880d681SAndroid Build Coastguard Worker;; PTX does not have a floating-point rem instruction
73