; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s

; Codegen test for amdgcn: each kernel below combines a multiply with a
; subtract (or add) and the check lines pin which mad/mac form, and which
; neg/abs source modifiers, are expected in the llc output.
;
; The operands are read with volatile loads; presumably this keeps the three
; loads in program order so the REGA/REGB/REGC captures bind to a, b and c
; respectively (confirm before relaxing the loads).

declare i32 @llvm.amdgcn.workitem.id.x() #0
declare float @llvm.fabs.f32(float) #0

; a * b - c: expected as a single v_mad_f32 with the addend negated.
; FUNC-LABEL: {{^}}mad_sub_f32:
; SI: buffer_load_dword [[REGA:v[0-9]+]]
; SI: buffer_load_dword [[REGB:v[0-9]+]]
; SI: buffer_load_dword [[REGC:v[0-9]+]]
; SI: v_mad_f32 [[RESULT:v[0-9]+]], [[REGA]], [[REGB]], -[[REGC]]
; SI: buffer_store_dword [[RESULT]]
define void @mad_sub_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
  %a = load volatile float, float addrspace(1)* %gep0, align 4
  %b = load volatile float, float addrspace(1)* %gep1, align 4
  %c = load volatile float, float addrspace(1)* %gep2, align 4
  %mul = fmul float %a, %b
  %sub = fsub float %mul, %c
  store float %sub, float addrspace(1)* %outgep, align 4
  ret void
}

; c - a * b: expected as a single v_mad_f32 with the first multiplicand negated.
; FUNC-LABEL: {{^}}mad_sub_inv_f32:
; SI: buffer_load_dword [[REGA:v[0-9]+]]
; SI: buffer_load_dword [[REGB:v[0-9]+]]
; SI: buffer_load_dword [[REGC:v[0-9]+]]
; SI: v_mad_f32 [[RESULT:v[0-9]+]], -[[REGA]], [[REGB]], [[REGC]]
; SI: buffer_store_dword [[RESULT]]
define void @mad_sub_inv_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
  %a = load volatile float, float addrspace(1)* %gep0, align 4
  %b = load volatile float, float addrspace(1)* %gep1, align 4
  %c = load volatile float, float addrspace(1)* %gep2, align 4
  %mul = fmul float %a, %b
  %sub = fsub float %c, %mul
  store float %sub, float addrspace(1)* %outgep, align 4
  ret void
}

; Double-precision a * b - c: the checks expect a separate v_mul_f64 followed
; by a v_add_f64 rather than a fused mad.
; FUNC-LABEL: {{^}}mad_sub_f64:
; SI: v_mul_f64
; SI: v_add_f64
define void @mad_sub_f64(double addrspace(1)* noalias nocapture %out, double addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr double, double addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr double, double addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr double, double addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr double, double addrspace(1)* %out, i64 %tid.ext
  %a = load volatile double, double addrspace(1)* %gep0, align 8
  %b = load volatile double, double addrspace(1)* %gep1, align 8
  %c = load volatile double, double addrspace(1)* %gep2, align 8
  %mul = fmul double %a, %b
  %sub = fsub double %mul, %c
  store double %sub, double addrspace(1)* %outgep, align 8
  ret void
}

; a * b - |c|: expected as v_mad_f32 with both neg and abs applied to the addend.
; FUNC-LABEL: {{^}}mad_sub_fabs_f32:
; SI: buffer_load_dword [[REGA:v[0-9]+]]
; SI: buffer_load_dword [[REGB:v[0-9]+]]
; SI: buffer_load_dword [[REGC:v[0-9]+]]
; SI: v_mad_f32 [[RESULT:v[0-9]+]], [[REGA]], [[REGB]], -|[[REGC]]|
; SI: buffer_store_dword [[RESULT]]
define void @mad_sub_fabs_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
  %a = load volatile float, float addrspace(1)* %gep0, align 4
  %b = load volatile float, float addrspace(1)* %gep1, align 4
  %c = load volatile float, float addrspace(1)* %gep2, align 4
  %c.abs = call float @llvm.fabs.f32(float %c) #0
  %mul = fmul float %a, %b
  %sub = fsub float %mul, %c.abs
  store float %sub, float addrspace(1)* %outgep, align 4
  ret void
}

; |c| - a * b: expected as v_mad_f32 with a negated first multiplicand and an
; abs modifier on the addend.
; FUNC-LABEL: {{^}}mad_sub_fabs_inv_f32:
; SI: buffer_load_dword [[REGA:v[0-9]+]]
; SI: buffer_load_dword [[REGB:v[0-9]+]]
; SI: buffer_load_dword [[REGC:v[0-9]+]]
; SI: v_mad_f32 [[RESULT:v[0-9]+]], -[[REGA]], [[REGB]], |[[REGC]]|
; SI: buffer_store_dword [[RESULT]]
define void @mad_sub_fabs_inv_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
  %a = load volatile float, float addrspace(1)* %gep0, align 4
  %b = load volatile float, float addrspace(1)* %gep1, align 4
  %c = load volatile float, float addrspace(1)* %gep2, align 4
  %c.abs = call float @llvm.fabs.f32(float %c) #0
  %mul = fmul float %a, %b
  %sub = fsub float %c.abs, %mul
  store float %sub, float addrspace(1)* %outgep, align 4
  ret void
}

; (-a) * (-b) + c: the check expects a v_mac_f32_e32 whose three operands are
; plain VGPRs. Note that %sub is produced by an fadd here, not an fsub.
; FUNC-LABEL: {{^}}neg_neg_mad_f32:
; SI: v_mac_f32_e32 {{v[0-9]+}}, {{v[0-9]+}}, {{v[0-9]+}}
define void @neg_neg_mad_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
  %a = load volatile float, float addrspace(1)* %gep0, align 4
  %b = load volatile float, float addrspace(1)* %gep1, align 4
  %c = load volatile float, float addrspace(1)* %gep2, align 4
  %nega = fsub float -0.000000e+00, %a
  %negb = fsub float -0.000000e+00, %b
  %mul = fmul float %nega, %negb
  %sub = fadd float %mul, %c
  store float %sub, float addrspace(1)* %outgep, align 4
  ret void
}

; a * |b| - c: expected as v_mad_f32 with an abs modifier on the second
; multiplicand and a negated addend.
; FUNC-LABEL: {{^}}mad_fabs_sub_f32:
; SI: buffer_load_dword [[REGA:v[0-9]+]]
; SI: buffer_load_dword [[REGB:v[0-9]+]]
; SI: buffer_load_dword [[REGC:v[0-9]+]]
; SI: v_mad_f32 [[RESULT:v[0-9]+]], [[REGA]], |[[REGB]]|, -[[REGC]]
; SI: buffer_store_dword [[RESULT]]
define void @mad_fabs_sub_f32(float addrspace(1)* noalias nocapture %out, float addrspace(1)* noalias nocapture readonly %ptr) #1 {
  %tid = tail call i32 @llvm.amdgcn.workitem.id.x() #0
  %tid.ext = sext i32 %tid to i64
  %gep0 = getelementptr float, float addrspace(1)* %ptr, i64 %tid.ext
  %add1 = add i64 %tid.ext, 1
  %gep1 = getelementptr float, float addrspace(1)* %ptr, i64 %add1
  %add2 = add i64 %tid.ext, 2
  %gep2 = getelementptr float, float addrspace(1)* %ptr, i64 %add2
  %outgep = getelementptr float, float addrspace(1)* %out, i64 %tid.ext
  %a = load volatile float, float addrspace(1)* %gep0, align 4
  %b = load volatile float, float addrspace(1)* %gep1, align 4
  %c = load volatile float, float addrspace(1)* %gep2, align 4
  %b.abs = call float @llvm.fabs.f32(float %b) #0
  %mul = fmul float %a, %b.abs
  %sub = fsub float %mul, %c
  store float %sub, float addrspace(1)* %outgep, align 4
  ret void
}

; r2 - (r1 + r1): expected as v_mac_f32_e32 accumulating -2.0 * r1 into r2.
; Note that %in is unused; both loads and the store go through %out.
; FUNC-LABEL: {{^}}fsub_c_fadd_a_a:
; SI-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
; SI-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
; SI: v_mac_f32_e32 [[R2]], -2.0, [[R1]]
; SI: buffer_store_dword [[R2]]
define void @fsub_c_fadd_a_a(float addrspace(1)* %out, float addrspace(1)* %in) {
  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid

  %r1 = load volatile float, float addrspace(1)* %gep.0
  %r2 = load volatile float, float addrspace(1)* %gep.1

  %add = fadd float %r1, %r1
  %r3 = fsub float %r2, %add

  store float %r3, float addrspace(1)* %gep.out
  ret void
}

; (r1 + r1) - r2: expected as v_mad_f32 computing 2.0 * r1 with r2 negated.
; Note that %in is unused; both loads and the store go through %out.
; FUNC-LABEL: {{^}}fsub_fadd_a_a_c:
; SI-DAG: buffer_load_dword [[R1:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64{{$}}
; SI-DAG: buffer_load_dword [[R2:v[0-9]+]], {{v\[[0-9]+:[0-9]+\]}}, {{s\[[0-9]+:[0-9]+\]}}, 0 addr64 offset:4
; SI: v_mad_f32 [[RESULT:v[0-9]+]], 2.0, [[R1]], -[[R2]]
; SI: buffer_store_dword [[RESULT]]
define void @fsub_fadd_a_a_c(float addrspace(1)* %out, float addrspace(1)* %in) {
  %tid = call i32 @llvm.amdgcn.workitem.id.x() nounwind readnone
  %gep.0 = getelementptr float, float addrspace(1)* %out, i32 %tid
  %gep.1 = getelementptr float, float addrspace(1)* %gep.0, i32 1
  %gep.out = getelementptr float, float addrspace(1)* %out, i32 %tid

  %r1 = load volatile float, float addrspace(1)* %gep.0
  %r2 = load volatile float, float addrspace(1)* %gep.1

  %add = fadd float %r1, %r1
  %r3 = fsub float %add, %r2

  store float %r3, float addrspace(1)* %gep.out
  ret void
}

attributes #0 = { nounwind readnone }
attributes #1 = { nounwind }