1*9880d681SAndroid Build Coastguard Worker;RUN: llc < %s -march=amdgcn -mcpu=verde -verify-machineinstrs | FileCheck --check-prefix=GCN %s 2*9880d681SAndroid Build Coastguard Worker;RUN: llc < %s -march=amdgcn -mcpu=kabini -verify-machineinstrs | FileCheck --check-prefix=GCN --check-prefix=16BANK %s 3*9880d681SAndroid Build Coastguard Worker;RUN: llc < %s -march=amdgcn -mcpu=stoney -verify-machineinstrs | FileCheck --check-prefix=GCN --check-prefix=16BANK %s 4*9880d681SAndroid Build Coastguard Worker;RUN: llc < %s -march=amdgcn -mcpu=tonga -verify-machineinstrs | FileCheck --check-prefix=GCN %s 5*9880d681SAndroid Build Coastguard Worker 6*9880d681SAndroid Build Coastguard Worker;GCN-LABEL: {{^}}main: 7*9880d681SAndroid Build Coastguard Worker;GCN-NOT: s_wqm 8*9880d681SAndroid Build Coastguard Worker;GCN: s_mov_b32 9*9880d681SAndroid Build Coastguard Worker;GCN-NEXT: v_interp_mov_f32 10*9880d681SAndroid Build Coastguard Worker;GCN: v_interp_p1_f32 11*9880d681SAndroid Build Coastguard Worker;GCN: v_interp_p2_f32 12*9880d681SAndroid Build Coastguard Worker 13*9880d681SAndroid Build Coastguard Workerdefine amdgpu_ps void @main(<16 x i8> addrspace(2)* inreg, <16 x i8> addrspace(2)* inreg, <32 x i8> addrspace(2)* inreg, i32 inreg, <2 x i32>) { 14*9880d681SAndroid Build Coastguard Workermain_body: 15*9880d681SAndroid Build Coastguard Worker %5 = call float @llvm.SI.fs.constant(i32 0, i32 0, i32 %3) 16*9880d681SAndroid Build Coastguard Worker %6 = call float @llvm.SI.fs.interp(i32 0, i32 0, i32 %3, <2 x i32> %4) 17*9880d681SAndroid Build Coastguard Worker %7 = call float @llvm.SI.fs.interp(i32 1, i32 0, i32 %3, <2 x i32> %4) 18*9880d681SAndroid Build Coastguard Worker call void @llvm.SI.export(i32 15, i32 1, i32 1, i32 0, i32 1, float %5, float %6, float %7, float %7) 19*9880d681SAndroid Build Coastguard Worker ret void 20*9880d681SAndroid Build Coastguard Worker} 21*9880d681SAndroid Build Coastguard Worker 22*9880d681SAndroid Build Coastguard Worker; Thest that v_interp_p1 uses different source and destination registers 23*9880d681SAndroid Build Coastguard Worker; on 16 bank LDS chips. 24*9880d681SAndroid Build Coastguard Worker 25*9880d681SAndroid Build Coastguard Worker; 16BANK-LABEL: {{^}}v_interp_p1_bank16_bug: 26*9880d681SAndroid Build Coastguard Worker; 16BANK-NOT: v_interp_p1_f32 [[DST:v[0-9]+]], [[DST]] 27*9880d681SAndroid Build Coastguard Worker 28*9880d681SAndroid Build Coastguard Workerdefine amdgpu_ps void @v_interp_p1_bank16_bug([6 x <16 x i8>] addrspace(2)* byval, [17 x <16 x i8>] addrspace(2)* byval, [17 x <4 x i32>] addrspace(2)* byval, [34 x <8 x i32>] addrspace(2)* byval, float inreg, i32 inreg, <2 x i32>, <2 x i32>, <2 x i32>, <3 x i32>, <2 x i32>, <2 x i32>, <2 x i32>, float, float, float, float, float, float, i32, float, float) { 29*9880d681SAndroid Build Coastguard Workermain_body: 30*9880d681SAndroid Build Coastguard Worker %22 = call float @llvm.SI.fs.interp(i32 0, i32 0, i32 %5, <2 x i32> %7) 31*9880d681SAndroid Build Coastguard Worker %23 = call float @llvm.SI.fs.interp(i32 1, i32 0, i32 %5, <2 x i32> %7) 32*9880d681SAndroid Build Coastguard Worker %24 = call float @llvm.SI.fs.interp(i32 2, i32 0, i32 %5, <2 x i32> %7) 33*9880d681SAndroid Build Coastguard Worker %25 = call float @fabs(float %22) 34*9880d681SAndroid Build Coastguard Worker %26 = call float @fabs(float %23) 35*9880d681SAndroid Build Coastguard Worker %27 = call float @fabs(float %24) 36*9880d681SAndroid Build Coastguard Worker %28 = call i32 @llvm.SI.packf16(float %25, float %26) 37*9880d681SAndroid Build Coastguard Worker %29 = bitcast i32 %28 to float 38*9880d681SAndroid Build Coastguard Worker %30 = call i32 @llvm.SI.packf16(float %27, float 1.000000e+00) 39*9880d681SAndroid Build Coastguard Worker %31 = bitcast i32 %30 to float 40*9880d681SAndroid Build Coastguard Worker call void @llvm.SI.export(i32 15, i32 1, i32 1, i32 0, i32 1, float %29, float %31, float %29, float %31) 41*9880d681SAndroid Build Coastguard Worker ret void 42*9880d681SAndroid Build Coastguard Worker} 43*9880d681SAndroid Build Coastguard Worker 44*9880d681SAndroid Build Coastguard Worker; Function Attrs: readnone 45*9880d681SAndroid Build Coastguard Workerdeclare float @fabs(float) #1 46*9880d681SAndroid Build Coastguard Worker 47*9880d681SAndroid Build Coastguard Worker; Function Attrs: nounwind readnone 48*9880d681SAndroid Build Coastguard Workerdeclare i32 @llvm.SI.packf16(float, float) #0 49*9880d681SAndroid Build Coastguard Worker 50*9880d681SAndroid Build Coastguard Worker; Function Attrs: nounwind readnone 51*9880d681SAndroid Build Coastguard Workerdeclare float @llvm.SI.fs.constant(i32, i32, i32) #0 52*9880d681SAndroid Build Coastguard Worker 53*9880d681SAndroid Build Coastguard Worker; Function Attrs: nounwind readnone 54*9880d681SAndroid Build Coastguard Workerdeclare float @llvm.SI.fs.interp(i32, i32, i32, <2 x i32>) #0 55*9880d681SAndroid Build Coastguard Worker 56*9880d681SAndroid Build Coastguard Workerdeclare void @llvm.SI.export(i32, i32, i32, i32, i32, float, float, float, float) 57*9880d681SAndroid Build Coastguard Worker 58*9880d681SAndroid Build Coastguard Workerattributes #0 = { nounwind readnone } 59*9880d681SAndroid Build Coastguard Workerattributes #1 = { readnone } 60