1*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=VI -check-prefix=VI-OPT %s 2*9880d681SAndroid Build Coastguard Worker; RUN: llc -O0 -march=amdgcn -mcpu=tonga -verify-machineinstrs -show-mc-encoding < %s | FileCheck -check-prefix=VI -check-prefix=VI-NOOPT %s 3*9880d681SAndroid Build Coastguard Worker 4*9880d681SAndroid Build Coastguard Worker; FIXME: The register allocator / scheduler should be able to avoid these hazards. 5*9880d681SAndroid Build Coastguard Worker 6*9880d681SAndroid Build Coastguard Worker; VI-LABEL: {{^}}dpp_test: 7*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_e32 v0, s{{[0-9]+}} 8*9880d681SAndroid Build Coastguard Worker; VI: s_nop 1 9*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_dpp v0, v0 quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 ; encoding: [0xfa,0x02,0x00,0x7e,0x00,0x01,0x08,0x11] 10*9880d681SAndroid Build Coastguard Workerdefine void @dpp_test(i32 addrspace(1)* %out, i32 %in) { 11*9880d681SAndroid Build Coastguard Worker %tmp0 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %in, i32 1, i32 1, i32 1, i1 1) #0 12*9880d681SAndroid Build Coastguard Worker store i32 %tmp0, i32 addrspace(1)* %out 13*9880d681SAndroid Build Coastguard Worker ret void 14*9880d681SAndroid Build Coastguard Worker} 15*9880d681SAndroid Build Coastguard Worker 16*9880d681SAndroid Build Coastguard Worker; VI-LABEL: {{^}}dpp_wait_states: 17*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_e32 [[VGPR0:v[0-9]+]], s{{[0-9]+}} 18*9880d681SAndroid Build Coastguard Worker; VI: s_nop 1 19*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_dpp [[VGPR1:v[0-9]+]], [[VGPR0]] quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 20*9880d681SAndroid Build Coastguard Worker; VI: s_nop 1 21*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_dpp v{{[0-9]+}}, [[VGPR1]] quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 22*9880d681SAndroid Build Coastguard Workerdefine void @dpp_wait_states(i32 addrspace(1)* %out, i32 %in) { 23*9880d681SAndroid Build Coastguard Worker %tmp0 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %in, i32 1, i32 1, i32 1, i1 1) #0 24*9880d681SAndroid Build Coastguard Worker %tmp1 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %tmp0, i32 1, i32 1, i32 1, i1 1) #0 25*9880d681SAndroid Build Coastguard Worker store i32 %tmp1, i32 addrspace(1)* %out 26*9880d681SAndroid Build Coastguard Worker ret void 27*9880d681SAndroid Build Coastguard Worker} 28*9880d681SAndroid Build Coastguard Worker 29*9880d681SAndroid Build Coastguard Worker; VI-LABEL: {{^}}dpp_first_in_bb: 30*9880d681SAndroid Build Coastguard Worker; VI: ; %endif 31*9880d681SAndroid Build Coastguard Worker; VI-OPT: s_mov_b32 32*9880d681SAndroid Build Coastguard Worker; VI-OPT: s_mov_b32 33*9880d681SAndroid Build Coastguard Worker; VI-NOOPT: s_nop 1 34*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_dpp [[VGPR0:v[0-9]+]], v{{[0-9]+}} quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 35*9880d681SAndroid Build Coastguard Worker; VI: s_nop 1 36*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_dpp [[VGPR1:v[0-9]+]], [[VGPR0]] quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 37*9880d681SAndroid Build Coastguard Worker; VI: s_nop 1 38*9880d681SAndroid Build Coastguard Worker; VI: v_mov_b32_dpp v{{[0-9]+}}, [[VGPR1]] quad_perm:[1,0,0,0] row_mask:0x1 bank_mask:0x1 bound_ctrl:0 39*9880d681SAndroid Build Coastguard Workerdefine void @dpp_first_in_bb(float addrspace(1)* %out, float addrspace(1)* %in, float %cond, float %a, float %b) { 40*9880d681SAndroid Build Coastguard Worker %cmp = fcmp oeq float %cond, 0.0 41*9880d681SAndroid Build Coastguard Worker br i1 %cmp, label %if, label %else 42*9880d681SAndroid Build Coastguard Worker 43*9880d681SAndroid Build Coastguard Workerif: 44*9880d681SAndroid Build Coastguard Worker %out_val = load float, float addrspace(1)* %out 45*9880d681SAndroid Build Coastguard Worker %if_val = fadd float %a, %out_val 46*9880d681SAndroid Build Coastguard Worker br label %endif 47*9880d681SAndroid Build Coastguard Worker 48*9880d681SAndroid Build Coastguard Workerelse: 49*9880d681SAndroid Build Coastguard Worker %in_val = load float, float addrspace(1)* %in 50*9880d681SAndroid Build Coastguard Worker %else_val = fadd float %b, %in_val 51*9880d681SAndroid Build Coastguard Worker br label %endif 52*9880d681SAndroid Build Coastguard Worker 53*9880d681SAndroid Build Coastguard Workerendif: 54*9880d681SAndroid Build Coastguard Worker %val = phi float [%if_val, %if], [%else_val, %else] 55*9880d681SAndroid Build Coastguard Worker %val_i32 = bitcast float %val to i32 56*9880d681SAndroid Build Coastguard Worker %tmp0 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %val_i32, i32 1, i32 1, i32 1, i1 1) #0 57*9880d681SAndroid Build Coastguard Worker %tmp1 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %tmp0, i32 1, i32 1, i32 1, i1 1) #0 58*9880d681SAndroid Build Coastguard Worker %tmp2 = call i32 @llvm.amdgcn.mov.dpp.i32(i32 %tmp1, i32 1, i32 1, i32 1, i1 1) #0 59*9880d681SAndroid Build Coastguard Worker %tmp_float = bitcast i32 %tmp2 to float 60*9880d681SAndroid Build Coastguard Worker store float %tmp_float, float addrspace(1)* %out 61*9880d681SAndroid Build Coastguard Worker ret void 62*9880d681SAndroid Build Coastguard Worker} 63*9880d681SAndroid Build Coastguard Worker 64*9880d681SAndroid Build Coastguard Workerdeclare i32 @llvm.amdgcn.mov.dpp.i32(i32, i32, i32, i32, i1) #0 65*9880d681SAndroid Build Coastguard Worker 66*9880d681SAndroid Build Coastguard Workerattributes #0 = { nounwind readnone convergent } 67