; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=fiji -verify-machineinstrs < %s | FileCheck %s

; Instruction-selection test for the llvm.amdgcn.ds.permute intrinsic.
; Each function below calls the intrinsic once and stores the result to a
; global (addrspace 1) pointer so the call cannot be dropped as dead code.

declare i32 @llvm.amdgcn.ds.permute(i32, i32) #0

; Basic case: the intrinsic is expected to select to ds_permute_b32 with three
; VGPR operands, followed by an s_waitcnt on lgkmcnt.
; CHECK-LABEL: {{^}}ds_permute:
; CHECK: ds_permute_b32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}}
; CHECK: s_waitcnt lgkmcnt
define void @ds_permute(i32 addrspace(1)* %out, i32 %index, i32 %src) nounwind {
  %permute = call i32 @llvm.amdgcn.ds.permute(i32 %index, i32 %src) #0
  store i32 %permute, i32 addrspace(1)* %out, align 4
  ret void
}

; Immediate-offset case: the index is computed as %base_index + 4, and the
; constant is expected to be folded into the instruction as "offset:4" instead
; of being emitted as a separate add.
; CHECK-LABEL: {{^}}ds_permute_imm_offset:
; CHECK: ds_permute_b32 v{{[0-9]+}}, v{{[0-9]+}}, v{{[0-9]+}} offset:4
; CHECK: s_waitcnt lgkmcnt
define void @ds_permute_imm_offset(i32 addrspace(1)* %out, i32 %base_index, i32 %src) nounwind {
  %index = add i32 %base_index, 4
  %permute = call i32 @llvm.amdgcn.ds.permute(i32 %index, i32 %src) #0
  store i32 %permute, i32 addrspace(1)* %out, align 4
  ret void
}

; Attribute group shared by the intrinsic declaration and both call sites.
attributes #0 = { nounwind readnone convergent }