; RUN: llc < %s -march=r600 -mcpu=cayman | FileCheck %s
;
; Provenance: external/llvm/test/CodeGen/AMDGPU/pv-packing.ll
; (AOSP aosp_15_r20, revision 9880d6810fe72a1726cb53787c6711e909410d58).
;
; Purpose: compile @main for the Cayman subtarget of the r600 target and verify
; that the emitted code contains a DOT4 whose destination is the X channel of a
; T register, followed later by a MULADD_IEEE whose destination is the W channel
; of a T register. The two FileCheck patterns below must match in that order.
; NOTE(review): the literal "*" in the second pattern presumably matches the
; marker the R600 printer puts on an instruction-group boundary, and the file
; name suggests the test targets packing around the PV (previous-vector)
; registers -- confirm against the R600 backend before relying on either.

;CHECK: DOT4  T{{[0-9]\.X}}
;CHECK: MULADD_IEEE * T{{[0-9]\.W}}

; @main(%reg0, %reg1, %reg2, %reg3)
;   Inputs : four <4 x float> arguments marked inreg; %reg0 is never read.
;   Output : none (void); the result leaves through @llvm.R600.store.swizzle.
define amdgpu_vs void @main(<4 x float> inreg %reg0, <4 x float> inreg %reg1, <4 x float> inreg %reg2, <4 x float> inreg %reg3) {
main_body:
  ; Lanes 0..2 of %reg1, %reg2 and %reg3 (lane 3 of each is unused).
  %0 = extractelement <4 x float> %reg1, i32 0
  %1 = extractelement <4 x float> %reg1, i32 1
  %2 = extractelement <4 x float> %reg1, i32 2
  %3 = extractelement <4 x float> %reg2, i32 0
  %4 = extractelement <4 x float> %reg2, i32 1
  %5 = extractelement <4 x float> %reg2, i32 2
  %6 = extractelement <4 x float> %reg3, i32 0
  %7 = extractelement <4 x float> %reg3, i32 1
  %8 = extractelement <4 x float> %reg3, i32 2
  ; Two vector loads from address space 8: element 0 (null base) and element 1
  ; of a [1024 x <4 x float>] array based at null.
  ; NOTE(review): addrspace(8) is presumably an R600 constant-buffer space --
  ; confirm against the target's address-space definitions.
  %9 = load <4 x float>, <4 x float> addrspace(8)* null
  %10 = load <4 x float>, <4 x float> addrspace(8)* getelementptr ([1024 x <4 x float>], [1024 x <4 x float>] addrspace(8)* null, i64 0, i32 1)
  ; First dot4: the loaded vector %9 with itself.
  %11 = call float @llvm.r600.dot4(<4 x float> %9, <4 x float> %9)
  ; Per-lane multiply-then-add for lanes 0..2: reg1[i] * reg2[i] + reg3[i].
  %12 = fmul float %0, %3
  %13 = fadd float %12, %6
  %14 = fmul float %1, %4
  %15 = fadd float %14, %7
  %16 = fmul float %2, %5
  %17 = fadd float %16, %8
  ; Lane 3 depends on the first dot4 result: %11 * %11 + reg1[0].
  %18 = fmul float %11, %11
  %19 = fadd float %18, %0
  ; Assemble the four multiply-add results into one vector (lanes 0..3).
  %20 = insertelement <4 x float> undef, float %13, i32 0
  %21 = insertelement <4 x float> %20, float %15, i32 1
  %22 = insertelement <4 x float> %21, float %17, i32 2
  %23 = insertelement <4 x float> %22, float %19, i32 3
  ; Second dot4: the assembled vector against the second loaded vector %10.
  %24 = call float @llvm.r600.dot4(<4 x float> %23, <4 x float> %10)
  ; Only lane 0 of the stored vector is defined; lanes 1..3 stay undef.
  %25 = insertelement <4 x float> undef, float %24, i32 0
  call void @llvm.R600.store.swizzle(<4 x float> %25, i32 0, i32 2)
  ret void
}

; Function Attrs: readnone
declare float @llvm.r600.dot4(<4 x float>, <4 x float>) #1


; Sink for the final vector; the meaning of the two i32 operands is not
; visible in this file.
declare void @llvm.R600.store.swizzle(<4 x float>, i32, i32)

attributes #1 = { readnone }