xref: /aosp_15_r20/external/llvm/test/CodeGen/AMDGPU/store.ll (revision 9880d6810fe72a1726cb53787c6711e909410d58)
1*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=amdgcn -mcpu=verde -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
2*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
3*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
4*9880d681SAndroid Build Coastguard Worker; RUN: llc -march=r600 -mcpu=cayman < %s | FileCheck -check-prefix=CM -check-prefix=FUNC %s
5*9880d681SAndroid Build Coastguard Worker
6*9880d681SAndroid Build Coastguard Worker;===------------------------------------------------------------------------===;
7*9880d681SAndroid Build Coastguard Worker; Global Address Space
8*9880d681SAndroid Build Coastguard Worker;===------------------------------------------------------------------------===;
9*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i1:
10*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT MSKOR
11*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_byte
; Global address space, i1: writes the constant `true` through %out, a pointer
; in addrspace(1). The checks above expect buffer_store_byte on the amdgcn
; runs and a MEM_RAT MSKOR on the redwood run.
12*9880d681SAndroid Build Coastguard Workerdefine void @store_i1(i1 addrspace(1)* %out) {
13*9880d681SAndroid Build Coastguard Workerentry:
14*9880d681SAndroid Build Coastguard Worker  store i1 true, i1 addrspace(1)* %out
15*9880d681SAndroid Build Coastguard Worker  ret void
16*9880d681SAndroid Build Coastguard Worker}
17*9880d681SAndroid Build Coastguard Worker
18*9880d681SAndroid Build Coastguard Worker; i8 store
19*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i8:
20*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT MSKOR T[[RW_GPR:[0-9]]].XW, T{{[0-9]}}.X
21*9880d681SAndroid Build Coastguard Worker
22*9880d681SAndroid Build Coastguard Worker; IG 0: Get the byte index and truncate the value
23*9880d681SAndroid Build Coastguard Worker; EG: AND_INT * T{{[0-9]}}.[[BI_CHAN:[XYZW]]], KC0[2].Y, literal.x
24*9880d681SAndroid Build Coastguard Worker; EG: LSHL T{{[0-9]}}.[[SHIFT_CHAN:[XYZW]]], PV.[[BI_CHAN]], literal.x
25*9880d681SAndroid Build Coastguard Worker; EG: AND_INT * T{{[0-9]}}.[[TRUNC_CHAN:[XYZW]]], KC0[2].Z, literal.y
26*9880d681SAndroid Build Coastguard Worker; EG-NEXT: 3(4.203895e-45), 255(3.573311e-43)
27*9880d681SAndroid Build Coastguard Worker
28*9880d681SAndroid Build Coastguard Worker
29*9880d681SAndroid Build Coastguard Worker; IG 1: Truncate the calculated shift amount for the mask
30*9880d681SAndroid Build Coastguard Worker
31*9880d681SAndroid Build Coastguard Worker; IG 2: Shift the value and the mask
32*9880d681SAndroid Build Coastguard Worker; EG: LSHL T[[RW_GPR]].X, PS, PV.[[SHIFT_CHAN]]
33*9880d681SAndroid Build Coastguard Worker; EG: LSHL * T[[RW_GPR]].W, literal.x, PV.[[SHIFT_CHAN]]
34*9880d681SAndroid Build Coastguard Worker; EG-NEXT: 255
35*9880d681SAndroid Build Coastguard Worker; IG 3: Initialize the Y and Z channels to zero
36*9880d681SAndroid Build Coastguard Worker;       XXX: An optimal scheduler should merge this into one of the previous IGs.
37*9880d681SAndroid Build Coastguard Worker; EG: MOV T[[RW_GPR]].Y, 0.0
38*9880d681SAndroid Build Coastguard Worker; EG: MOV * T[[RW_GPR]].Z, 0.0
39*9880d681SAndroid Build Coastguard Worker
40*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_byte
41*9880d681SAndroid Build Coastguard Worker
; Global address space, i8: stores the argument %in unchanged through the
; addrspace(1) pointer %out. The redwood checks above pin the whole sequence
; (AND_INT / LSHL / MOV feeding a MEM_RAT MSKOR); the amdgcn checks expect a
; single buffer_store_byte.
42*9880d681SAndroid Build Coastguard Workerdefine void @store_i8(i8 addrspace(1)* %out, i8 %in) {
43*9880d681SAndroid Build Coastguard Workerentry:
44*9880d681SAndroid Build Coastguard Worker  store i8 %in, i8 addrspace(1)* %out
45*9880d681SAndroid Build Coastguard Worker  ret void
46*9880d681SAndroid Build Coastguard Worker}
47*9880d681SAndroid Build Coastguard Worker
48*9880d681SAndroid Build Coastguard Worker; i16 store
49*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i16:
50*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT MSKOR T[[RW_GPR:[0-9]]].XW, T{{[0-9]}}.X
51*9880d681SAndroid Build Coastguard Worker
52*9880d681SAndroid Build Coastguard Worker; IG 0: Get the byte index and truncate the value
53*9880d681SAndroid Build Coastguard Worker
54*9880d681SAndroid Build Coastguard Worker
55*9880d681SAndroid Build Coastguard Worker; EG: AND_INT * T{{[0-9]}}.[[BI_CHAN:[XYZW]]], KC0[2].Y, literal.x
56*9880d681SAndroid Build Coastguard Worker; EG-NEXT: 3(4.203895e-45),
57*9880d681SAndroid Build Coastguard Worker
58*9880d681SAndroid Build Coastguard Worker; EG: LSHL T{{[0-9]}}.[[SHIFT_CHAN:[XYZW]]], PV.[[BI_CHAN]], literal.x
59*9880d681SAndroid Build Coastguard Worker; EG: AND_INT * T{{[0-9]}}.[[TRUNC_CHAN:[XYZW]]], KC0[2].Z, literal.y
60*9880d681SAndroid Build Coastguard Worker
61*9880d681SAndroid Build Coastguard Worker; EG-NEXT: 3(4.203895e-45), 65535(9.183409e-41)
62*9880d681SAndroid Build Coastguard Worker; IG 1: Truncate the calculated shift amount for the mask
63*9880d681SAndroid Build Coastguard Worker
64*9880d681SAndroid Build Coastguard Worker; IG 2: Shift the value and the mask
65*9880d681SAndroid Build Coastguard Worker; EG: LSHL T[[RW_GPR]].X, PS, PV.[[SHIFT_CHAN]]
66*9880d681SAndroid Build Coastguard Worker; EG: LSHL * T[[RW_GPR]].W, literal.x, PV.[[SHIFT_CHAN]]
67*9880d681SAndroid Build Coastguard Worker; EG-NEXT: 65535
68*9880d681SAndroid Build Coastguard Worker; IG 3: Initialize the Y and Z channels to zero
69*9880d681SAndroid Build Coastguard Worker;       XXX: An optimal scheduler should merge this into one of the previous IGs.
70*9880d681SAndroid Build Coastguard Worker; EG: MOV T[[RW_GPR]].Y, 0.0
71*9880d681SAndroid Build Coastguard Worker; EG: MOV * T[[RW_GPR]].Z, 0.0
72*9880d681SAndroid Build Coastguard Worker
73*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_short
; Global address space, i16: stores the argument %in unchanged through the
; addrspace(1) pointer %out. The redwood checks above mirror the i8 case with
; a 65535 mask literal; the amdgcn checks expect buffer_store_short.
74*9880d681SAndroid Build Coastguard Workerdefine void @store_i16(i16 addrspace(1)* %out, i16 %in) {
75*9880d681SAndroid Build Coastguard Workerentry:
76*9880d681SAndroid Build Coastguard Worker  store i16 %in, i16 addrspace(1)* %out
77*9880d681SAndroid Build Coastguard Worker  ret void
78*9880d681SAndroid Build Coastguard Worker}
79*9880d681SAndroid Build Coastguard Worker
80*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i24:
81*9880d681SAndroid Build Coastguard Worker; SI: s_lshr_b32 s{{[0-9]+}}, s{{[0-9]+}}, 16
82*9880d681SAndroid Build Coastguard Worker; SI-DAG: buffer_store_byte
83*9880d681SAndroid Build Coastguard Worker; SI-DAG: buffer_store_short
; Global address space, i24 (a non-power-of-two width): stores %in through the
; addrspace(1) pointer %out. Only the amdgcn runs have instruction checks here:
; a scalar right shift by 16, then one byte store and one short store in
; either order.
84*9880d681SAndroid Build Coastguard Workerdefine void @store_i24(i24 addrspace(1)* %out, i24 %in) {
85*9880d681SAndroid Build Coastguard Workerentry:
86*9880d681SAndroid Build Coastguard Worker  store i24 %in, i24 addrspace(1)* %out
87*9880d681SAndroid Build Coastguard Worker  ret void
88*9880d681SAndroid Build Coastguard Worker}
89*9880d681SAndroid Build Coastguard Worker
90*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i25:
91*9880d681SAndroid Build Coastguard Worker; SI: s_and_b32 [[AND:s[0-9]+]], s{{[0-9]+}}, 0x1ffffff{{$}}
92*9880d681SAndroid Build Coastguard Worker; SI: v_mov_b32_e32 [[VAND:v[0-9]+]], [[AND]]
93*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword [[VAND]]
; Global address space, i25: stores %in through the addrspace(1) pointer %out.
; The amdgcn checks above expect the value to be masked with 0x1ffffff, copied
; into a vector register and written with one buffer_store_dword. There are no
; redwood or cayman instruction checks for this function.
94*9880d681SAndroid Build Coastguard Workerdefine void @store_i25(i25 addrspace(1)* %out, i25 %in) {
95*9880d681SAndroid Build Coastguard Workerentry:
96*9880d681SAndroid Build Coastguard Worker  store i25 %in, i25 addrspace(1)* %out
97*9880d681SAndroid Build Coastguard Worker  ret void
98*9880d681SAndroid Build Coastguard Worker}
99*9880d681SAndroid Build Coastguard Worker
100*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_v2i8:
101*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT MSKOR
102*9880d681SAndroid Build Coastguard Worker; EG-NOT: MEM_RAT MSKOR
103*9880d681SAndroid Build Coastguard Worker
104*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_short
; Global address space, <2 x i8>: truncates both lanes of %in from i32 to i8
; and stores the 16-bit result through %out. The redwood checks above require
; one MEM_RAT MSKOR and forbid a second one after it; the amdgcn checks expect
; buffer_store_short.
105*9880d681SAndroid Build Coastguard Workerdefine void @store_v2i8(<2 x i8> addrspace(1)* %out, <2 x i32> %in) {
106*9880d681SAndroid Build Coastguard Workerentry:
  ; Narrow each lane so the stored vector is two bytes wide in total.
107*9880d681SAndroid Build Coastguard Worker  %0 = trunc <2 x i32> %in to <2 x i8>
108*9880d681SAndroid Build Coastguard Worker  store <2 x i8> %0, <2 x i8> addrspace(1)* %out
109*9880d681SAndroid Build Coastguard Worker  ret void
110*9880d681SAndroid Build Coastguard Worker}
111*9880d681SAndroid Build Coastguard Worker
112*9880d681SAndroid Build Coastguard Worker
113*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_v2i16:
114*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW
115*9880d681SAndroid Build Coastguard Worker
116*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD
117*9880d681SAndroid Build Coastguard Worker
118*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword
; Global address space, <2 x i16>: truncates both lanes of %in from i32 to i16
; and stores the 32-bit result through %out. The checks above expect a dword
; store on every target (STORE_RAW on redwood, STORE_DWORD on cayman,
; buffer_store_dword on amdgcn).
119*9880d681SAndroid Build Coastguard Workerdefine void @store_v2i16(<2 x i16> addrspace(1)* %out, <2 x i32> %in) {
120*9880d681SAndroid Build Coastguard Workerentry:
121*9880d681SAndroid Build Coastguard Worker  %0 = trunc <2 x i32> %in to <2 x i16>
122*9880d681SAndroid Build Coastguard Worker  store <2 x i16> %0, <2 x i16> addrspace(1)* %out
123*9880d681SAndroid Build Coastguard Worker  ret void
124*9880d681SAndroid Build Coastguard Worker}
125*9880d681SAndroid Build Coastguard Worker
126*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_v4i8:
127*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW
128*9880d681SAndroid Build Coastguard Worker
129*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD
130*9880d681SAndroid Build Coastguard Worker
131*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword
; Global address space, <4 x i8>: truncates all four lanes of %in from i32 to
; i8 and stores the 32-bit result through %out. The checks above expect the
; same dword-sized store as the <2 x i16> case on every target.
132*9880d681SAndroid Build Coastguard Workerdefine void @store_v4i8(<4 x i8> addrspace(1)* %out, <4 x i32> %in) {
133*9880d681SAndroid Build Coastguard Workerentry:
134*9880d681SAndroid Build Coastguard Worker  %0 = trunc <4 x i32> %in to <4 x i8>
135*9880d681SAndroid Build Coastguard Worker  store <4 x i8> %0, <4 x i8> addrspace(1)* %out
136*9880d681SAndroid Build Coastguard Worker  ret void
137*9880d681SAndroid Build Coastguard Worker}
138*9880d681SAndroid Build Coastguard Worker
139*9880d681SAndroid Build Coastguard Worker; floating-point store
140*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_f32:
141*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW T{{[0-9]+\.X, T[0-9]+\.X}}, 1
142*9880d681SAndroid Build Coastguard Worker
143*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD T{{[0-9]+\.X, T[0-9]+\.X}}
144*9880d681SAndroid Build Coastguard Worker
145*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dword
146*9880d681SAndroid Build Coastguard Worker
; Global address space, float: stores the argument %in unchanged through the
; addrspace(1) pointer %out. The redwood and cayman checks above additionally
; pin single-channel (.X) operands on the store instruction; the amdgcn checks
; expect buffer_store_dword.
147*9880d681SAndroid Build Coastguard Workerdefine void @store_f32(float addrspace(1)* %out, float %in) {
148*9880d681SAndroid Build Coastguard Worker  store float %in, float addrspace(1)* %out
149*9880d681SAndroid Build Coastguard Worker  ret void
150*9880d681SAndroid Build Coastguard Worker}
151*9880d681SAndroid Build Coastguard Worker
152*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_v4i16:
153*9880d681SAndroid Build Coastguard Worker; MEM_RAT_CACHELESS STORE_RAW T{{[0-9]+}}.XYZW
; NOTE(review): the line above carries no check prefix, so it is an ordinary
; comment and none of the run lines enforce it. Confirm the actual r600 output
; for this function before promoting it to a real check; the .XYZW channel
; mask has never been verified by this test.
154*9880d681SAndroid Build Coastguard Worker
155*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dwordx2
; Global address space, <4 x i16>: truncates all four lanes of %in from i32 to
; i16 and stores the 64-bit result through %out. Only the amdgcn expectation
; (buffer_store_dwordx2) is actually checked.
156*9880d681SAndroid Build Coastguard Workerdefine void @store_v4i16(<4 x i16> addrspace(1)* %out, <4 x i32> %in) {
157*9880d681SAndroid Build Coastguard Workerentry:
158*9880d681SAndroid Build Coastguard Worker  %0 = trunc <4 x i32> %in to <4 x i16>
159*9880d681SAndroid Build Coastguard Worker  store <4 x i16> %0, <4 x i16> addrspace(1)* %out
160*9880d681SAndroid Build Coastguard Worker  ret void
161*9880d681SAndroid Build Coastguard Worker}
162*9880d681SAndroid Build Coastguard Worker
163*9880d681SAndroid Build Coastguard Worker; vec2 floating-point stores
164*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_v2f32:
165*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW
166*9880d681SAndroid Build Coastguard Worker
167*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD
168*9880d681SAndroid Build Coastguard Worker
169*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dwordx2
170*9880d681SAndroid Build Coastguard Worker
; Global address space, <2 x float>: assembles a vector from the two scalar
; arguments and stores it through %out. The amdgcn checks above expect
; buffer_store_dwordx2; the redwood and cayman checks only require that a
; cacheless store appears.
171*9880d681SAndroid Build Coastguard Workerdefine void @store_v2f32(<2 x float> addrspace(1)* %out, float %a, float %b) {
172*9880d681SAndroid Build Coastguard Workerentry:
  ; Start from a zero vector, then overwrite lane 0 with %a and lane 1 with %b,
  ; so no zero lane survives into the stored value.
173*9880d681SAndroid Build Coastguard Worker  %0 = insertelement <2 x float> <float 0.0, float 0.0>, float %a, i32 0
174*9880d681SAndroid Build Coastguard Worker  %1 = insertelement <2 x float> %0, float %b, i32 1
175*9880d681SAndroid Build Coastguard Worker  store <2 x float> %1, <2 x float> addrspace(1)* %out
176*9880d681SAndroid Build Coastguard Worker  ret void
177*9880d681SAndroid Build Coastguard Worker}
178*9880d681SAndroid Build Coastguard Worker
179*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_v4i32:
180*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW
181*9880d681SAndroid Build Coastguard Worker; EG-NOT: MEM_RAT_CACHELESS STORE_RAW
182*9880d681SAndroid Build Coastguard Worker
183*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD
184*9880d681SAndroid Build Coastguard Worker; CM-NOT: MEM_RAT_CACHELESS STORE_DWORD
185*9880d681SAndroid Build Coastguard Worker
186*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dwordx4
; Global address space, <4 x i32>: stores the 128-bit argument %in unchanged
; through %out. The redwood and cayman checks above require one cacheless
; store and forbid a second one after it; the amdgcn checks expect
; buffer_store_dwordx4.
187*9880d681SAndroid Build Coastguard Workerdefine void @store_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> %in) {
188*9880d681SAndroid Build Coastguard Workerentry:
189*9880d681SAndroid Build Coastguard Worker  store <4 x i32> %in, <4 x i32> addrspace(1)* %out
190*9880d681SAndroid Build Coastguard Worker  ret void
191*9880d681SAndroid Build Coastguard Worker}
192*9880d681SAndroid Build Coastguard Worker
193*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i64_i8:
194*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT MSKOR
195*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_byte
; Global address space, truncating store: narrows the i64 argument %in to i8
; and stores that byte through %out. The checks above expect the same
; instructions as a plain i8 store (MEM_RAT MSKOR on redwood,
; buffer_store_byte on amdgcn).
196*9880d681SAndroid Build Coastguard Workerdefine void @store_i64_i8(i8 addrspace(1)* %out, i64 %in) {
197*9880d681SAndroid Build Coastguard Workerentry:
198*9880d681SAndroid Build Coastguard Worker  %0 = trunc i64 %in to i8
199*9880d681SAndroid Build Coastguard Worker  store i8 %0, i8 addrspace(1)* %out
200*9880d681SAndroid Build Coastguard Worker  ret void
201*9880d681SAndroid Build Coastguard Worker}
202*9880d681SAndroid Build Coastguard Worker
203*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_i64_i16:
204*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT MSKOR
205*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_short
; Global address space, truncating store: narrows the i64 argument %in to i16
; and stores it through %out. The checks above expect MEM_RAT MSKOR on redwood
; and buffer_store_short on amdgcn.
206*9880d681SAndroid Build Coastguard Workerdefine void @store_i64_i16(i16 addrspace(1)* %out, i64 %in) {
207*9880d681SAndroid Build Coastguard Workerentry:
208*9880d681SAndroid Build Coastguard Worker  %0 = trunc i64 %in to i16
209*9880d681SAndroid Build Coastguard Worker  store i16 %0, i16 addrspace(1)* %out
210*9880d681SAndroid Build Coastguard Worker  ret void
211*9880d681SAndroid Build Coastguard Worker}
212*9880d681SAndroid Build Coastguard Worker
213*9880d681SAndroid Build Coastguard Worker;===------------------------------------------------------------------------===;
214*9880d681SAndroid Build Coastguard Worker; Local Address Space
215*9880d681SAndroid Build Coastguard Worker;===------------------------------------------------------------------------===;
216*9880d681SAndroid Build Coastguard Worker
217*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_i1:
218*9880d681SAndroid Build Coastguard Worker; EG: LDS_BYTE_WRITE
219*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b8
; Local address space, i1: writes the constant `true` through %out, a pointer
; in addrspace(3). The checks above expect LDS_BYTE_WRITE on redwood and
; ds_write_b8 on amdgcn.
220*9880d681SAndroid Build Coastguard Workerdefine void @store_local_i1(i1 addrspace(3)* %out) {
221*9880d681SAndroid Build Coastguard Workerentry:
222*9880d681SAndroid Build Coastguard Worker  store i1 true, i1 addrspace(3)* %out
223*9880d681SAndroid Build Coastguard Worker  ret void
224*9880d681SAndroid Build Coastguard Worker}
225*9880d681SAndroid Build Coastguard Worker
226*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_i8:
227*9880d681SAndroid Build Coastguard Worker; EG: LDS_BYTE_WRITE
228*9880d681SAndroid Build Coastguard Worker
229*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b8
; Local address space, i8: stores the argument %in unchanged through the
; addrspace(3) pointer %out. The checks above expect LDS_BYTE_WRITE on redwood
; and ds_write_b8 on amdgcn.
230*9880d681SAndroid Build Coastguard Workerdefine void @store_local_i8(i8 addrspace(3)* %out, i8 %in) {
231*9880d681SAndroid Build Coastguard Worker  store i8 %in, i8 addrspace(3)* %out
232*9880d681SAndroid Build Coastguard Worker  ret void
233*9880d681SAndroid Build Coastguard Worker}
234*9880d681SAndroid Build Coastguard Worker
235*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_i16:
236*9880d681SAndroid Build Coastguard Worker; EG: LDS_SHORT_WRITE
237*9880d681SAndroid Build Coastguard Worker
238*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b16
; Local address space, i16: stores the argument %in unchanged through the
; addrspace(3) pointer %out. The checks above expect LDS_SHORT_WRITE on
; redwood and ds_write_b16 on amdgcn.
239*9880d681SAndroid Build Coastguard Workerdefine void @store_local_i16(i16 addrspace(3)* %out, i16 %in) {
240*9880d681SAndroid Build Coastguard Worker  store i16 %in, i16 addrspace(3)* %out
241*9880d681SAndroid Build Coastguard Worker  ret void
242*9880d681SAndroid Build Coastguard Worker}
243*9880d681SAndroid Build Coastguard Worker
244*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_v2i16:
245*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
246*9880d681SAndroid Build Coastguard Worker
247*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
248*9880d681SAndroid Build Coastguard Worker
249*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b32
; Local address space, <2 x i16>: stores the 32-bit vector argument %in
; unchanged through %out. The checks above expect one LDS_WRITE on redwood and
; cayman, and ds_write_b32 on amdgcn.
250*9880d681SAndroid Build Coastguard Workerdefine void @store_local_v2i16(<2 x i16> addrspace(3)* %out, <2 x i16> %in) {
251*9880d681SAndroid Build Coastguard Workerentry:
252*9880d681SAndroid Build Coastguard Worker  store <2 x i16> %in, <2 x i16> addrspace(3)* %out
253*9880d681SAndroid Build Coastguard Worker  ret void
254*9880d681SAndroid Build Coastguard Worker}
255*9880d681SAndroid Build Coastguard Worker
256*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_v4i8:
257*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
258*9880d681SAndroid Build Coastguard Worker
259*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
260*9880d681SAndroid Build Coastguard Worker
261*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b32
; Local address space, <4 x i8>: stores the 32-bit vector argument %in
; unchanged through %out. The checks above expect one LDS_WRITE on redwood and
; cayman, and ds_write_b32 on amdgcn.
262*9880d681SAndroid Build Coastguard Workerdefine void @store_local_v4i8(<4 x i8> addrspace(3)* %out, <4 x i8> %in) {
263*9880d681SAndroid Build Coastguard Workerentry:
264*9880d681SAndroid Build Coastguard Worker  store <4 x i8> %in, <4 x i8> addrspace(3)* %out
265*9880d681SAndroid Build Coastguard Worker  ret void
266*9880d681SAndroid Build Coastguard Worker}
267*9880d681SAndroid Build Coastguard Worker
268*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_v2i32:
269*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
270*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
271*9880d681SAndroid Build Coastguard Worker
272*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
273*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
274*9880d681SAndroid Build Coastguard Worker
275*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b64
; Local address space, <2 x i32>: stores the 64-bit vector argument %in
; unchanged through %out. The checks above expect two LDS_WRITE instructions
; on redwood and cayman, and a single ds_write_b64 on amdgcn.
276*9880d681SAndroid Build Coastguard Workerdefine void @store_local_v2i32(<2 x i32> addrspace(3)* %out, <2 x i32> %in) {
277*9880d681SAndroid Build Coastguard Workerentry:
278*9880d681SAndroid Build Coastguard Worker  store <2 x i32> %in, <2 x i32> addrspace(3)* %out
279*9880d681SAndroid Build Coastguard Worker  ret void
280*9880d681SAndroid Build Coastguard Worker}
281*9880d681SAndroid Build Coastguard Worker
282*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_v4i32:
283*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
284*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
285*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
286*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
287*9880d681SAndroid Build Coastguard Worker
288*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
289*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
290*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
291*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
292*9880d681SAndroid Build Coastguard Worker
293*9880d681SAndroid Build Coastguard Worker; SI: ds_write2_b64
; Local address space, <4 x i32>, no explicit alignment on the store: stores
; the 128-bit vector argument %in unchanged through %out. The checks above
; expect four LDS_WRITE instructions on redwood and cayman, and ds_write2_b64
; on amdgcn.
294*9880d681SAndroid Build Coastguard Workerdefine void @store_local_v4i32(<4 x i32> addrspace(3)* %out, <4 x i32> %in) {
295*9880d681SAndroid Build Coastguard Workerentry:
296*9880d681SAndroid Build Coastguard Worker  store <4 x i32> %in, <4 x i32> addrspace(3)* %out
297*9880d681SAndroid Build Coastguard Worker  ret void
298*9880d681SAndroid Build Coastguard Worker}
299*9880d681SAndroid Build Coastguard Worker
300*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_v4i32_align4:
301*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
302*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
303*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
304*9880d681SAndroid Build Coastguard Worker; EG: LDS_WRITE
305*9880d681SAndroid Build Coastguard Worker
306*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
307*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
308*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
309*9880d681SAndroid Build Coastguard Worker; CM: LDS_WRITE
310*9880d681SAndroid Build Coastguard Worker
311*9880d681SAndroid Build Coastguard Worker; SI: ds_write2_b32
312*9880d681SAndroid Build Coastguard Worker; SI: ds_write2_b32
; Local address space, <4 x i32> with only 4-byte alignment: identical to
; store_local_v4i32 except for the explicit `align 4` on the store. The amdgcn
; checks above expect two ds_write2_b32 instructions here instead of the
; ds_write2_b64 expected for the version without an explicit alignment; the
; redwood and cayman expectations (four LDS_WRITE) are unchanged.
313*9880d681SAndroid Build Coastguard Workerdefine void @store_local_v4i32_align4(<4 x i32> addrspace(3)* %out, <4 x i32> %in) {
314*9880d681SAndroid Build Coastguard Workerentry:
315*9880d681SAndroid Build Coastguard Worker  store <4 x i32> %in, <4 x i32> addrspace(3)* %out, align 4
316*9880d681SAndroid Build Coastguard Worker  ret void
317*9880d681SAndroid Build Coastguard Worker}
318*9880d681SAndroid Build Coastguard Worker
319*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_i64_i8:
320*9880d681SAndroid Build Coastguard Worker; EG: LDS_BYTE_WRITE
321*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b8
; Local address space, truncating store: narrows the i64 argument %in to i8
; and stores that byte through the addrspace(3) pointer %out. The checks above
; expect LDS_BYTE_WRITE on redwood and ds_write_b8 on amdgcn.
322*9880d681SAndroid Build Coastguard Workerdefine void @store_local_i64_i8(i8 addrspace(3)* %out, i64 %in) {
323*9880d681SAndroid Build Coastguard Workerentry:
324*9880d681SAndroid Build Coastguard Worker  %0 = trunc i64 %in to i8
325*9880d681SAndroid Build Coastguard Worker  store i8 %0, i8 addrspace(3)* %out
326*9880d681SAndroid Build Coastguard Worker  ret void
327*9880d681SAndroid Build Coastguard Worker}
328*9880d681SAndroid Build Coastguard Worker
329*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}store_local_i64_i16:
330*9880d681SAndroid Build Coastguard Worker; EG: LDS_SHORT_WRITE
331*9880d681SAndroid Build Coastguard Worker; SI: ds_write_b16
; Local address space, truncating store: narrows the i64 argument %in to i16
; and stores it through the addrspace(3) pointer %out. The checks above expect
; LDS_SHORT_WRITE on redwood and ds_write_b16 on amdgcn.
332*9880d681SAndroid Build Coastguard Workerdefine void @store_local_i64_i16(i16 addrspace(3)* %out, i64 %in) {
333*9880d681SAndroid Build Coastguard Workerentry:
334*9880d681SAndroid Build Coastguard Worker  %0 = trunc i64 %in to i16
335*9880d681SAndroid Build Coastguard Worker  store i16 %0, i16 addrspace(3)* %out
336*9880d681SAndroid Build Coastguard Worker  ret void
337*9880d681SAndroid Build Coastguard Worker}
338*9880d681SAndroid Build Coastguard Worker
339*9880d681SAndroid Build Coastguard Worker; The stores in this function are combined by the optimizer to create a
340*9880d681SAndroid Build Coastguard Worker; 64-bit store with 32-bit alignment.  This is legal for SI and the legalizer
341*9880d681SAndroid Build Coastguard Worker; should not try to split the 64-bit store back into 2 32-bit stores.
342*9880d681SAndroid Build Coastguard Worker;
343*9880d681SAndroid Build Coastguard Worker; Evergreen / Northern Islands don't support 64-bit stores yet, so there should
344*9880d681SAndroid Build Coastguard Worker; be two 32-bit stores.
345*9880d681SAndroid Build Coastguard Worker
346*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}vecload2:
347*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW
348*9880d681SAndroid Build Coastguard Worker
349*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD
350*9880d681SAndroid Build Coastguard Worker
351*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dwordx2
; Copies two consecutive i32 values from %mem to %out: loads %mem[0] and
; %mem[1], then stores them to %out[0] and %out[1]. Every access is marked
; align 4. The amdgcn checks above expect the two adjacent stores to come out
; as one buffer_store_dwordx2. Attribute group #0 marks the function nounwind.
; NOTE(review): %mem lives in addrspace(2); which memory that denotes is not
; stated anywhere in this file - confirm against the target documentation.
352*9880d681SAndroid Build Coastguard Workerdefine void @vecload2(i32 addrspace(1)* nocapture %out, i32 addrspace(2)* nocapture %mem) #0 {
353*9880d681SAndroid Build Coastguard Workerentry:
  ; Both loads are issued before either store.
354*9880d681SAndroid Build Coastguard Worker  %0 = load i32, i32 addrspace(2)* %mem, align 4
355*9880d681SAndroid Build Coastguard Worker  %arrayidx1.i = getelementptr inbounds i32, i32 addrspace(2)* %mem, i64 1
356*9880d681SAndroid Build Coastguard Worker  %1 = load i32, i32 addrspace(2)* %arrayidx1.i, align 4
  ; Two adjacent 32-bit stores, each only 4-byte aligned.
357*9880d681SAndroid Build Coastguard Worker  store i32 %0, i32 addrspace(1)* %out, align 4
358*9880d681SAndroid Build Coastguard Worker  %arrayidx1 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 1
359*9880d681SAndroid Build Coastguard Worker  store i32 %1, i32 addrspace(1)* %arrayidx1, align 4
360*9880d681SAndroid Build Coastguard Worker  ret void
361*9880d681SAndroid Build Coastguard Worker}
362*9880d681SAndroid Build Coastguard Worker
363*9880d681SAndroid Build Coastguard Worker; When i128 was a legal type this program generated cannot select errors:
364*9880d681SAndroid Build Coastguard Worker
365*9880d681SAndroid Build Coastguard Worker; FUNC-LABEL: {{^}}"i128-const-store":
366*9880d681SAndroid Build Coastguard Worker; EG: MEM_RAT_CACHELESS STORE_RAW T{{[0-9]+}}.XYZW, T{{[0-9]+}}.X, 1
367*9880d681SAndroid Build Coastguard Worker
368*9880d681SAndroid Build Coastguard Worker; CM: MEM_RAT_CACHELESS STORE_DWORD T{{[0-9]+}}, T{{[0-9]+}}.X
369*9880d681SAndroid Build Coastguard Worker
370*9880d681SAndroid Build Coastguard Worker; SI: buffer_store_dwordx4
; Writes the constants 1, 1, 2, 2 to %out[0] through %out[3] as four separate
; i32 stores, each align 4. The checks above expect a 128-bit-wide store to
; appear: buffer_store_dwordx4 on amdgcn and an XYZW-wide STORE_RAW on redwood.
; The label check for this function matches the name wrapped in double quotes.
371*9880d681SAndroid Build Coastguard Workerdefine void @i128-const-store(i32 addrspace(1)* %out) {
372*9880d681SAndroid Build Coastguard Workerentry:
373*9880d681SAndroid Build Coastguard Worker  store i32 1, i32 addrspace(1)* %out, align 4
374*9880d681SAndroid Build Coastguard Worker  %arrayidx2 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 1
375*9880d681SAndroid Build Coastguard Worker  store i32 1, i32 addrspace(1)* %arrayidx2, align 4
376*9880d681SAndroid Build Coastguard Worker  %arrayidx4 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 2
377*9880d681SAndroid Build Coastguard Worker  store i32 2, i32 addrspace(1)* %arrayidx4, align 4
378*9880d681SAndroid Build Coastguard Worker  %arrayidx6 = getelementptr inbounds i32, i32 addrspace(1)* %out, i64 3
379*9880d681SAndroid Build Coastguard Worker  store i32 2, i32 addrspace(1)* %arrayidx6, align 4
380*9880d681SAndroid Build Coastguard Worker  ret void
381*9880d681SAndroid Build Coastguard Worker}
382*9880d681SAndroid Build Coastguard Worker
383*9880d681SAndroid Build Coastguard Workerattributes #0 = { nounwind }
384