1*61046927SAndroid Build Coastguard Worker /*
2*61046927SAndroid Build Coastguard Worker * Copyright © 2017-2018 Rob Clark <[email protected]>
3*61046927SAndroid Build Coastguard Worker * SPDX-License-Identifier: MIT
4*61046927SAndroid Build Coastguard Worker *
5*61046927SAndroid Build Coastguard Worker * Authors:
6*61046927SAndroid Build Coastguard Worker * Rob Clark <[email protected]>
7*61046927SAndroid Build Coastguard Worker */
8*61046927SAndroid Build Coastguard Worker
9*61046927SAndroid Build Coastguard Worker #define GPU 600
10*61046927SAndroid Build Coastguard Worker
11*61046927SAndroid Build Coastguard Worker #include "ir3_context.h"
12*61046927SAndroid Build Coastguard Worker #include "ir3_image.h"
13*61046927SAndroid Build Coastguard Worker
/*
 * Handlers for instructions changed/added in a6xx:
 *
 * Starting with a6xx, isam and stbi are used for SSBOs as well; stbi and the
 * atomic instructions (used for both SSBO and image) use a new instruction
 * encoding compared to a4xx/a5xx.
 */
21*61046927SAndroid Build Coastguard Worker
22*61046927SAndroid Build Coastguard Worker static void
lower_ssbo_offset(struct ir3_context * ctx,nir_intrinsic_instr * intr,nir_src * offset_src,struct ir3_instruction ** offset,unsigned * imm_offset)23*61046927SAndroid Build Coastguard Worker lower_ssbo_offset(struct ir3_context *ctx, nir_intrinsic_instr *intr,
24*61046927SAndroid Build Coastguard Worker nir_src *offset_src,
25*61046927SAndroid Build Coastguard Worker struct ir3_instruction **offset, unsigned *imm_offset)
26*61046927SAndroid Build Coastguard Worker {
27*61046927SAndroid Build Coastguard Worker if (ctx->compiler->has_ssbo_imm_offsets) {
28*61046927SAndroid Build Coastguard Worker ir3_lower_imm_offset(ctx, intr, offset_src, 7, offset, imm_offset);
29*61046927SAndroid Build Coastguard Worker } else {
30*61046927SAndroid Build Coastguard Worker assert(nir_intrinsic_base(intr) == 0);
31*61046927SAndroid Build Coastguard Worker *offset = ir3_get_src(ctx, offset_src)[0];
32*61046927SAndroid Build Coastguard Worker *imm_offset = 0;
33*61046927SAndroid Build Coastguard Worker }
34*61046927SAndroid Build Coastguard Worker }
35*61046927SAndroid Build Coastguard Worker
36*61046927SAndroid Build Coastguard Worker /* src[] = { buffer_index, offset }. No const_index */
37*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_load_ssbo(struct ir3_context * ctx,nir_intrinsic_instr * intr,struct ir3_instruction ** dst)38*61046927SAndroid Build Coastguard Worker emit_intrinsic_load_ssbo(struct ir3_context *ctx, nir_intrinsic_instr *intr,
39*61046927SAndroid Build Coastguard Worker struct ir3_instruction **dst)
40*61046927SAndroid Build Coastguard Worker {
41*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
42*61046927SAndroid Build Coastguard Worker struct ir3_instruction *offset;
43*61046927SAndroid Build Coastguard Worker struct ir3_instruction *ldib;
44*61046927SAndroid Build Coastguard Worker unsigned imm_offset_val;
45*61046927SAndroid Build Coastguard Worker
46*61046927SAndroid Build Coastguard Worker lower_ssbo_offset(ctx, intr, &intr->src[2], &offset, &imm_offset_val);
47*61046927SAndroid Build Coastguard Worker struct ir3_instruction *imm_offset = create_immed(b, imm_offset_val);
48*61046927SAndroid Build Coastguard Worker
49*61046927SAndroid Build Coastguard Worker ldib = ir3_LDIB(b, ir3_ssbo_to_ibo(ctx, intr->src[0]), 0, offset, 0,
50*61046927SAndroid Build Coastguard Worker imm_offset, 0);
51*61046927SAndroid Build Coastguard Worker ldib->dsts[0]->wrmask = MASK(intr->num_components);
52*61046927SAndroid Build Coastguard Worker ldib->cat6.iim_val = intr->num_components;
53*61046927SAndroid Build Coastguard Worker ldib->cat6.d = 1;
54*61046927SAndroid Build Coastguard Worker switch (intr->def.bit_size) {
55*61046927SAndroid Build Coastguard Worker case 8:
56*61046927SAndroid Build Coastguard Worker /* This encodes the 8-bit SSBO load and matches blob's encoding of
57*61046927SAndroid Build Coastguard Worker * imageBuffer access using VK_FORMAT_R8 and the dedicated 8-bit
58*61046927SAndroid Build Coastguard Worker * descriptor. No vectorization is possible.
59*61046927SAndroid Build Coastguard Worker */
60*61046927SAndroid Build Coastguard Worker assert(intr->num_components == 1);
61*61046927SAndroid Build Coastguard Worker
62*61046927SAndroid Build Coastguard Worker ldib->cat6.type = TYPE_U16;
63*61046927SAndroid Build Coastguard Worker ldib->cat6.typed = true;
64*61046927SAndroid Build Coastguard Worker break;
65*61046927SAndroid Build Coastguard Worker case 16:
66*61046927SAndroid Build Coastguard Worker ldib->cat6.type = TYPE_U16;
67*61046927SAndroid Build Coastguard Worker break;
68*61046927SAndroid Build Coastguard Worker default:
69*61046927SAndroid Build Coastguard Worker ldib->cat6.type = TYPE_U32;
70*61046927SAndroid Build Coastguard Worker break;
71*61046927SAndroid Build Coastguard Worker }
72*61046927SAndroid Build Coastguard Worker ldib->barrier_class = IR3_BARRIER_BUFFER_R;
73*61046927SAndroid Build Coastguard Worker ldib->barrier_conflict = IR3_BARRIER_BUFFER_W;
74*61046927SAndroid Build Coastguard Worker
75*61046927SAndroid Build Coastguard Worker if (imm_offset_val) {
76*61046927SAndroid Build Coastguard Worker assert(ctx->compiler->has_ssbo_imm_offsets);
77*61046927SAndroid Build Coastguard Worker ldib->flags |= IR3_INSTR_IMM_OFFSET;
78*61046927SAndroid Build Coastguard Worker }
79*61046927SAndroid Build Coastguard Worker
80*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(ldib, intr->src[0]);
81*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(ldib, intr);
82*61046927SAndroid Build Coastguard Worker
83*61046927SAndroid Build Coastguard Worker ir3_split_dest(b, dst, ldib, 0, intr->num_components);
84*61046927SAndroid Build Coastguard Worker }
85*61046927SAndroid Build Coastguard Worker
86*61046927SAndroid Build Coastguard Worker /* src[] = { value, block_index, offset }. const_index[] = { write_mask } */
87*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_store_ssbo(struct ir3_context * ctx,nir_intrinsic_instr * intr)88*61046927SAndroid Build Coastguard Worker emit_intrinsic_store_ssbo(struct ir3_context *ctx, nir_intrinsic_instr *intr)
89*61046927SAndroid Build Coastguard Worker {
90*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
91*61046927SAndroid Build Coastguard Worker struct ir3_instruction *stib, *val, *offset;
92*61046927SAndroid Build Coastguard Worker unsigned wrmask = nir_intrinsic_write_mask(intr);
93*61046927SAndroid Build Coastguard Worker unsigned ncomp = ffs(~wrmask) - 1;
94*61046927SAndroid Build Coastguard Worker unsigned imm_offset_val;
95*61046927SAndroid Build Coastguard Worker
96*61046927SAndroid Build Coastguard Worker assert(wrmask == BITFIELD_MASK(intr->num_components));
97*61046927SAndroid Build Coastguard Worker
98*61046927SAndroid Build Coastguard Worker /* src0 is offset, src1 is immediate offset, src2 is value:
99*61046927SAndroid Build Coastguard Worker */
100*61046927SAndroid Build Coastguard Worker val = ir3_create_collect(b, ir3_get_src(ctx, &intr->src[0]), ncomp);
101*61046927SAndroid Build Coastguard Worker
102*61046927SAndroid Build Coastguard Worker /* Any 8-bit store will be done on a single-component value that additionally
103*61046927SAndroid Build Coastguard Worker * has to be masked to clear up the higher bits or it will malfunction.
104*61046927SAndroid Build Coastguard Worker */
105*61046927SAndroid Build Coastguard Worker if (intr->src[0].ssa->bit_size == 8) {
106*61046927SAndroid Build Coastguard Worker assert(ncomp == 1);
107*61046927SAndroid Build Coastguard Worker
108*61046927SAndroid Build Coastguard Worker struct ir3_instruction *mask = create_immed_typed(b, 0xff, TYPE_U8);
109*61046927SAndroid Build Coastguard Worker val = ir3_AND_B(b, val, 0, mask, 0);
110*61046927SAndroid Build Coastguard Worker val->dsts[0]->flags |= IR3_REG_HALF;
111*61046927SAndroid Build Coastguard Worker }
112*61046927SAndroid Build Coastguard Worker
113*61046927SAndroid Build Coastguard Worker lower_ssbo_offset(ctx, intr, &intr->src[3], &offset, &imm_offset_val);
114*61046927SAndroid Build Coastguard Worker struct ir3_instruction *imm_offset = create_immed(b, imm_offset_val);
115*61046927SAndroid Build Coastguard Worker
116*61046927SAndroid Build Coastguard Worker stib = ir3_STIB(b, ir3_ssbo_to_ibo(ctx, intr->src[1]), 0, offset, 0,
117*61046927SAndroid Build Coastguard Worker imm_offset, 0, val, 0);
118*61046927SAndroid Build Coastguard Worker stib->cat6.iim_val = ncomp;
119*61046927SAndroid Build Coastguard Worker stib->cat6.d = 1;
120*61046927SAndroid Build Coastguard Worker switch (intr->src[0].ssa->bit_size) {
121*61046927SAndroid Build Coastguard Worker case 8:
122*61046927SAndroid Build Coastguard Worker /* As with ldib, this encodes the 8-bit SSBO store and matches blob's
123*61046927SAndroid Build Coastguard Worker * encoding of imageBuffer access using VK_FORMAT_R8 and the extra 8-bit
124*61046927SAndroid Build Coastguard Worker * descriptor. No vectorization is possible and we have to override the
125*61046927SAndroid Build Coastguard Worker * relevant field anyway.
126*61046927SAndroid Build Coastguard Worker */
127*61046927SAndroid Build Coastguard Worker stib->cat6.type = TYPE_U16;
128*61046927SAndroid Build Coastguard Worker stib->cat6.iim_val = 4;
129*61046927SAndroid Build Coastguard Worker stib->cat6.typed = true;
130*61046927SAndroid Build Coastguard Worker break;
131*61046927SAndroid Build Coastguard Worker case 16:
132*61046927SAndroid Build Coastguard Worker stib->cat6.type = TYPE_U16;
133*61046927SAndroid Build Coastguard Worker break;
134*61046927SAndroid Build Coastguard Worker default:
135*61046927SAndroid Build Coastguard Worker stib->cat6.type = TYPE_U32;
136*61046927SAndroid Build Coastguard Worker break;
137*61046927SAndroid Build Coastguard Worker }
138*61046927SAndroid Build Coastguard Worker stib->barrier_class = IR3_BARRIER_BUFFER_W;
139*61046927SAndroid Build Coastguard Worker stib->barrier_conflict = IR3_BARRIER_BUFFER_R | IR3_BARRIER_BUFFER_W;
140*61046927SAndroid Build Coastguard Worker
141*61046927SAndroid Build Coastguard Worker if (imm_offset_val) {
142*61046927SAndroid Build Coastguard Worker assert(ctx->compiler->has_ssbo_imm_offsets);
143*61046927SAndroid Build Coastguard Worker stib->flags |= IR3_INSTR_IMM_OFFSET;
144*61046927SAndroid Build Coastguard Worker }
145*61046927SAndroid Build Coastguard Worker
146*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(stib, intr->src[1]);
147*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(stib, intr);
148*61046927SAndroid Build Coastguard Worker
149*61046927SAndroid Build Coastguard Worker array_insert(b, b->keeps, stib);
150*61046927SAndroid Build Coastguard Worker }
151*61046927SAndroid Build Coastguard Worker
152*61046927SAndroid Build Coastguard Worker static struct ir3_instruction *
emit_atomic(struct ir3_block * b,nir_atomic_op op,struct ir3_instruction * ibo,struct ir3_instruction * src0,struct ir3_instruction * src1)153*61046927SAndroid Build Coastguard Worker emit_atomic(struct ir3_block *b,
154*61046927SAndroid Build Coastguard Worker nir_atomic_op op,
155*61046927SAndroid Build Coastguard Worker struct ir3_instruction *ibo,
156*61046927SAndroid Build Coastguard Worker struct ir3_instruction *src0,
157*61046927SAndroid Build Coastguard Worker struct ir3_instruction *src1)
158*61046927SAndroid Build Coastguard Worker {
159*61046927SAndroid Build Coastguard Worker switch (op) {
160*61046927SAndroid Build Coastguard Worker case nir_atomic_op_iadd:
161*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_ADD(b, ibo, 0, src0, 0, src1, 0);
162*61046927SAndroid Build Coastguard Worker case nir_atomic_op_imin:
163*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_MIN(b, ibo, 0, src0, 0, src1, 0);
164*61046927SAndroid Build Coastguard Worker case nir_atomic_op_umin:
165*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_MIN(b, ibo, 0, src0, 0, src1, 0);
166*61046927SAndroid Build Coastguard Worker case nir_atomic_op_imax:
167*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_MAX(b, ibo, 0, src0, 0, src1, 0);
168*61046927SAndroid Build Coastguard Worker case nir_atomic_op_umax:
169*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_MAX(b, ibo, 0, src0, 0, src1, 0);
170*61046927SAndroid Build Coastguard Worker case nir_atomic_op_iand:
171*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_AND(b, ibo, 0, src0, 0, src1, 0);
172*61046927SAndroid Build Coastguard Worker case nir_atomic_op_ior:
173*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_OR(b, ibo, 0, src0, 0, src1, 0);
174*61046927SAndroid Build Coastguard Worker case nir_atomic_op_ixor:
175*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_XOR(b, ibo, 0, src0, 0, src1, 0);
176*61046927SAndroid Build Coastguard Worker case nir_atomic_op_xchg:
177*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_XCHG(b, ibo, 0, src0, 0, src1, 0);
178*61046927SAndroid Build Coastguard Worker case nir_atomic_op_cmpxchg:
179*61046927SAndroid Build Coastguard Worker return ir3_ATOMIC_B_CMPXCHG(b, ibo, 0, src0, 0, src1, 0);
180*61046927SAndroid Build Coastguard Worker default:
181*61046927SAndroid Build Coastguard Worker unreachable("boo");
182*61046927SAndroid Build Coastguard Worker }
183*61046927SAndroid Build Coastguard Worker }
184*61046927SAndroid Build Coastguard Worker
185*61046927SAndroid Build Coastguard Worker /*
186*61046927SAndroid Build Coastguard Worker * SSBO atomic intrinsics
187*61046927SAndroid Build Coastguard Worker *
188*61046927SAndroid Build Coastguard Worker * All of the SSBO atomic memory operations read a value from memory,
189*61046927SAndroid Build Coastguard Worker * compute a new value using one of the operations below, write the new
190*61046927SAndroid Build Coastguard Worker * value to memory, and return the original value read.
191*61046927SAndroid Build Coastguard Worker *
192*61046927SAndroid Build Coastguard Worker * All operations take 3 sources except CompSwap that takes 4. These
193*61046927SAndroid Build Coastguard Worker * sources represent:
194*61046927SAndroid Build Coastguard Worker *
195*61046927SAndroid Build Coastguard Worker * 0: The SSBO buffer index.
196*61046927SAndroid Build Coastguard Worker * 1: The offset into the SSBO buffer of the variable that the atomic
197*61046927SAndroid Build Coastguard Worker * operation will operate on.
198*61046927SAndroid Build Coastguard Worker * 2: The data parameter to the atomic function (i.e. the value to add
199*61046927SAndroid Build Coastguard Worker * in, etc).
200*61046927SAndroid Build Coastguard Worker * 3: For CompSwap only: the second data parameter.
201*61046927SAndroid Build Coastguard Worker */
202*61046927SAndroid Build Coastguard Worker static struct ir3_instruction *
emit_intrinsic_atomic_ssbo(struct ir3_context * ctx,nir_intrinsic_instr * intr)203*61046927SAndroid Build Coastguard Worker emit_intrinsic_atomic_ssbo(struct ir3_context *ctx, nir_intrinsic_instr *intr)
204*61046927SAndroid Build Coastguard Worker {
205*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
206*61046927SAndroid Build Coastguard Worker struct ir3_instruction *atomic, *ibo, *src0, *src1, *data, *dummy;
207*61046927SAndroid Build Coastguard Worker nir_atomic_op op = nir_intrinsic_atomic_op(intr);
208*61046927SAndroid Build Coastguard Worker type_t type = nir_atomic_op_type(op) == nir_type_int ? TYPE_S32 : TYPE_U32;
209*61046927SAndroid Build Coastguard Worker
210*61046927SAndroid Build Coastguard Worker ibo = ir3_ssbo_to_ibo(ctx, intr->src[0]);
211*61046927SAndroid Build Coastguard Worker
212*61046927SAndroid Build Coastguard Worker data = ir3_get_src(ctx, &intr->src[2])[0];
213*61046927SAndroid Build Coastguard Worker
214*61046927SAndroid Build Coastguard Worker /* So this gets a bit creative:
215*61046927SAndroid Build Coastguard Worker *
216*61046927SAndroid Build Coastguard Worker * src0 - vecN offset/coords
217*61046927SAndroid Build Coastguard Worker * src1.x - is actually destination register
218*61046927SAndroid Build Coastguard Worker * src1.y - is 'data' except for cmpxchg where src2.y is 'compare'
219*61046927SAndroid Build Coastguard Worker * src1.z - is 'data' for cmpxchg
220*61046927SAndroid Build Coastguard Worker *
221*61046927SAndroid Build Coastguard Worker * The combining src and dest kinda doesn't work out so well with how
222*61046927SAndroid Build Coastguard Worker * scheduling and RA work. So we create a dummy src2 which is tied to the
223*61046927SAndroid Build Coastguard Worker * destination in RA (i.e. must be allocated to the same vec2/vec3
224*61046927SAndroid Build Coastguard Worker * register) and then immediately extract the first component.
225*61046927SAndroid Build Coastguard Worker *
226*61046927SAndroid Build Coastguard Worker * Note that nir already multiplies the offset by four
227*61046927SAndroid Build Coastguard Worker */
228*61046927SAndroid Build Coastguard Worker dummy = create_immed(b, 0);
229*61046927SAndroid Build Coastguard Worker
230*61046927SAndroid Build Coastguard Worker if (op == nir_atomic_op_cmpxchg) {
231*61046927SAndroid Build Coastguard Worker src0 = ir3_get_src(ctx, &intr->src[4])[0];
232*61046927SAndroid Build Coastguard Worker struct ir3_instruction *compare = ir3_get_src(ctx, &intr->src[3])[0];
233*61046927SAndroid Build Coastguard Worker src1 = ir3_collect(b, dummy, compare, data);
234*61046927SAndroid Build Coastguard Worker } else {
235*61046927SAndroid Build Coastguard Worker src0 = ir3_get_src(ctx, &intr->src[3])[0];
236*61046927SAndroid Build Coastguard Worker src1 = ir3_collect(b, dummy, data);
237*61046927SAndroid Build Coastguard Worker }
238*61046927SAndroid Build Coastguard Worker
239*61046927SAndroid Build Coastguard Worker atomic = emit_atomic(b, op, ibo, src0, src1);
240*61046927SAndroid Build Coastguard Worker atomic->cat6.iim_val = 1;
241*61046927SAndroid Build Coastguard Worker atomic->cat6.d = 1;
242*61046927SAndroid Build Coastguard Worker atomic->cat6.type = type;
243*61046927SAndroid Build Coastguard Worker atomic->barrier_class = IR3_BARRIER_BUFFER_W;
244*61046927SAndroid Build Coastguard Worker atomic->barrier_conflict = IR3_BARRIER_BUFFER_R | IR3_BARRIER_BUFFER_W;
245*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(atomic, intr->src[0]);
246*61046927SAndroid Build Coastguard Worker
247*61046927SAndroid Build Coastguard Worker /* even if nothing consume the result, we can't DCE the instruction: */
248*61046927SAndroid Build Coastguard Worker array_insert(b, b->keeps, atomic);
249*61046927SAndroid Build Coastguard Worker
250*61046927SAndroid Build Coastguard Worker atomic->dsts[0]->wrmask = src1->dsts[0]->wrmask;
251*61046927SAndroid Build Coastguard Worker ir3_reg_tie(atomic->dsts[0], atomic->srcs[2]);
252*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(atomic, intr);
253*61046927SAndroid Build Coastguard Worker struct ir3_instruction *split;
254*61046927SAndroid Build Coastguard Worker ir3_split_dest(b, &split, atomic, 0, 1);
255*61046927SAndroid Build Coastguard Worker return split;
256*61046927SAndroid Build Coastguard Worker }
257*61046927SAndroid Build Coastguard Worker
258*61046927SAndroid Build Coastguard Worker /* src[] = { deref, coord, sample_index }. const_index[] = {} */
259*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_load_image(struct ir3_context * ctx,nir_intrinsic_instr * intr,struct ir3_instruction ** dst)260*61046927SAndroid Build Coastguard Worker emit_intrinsic_load_image(struct ir3_context *ctx, nir_intrinsic_instr *intr,
261*61046927SAndroid Build Coastguard Worker struct ir3_instruction **dst)
262*61046927SAndroid Build Coastguard Worker {
263*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
264*61046927SAndroid Build Coastguard Worker struct ir3_instruction *ldib;
265*61046927SAndroid Build Coastguard Worker struct ir3_instruction *const *coords = ir3_get_src(ctx, &intr->src[1]);
266*61046927SAndroid Build Coastguard Worker unsigned ncoords = ir3_get_image_coords(intr, NULL);
267*61046927SAndroid Build Coastguard Worker
268*61046927SAndroid Build Coastguard Worker ldib = ir3_LDIB(b, ir3_image_to_ibo(ctx, intr->src[0]), 0,
269*61046927SAndroid Build Coastguard Worker ir3_create_collect(b, coords, ncoords), 0,
270*61046927SAndroid Build Coastguard Worker create_immed(b, 0), 0);
271*61046927SAndroid Build Coastguard Worker ldib->dsts[0]->wrmask = MASK(intr->num_components);
272*61046927SAndroid Build Coastguard Worker ldib->cat6.iim_val = intr->num_components;
273*61046927SAndroid Build Coastguard Worker ldib->cat6.d = ncoords;
274*61046927SAndroid Build Coastguard Worker ldib->cat6.type = ir3_get_type_for_image_intrinsic(intr);
275*61046927SAndroid Build Coastguard Worker ldib->cat6.typed = true;
276*61046927SAndroid Build Coastguard Worker ldib->barrier_class = IR3_BARRIER_IMAGE_R;
277*61046927SAndroid Build Coastguard Worker ldib->barrier_conflict = IR3_BARRIER_IMAGE_W;
278*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(ldib, intr->src[0]);
279*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(ldib, intr);
280*61046927SAndroid Build Coastguard Worker
281*61046927SAndroid Build Coastguard Worker ir3_split_dest(b, dst, ldib, 0, intr->num_components);
282*61046927SAndroid Build Coastguard Worker }
283*61046927SAndroid Build Coastguard Worker
284*61046927SAndroid Build Coastguard Worker /* src[] = { deref, coord, sample_index, value }. const_index[] = {} */
285*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_store_image(struct ir3_context * ctx,nir_intrinsic_instr * intr)286*61046927SAndroid Build Coastguard Worker emit_intrinsic_store_image(struct ir3_context *ctx, nir_intrinsic_instr *intr)
287*61046927SAndroid Build Coastguard Worker {
288*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
289*61046927SAndroid Build Coastguard Worker struct ir3_instruction *stib;
290*61046927SAndroid Build Coastguard Worker struct ir3_instruction *const *value = ir3_get_src(ctx, &intr->src[3]);
291*61046927SAndroid Build Coastguard Worker struct ir3_instruction *const *coords = ir3_get_src(ctx, &intr->src[1]);
292*61046927SAndroid Build Coastguard Worker unsigned ncoords = ir3_get_image_coords(intr, NULL);
293*61046927SAndroid Build Coastguard Worker enum pipe_format format = nir_intrinsic_format(intr);
294*61046927SAndroid Build Coastguard Worker unsigned ncomp = ir3_get_num_components_for_image_format(format);
295*61046927SAndroid Build Coastguard Worker
296*61046927SAndroid Build Coastguard Worker /* src0 is offset, src1 is value:
297*61046927SAndroid Build Coastguard Worker */
298*61046927SAndroid Build Coastguard Worker stib =
299*61046927SAndroid Build Coastguard Worker ir3_STIB(b, ir3_image_to_ibo(ctx, intr->src[0]), 0,
300*61046927SAndroid Build Coastguard Worker ir3_create_collect(b, coords, ncoords), 0, create_immed(b, 0), 0,
301*61046927SAndroid Build Coastguard Worker ir3_create_collect(b, value, ncomp), 0);
302*61046927SAndroid Build Coastguard Worker stib->cat6.iim_val = ncomp;
303*61046927SAndroid Build Coastguard Worker stib->cat6.d = ncoords;
304*61046927SAndroid Build Coastguard Worker stib->cat6.type = ir3_get_type_for_image_intrinsic(intr);
305*61046927SAndroid Build Coastguard Worker stib->cat6.typed = true;
306*61046927SAndroid Build Coastguard Worker stib->barrier_class = IR3_BARRIER_IMAGE_W;
307*61046927SAndroid Build Coastguard Worker stib->barrier_conflict = IR3_BARRIER_IMAGE_R | IR3_BARRIER_IMAGE_W;
308*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(stib, intr->src[0]);
309*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(stib, intr);
310*61046927SAndroid Build Coastguard Worker
311*61046927SAndroid Build Coastguard Worker array_insert(b, b->keeps, stib);
312*61046927SAndroid Build Coastguard Worker }
313*61046927SAndroid Build Coastguard Worker
314*61046927SAndroid Build Coastguard Worker /* src[] = { deref, coord, sample_index, value, compare }. const_index[] = {} */
315*61046927SAndroid Build Coastguard Worker static struct ir3_instruction *
emit_intrinsic_atomic_image(struct ir3_context * ctx,nir_intrinsic_instr * intr)316*61046927SAndroid Build Coastguard Worker emit_intrinsic_atomic_image(struct ir3_context *ctx, nir_intrinsic_instr *intr)
317*61046927SAndroid Build Coastguard Worker {
318*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
319*61046927SAndroid Build Coastguard Worker struct ir3_instruction *atomic, *ibo, *src0, *src1, *dummy;
320*61046927SAndroid Build Coastguard Worker struct ir3_instruction *const *coords = ir3_get_src(ctx, &intr->src[1]);
321*61046927SAndroid Build Coastguard Worker struct ir3_instruction *value = ir3_get_src(ctx, &intr->src[3])[0];
322*61046927SAndroid Build Coastguard Worker unsigned ncoords = ir3_get_image_coords(intr, NULL);
323*61046927SAndroid Build Coastguard Worker nir_atomic_op op = nir_intrinsic_atomic_op(intr);
324*61046927SAndroid Build Coastguard Worker
325*61046927SAndroid Build Coastguard Worker ibo = ir3_image_to_ibo(ctx, intr->src[0]);
326*61046927SAndroid Build Coastguard Worker
327*61046927SAndroid Build Coastguard Worker /* So this gets a bit creative:
328*61046927SAndroid Build Coastguard Worker *
329*61046927SAndroid Build Coastguard Worker * src0 - vecN offset/coords
330*61046927SAndroid Build Coastguard Worker * src1.x - is actually destination register
331*61046927SAndroid Build Coastguard Worker * src1.y - is 'value' except for cmpxchg where src2.y is 'compare'
332*61046927SAndroid Build Coastguard Worker * src1.z - is 'value' for cmpxchg
333*61046927SAndroid Build Coastguard Worker *
334*61046927SAndroid Build Coastguard Worker * The combining src and dest kinda doesn't work out so well with how
335*61046927SAndroid Build Coastguard Worker * scheduling and RA work. So we create a dummy src2 which is tied to the
336*61046927SAndroid Build Coastguard Worker * destination in RA (i.e. must be allocated to the same vec2/vec3
337*61046927SAndroid Build Coastguard Worker * register) and then immediately extract the first component.
338*61046927SAndroid Build Coastguard Worker */
339*61046927SAndroid Build Coastguard Worker dummy = create_immed(b, 0);
340*61046927SAndroid Build Coastguard Worker src0 = ir3_create_collect(b, coords, ncoords);
341*61046927SAndroid Build Coastguard Worker
342*61046927SAndroid Build Coastguard Worker if (op == nir_atomic_op_cmpxchg) {
343*61046927SAndroid Build Coastguard Worker struct ir3_instruction *compare = ir3_get_src(ctx, &intr->src[4])[0];
344*61046927SAndroid Build Coastguard Worker src1 = ir3_collect(b, dummy, compare, value);
345*61046927SAndroid Build Coastguard Worker } else {
346*61046927SAndroid Build Coastguard Worker src1 = ir3_collect(b, dummy, value);
347*61046927SAndroid Build Coastguard Worker }
348*61046927SAndroid Build Coastguard Worker
349*61046927SAndroid Build Coastguard Worker atomic = emit_atomic(b, op, ibo, src0, src1);
350*61046927SAndroid Build Coastguard Worker atomic->cat6.iim_val = 1;
351*61046927SAndroid Build Coastguard Worker atomic->cat6.d = ncoords;
352*61046927SAndroid Build Coastguard Worker atomic->cat6.type = ir3_get_type_for_image_intrinsic(intr);
353*61046927SAndroid Build Coastguard Worker atomic->cat6.typed = true;
354*61046927SAndroid Build Coastguard Worker atomic->barrier_class = IR3_BARRIER_IMAGE_W;
355*61046927SAndroid Build Coastguard Worker atomic->barrier_conflict = IR3_BARRIER_IMAGE_R | IR3_BARRIER_IMAGE_W;
356*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(atomic, intr->src[0]);
357*61046927SAndroid Build Coastguard Worker
358*61046927SAndroid Build Coastguard Worker /* even if nothing consume the result, we can't DCE the instruction: */
359*61046927SAndroid Build Coastguard Worker array_insert(b, b->keeps, atomic);
360*61046927SAndroid Build Coastguard Worker
361*61046927SAndroid Build Coastguard Worker atomic->dsts[0]->wrmask = src1->dsts[0]->wrmask;
362*61046927SAndroid Build Coastguard Worker ir3_reg_tie(atomic->dsts[0], atomic->srcs[2]);
363*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(atomic, intr);
364*61046927SAndroid Build Coastguard Worker struct ir3_instruction *split;
365*61046927SAndroid Build Coastguard Worker ir3_split_dest(b, &split, atomic, 0, 1);
366*61046927SAndroid Build Coastguard Worker return split;
367*61046927SAndroid Build Coastguard Worker }
368*61046927SAndroid Build Coastguard Worker
369*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_image_size(struct ir3_context * ctx,nir_intrinsic_instr * intr,struct ir3_instruction ** dst)370*61046927SAndroid Build Coastguard Worker emit_intrinsic_image_size(struct ir3_context *ctx, nir_intrinsic_instr *intr,
371*61046927SAndroid Build Coastguard Worker struct ir3_instruction **dst)
372*61046927SAndroid Build Coastguard Worker {
373*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
374*61046927SAndroid Build Coastguard Worker struct ir3_instruction *ibo = ir3_image_to_ibo(ctx, intr->src[0]);
375*61046927SAndroid Build Coastguard Worker struct ir3_instruction *resinfo = ir3_RESINFO(b, ibo, 0);
376*61046927SAndroid Build Coastguard Worker resinfo->cat6.iim_val = 1;
377*61046927SAndroid Build Coastguard Worker resinfo->cat6.d = intr->num_components;
378*61046927SAndroid Build Coastguard Worker resinfo->cat6.type = TYPE_U32;
379*61046927SAndroid Build Coastguard Worker resinfo->cat6.typed = false;
380*61046927SAndroid Build Coastguard Worker /* resinfo has no writemask and always writes out 3 components: */
381*61046927SAndroid Build Coastguard Worker compile_assert(ctx, intr->num_components <= 3);
382*61046927SAndroid Build Coastguard Worker resinfo->dsts[0]->wrmask = MASK(3);
383*61046927SAndroid Build Coastguard Worker ir3_handle_bindless_cat6(resinfo, intr->src[0]);
384*61046927SAndroid Build Coastguard Worker ir3_handle_nonuniform(resinfo, intr);
385*61046927SAndroid Build Coastguard Worker
386*61046927SAndroid Build Coastguard Worker ir3_split_dest(b, dst, resinfo, 0, intr->num_components);
387*61046927SAndroid Build Coastguard Worker }
388*61046927SAndroid Build Coastguard Worker
389*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_load_global_ir3(struct ir3_context * ctx,nir_intrinsic_instr * intr,struct ir3_instruction ** dst)390*61046927SAndroid Build Coastguard Worker emit_intrinsic_load_global_ir3(struct ir3_context *ctx,
391*61046927SAndroid Build Coastguard Worker nir_intrinsic_instr *intr,
392*61046927SAndroid Build Coastguard Worker struct ir3_instruction **dst)
393*61046927SAndroid Build Coastguard Worker {
394*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
395*61046927SAndroid Build Coastguard Worker unsigned dest_components = nir_intrinsic_dest_components(intr);
396*61046927SAndroid Build Coastguard Worker struct ir3_instruction *addr, *offset;
397*61046927SAndroid Build Coastguard Worker
398*61046927SAndroid Build Coastguard Worker addr = ir3_collect(b, ir3_get_src(ctx, &intr->src[0])[0],
399*61046927SAndroid Build Coastguard Worker ir3_get_src(ctx, &intr->src[0])[1]);
400*61046927SAndroid Build Coastguard Worker
401*61046927SAndroid Build Coastguard Worker struct ir3_instruction *load;
402*61046927SAndroid Build Coastguard Worker
403*61046927SAndroid Build Coastguard Worker bool const_offset_in_bounds =
404*61046927SAndroid Build Coastguard Worker nir_src_is_const(intr->src[1]) &&
405*61046927SAndroid Build Coastguard Worker nir_src_as_int(intr->src[1]) < (1 << 8) &&
406*61046927SAndroid Build Coastguard Worker nir_src_as_int(intr->src[1]) > -(1 << 8);
407*61046927SAndroid Build Coastguard Worker
408*61046927SAndroid Build Coastguard Worker if (const_offset_in_bounds) {
409*61046927SAndroid Build Coastguard Worker load = ir3_LDG(b, addr, 0,
410*61046927SAndroid Build Coastguard Worker create_immed(b, nir_src_as_int(intr->src[1]) * 4),
411*61046927SAndroid Build Coastguard Worker 0, create_immed(b, dest_components), 0);
412*61046927SAndroid Build Coastguard Worker } else {
413*61046927SAndroid Build Coastguard Worker unsigned shift = ctx->compiler->gen >= 7 ? 2 : 0;
414*61046927SAndroid Build Coastguard Worker offset = ir3_get_src(ctx, &intr->src[1])[0];
415*61046927SAndroid Build Coastguard Worker if (shift) {
416*61046927SAndroid Build Coastguard Worker /* A7XX TODO: Move to NIR for it to be properly optimized? */
417*61046927SAndroid Build Coastguard Worker offset = ir3_SHL_B(b, offset, 0, create_immed(b, shift), 0);
418*61046927SAndroid Build Coastguard Worker }
419*61046927SAndroid Build Coastguard Worker load =
420*61046927SAndroid Build Coastguard Worker ir3_LDG_A(b, addr, 0, offset, 0, create_immed(b, 0), 0,
421*61046927SAndroid Build Coastguard Worker create_immed(b, 0), 0, create_immed(b, dest_components), 0);
422*61046927SAndroid Build Coastguard Worker }
423*61046927SAndroid Build Coastguard Worker
424*61046927SAndroid Build Coastguard Worker load->cat6.type = type_uint_size(intr->def.bit_size);
425*61046927SAndroid Build Coastguard Worker load->dsts[0]->wrmask = MASK(dest_components);
426*61046927SAndroid Build Coastguard Worker
427*61046927SAndroid Build Coastguard Worker load->barrier_class = IR3_BARRIER_BUFFER_R;
428*61046927SAndroid Build Coastguard Worker load->barrier_conflict = IR3_BARRIER_BUFFER_W;
429*61046927SAndroid Build Coastguard Worker
430*61046927SAndroid Build Coastguard Worker ir3_split_dest(b, dst, load, 0, dest_components);
431*61046927SAndroid Build Coastguard Worker }
432*61046927SAndroid Build Coastguard Worker
433*61046927SAndroid Build Coastguard Worker static void
emit_intrinsic_store_global_ir3(struct ir3_context * ctx,nir_intrinsic_instr * intr)434*61046927SAndroid Build Coastguard Worker emit_intrinsic_store_global_ir3(struct ir3_context *ctx,
435*61046927SAndroid Build Coastguard Worker nir_intrinsic_instr *intr)
436*61046927SAndroid Build Coastguard Worker {
437*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
438*61046927SAndroid Build Coastguard Worker struct ir3_instruction *value, *addr, *offset;
439*61046927SAndroid Build Coastguard Worker unsigned ncomp = nir_intrinsic_src_components(intr, 0);
440*61046927SAndroid Build Coastguard Worker
441*61046927SAndroid Build Coastguard Worker addr = ir3_collect(b, ir3_get_src(ctx, &intr->src[1])[0],
442*61046927SAndroid Build Coastguard Worker ir3_get_src(ctx, &intr->src[1])[1]);
443*61046927SAndroid Build Coastguard Worker
444*61046927SAndroid Build Coastguard Worker value = ir3_create_collect(b, ir3_get_src(ctx, &intr->src[0]), ncomp);
445*61046927SAndroid Build Coastguard Worker
446*61046927SAndroid Build Coastguard Worker struct ir3_instruction *stg;
447*61046927SAndroid Build Coastguard Worker
448*61046927SAndroid Build Coastguard Worker bool const_offset_in_bounds = nir_src_is_const(intr->src[2]) &&
449*61046927SAndroid Build Coastguard Worker nir_src_as_int(intr->src[2]) < (1 << 10) &&
450*61046927SAndroid Build Coastguard Worker nir_src_as_int(intr->src[2]) > -(1 << 10);
451*61046927SAndroid Build Coastguard Worker
452*61046927SAndroid Build Coastguard Worker if (const_offset_in_bounds) {
453*61046927SAndroid Build Coastguard Worker stg = ir3_STG(b, addr, 0,
454*61046927SAndroid Build Coastguard Worker create_immed(b, nir_src_as_int(intr->src[2]) * 4), 0,
455*61046927SAndroid Build Coastguard Worker value, 0,
456*61046927SAndroid Build Coastguard Worker create_immed(b, ncomp), 0);
457*61046927SAndroid Build Coastguard Worker } else {
458*61046927SAndroid Build Coastguard Worker offset = ir3_get_src(ctx, &intr->src[2])[0];
459*61046927SAndroid Build Coastguard Worker if (ctx->compiler->gen >= 7) {
460*61046927SAndroid Build Coastguard Worker /* A7XX TODO: Move to NIR for it to be properly optimized? */
461*61046927SAndroid Build Coastguard Worker offset = ir3_SHL_B(b, offset, 0, create_immed(b, 2), 0);
462*61046927SAndroid Build Coastguard Worker }
463*61046927SAndroid Build Coastguard Worker stg =
464*61046927SAndroid Build Coastguard Worker ir3_STG_A(b, addr, 0, offset, 0, create_immed(b, 0), 0,
465*61046927SAndroid Build Coastguard Worker create_immed(b, 0), 0, value, 0, create_immed(b, ncomp), 0);
466*61046927SAndroid Build Coastguard Worker }
467*61046927SAndroid Build Coastguard Worker
468*61046927SAndroid Build Coastguard Worker stg->cat6.type = type_uint_size(intr->src[0].ssa->bit_size);
469*61046927SAndroid Build Coastguard Worker stg->cat6.iim_val = 1;
470*61046927SAndroid Build Coastguard Worker
471*61046927SAndroid Build Coastguard Worker array_insert(b, b->keeps, stg);
472*61046927SAndroid Build Coastguard Worker
473*61046927SAndroid Build Coastguard Worker stg->barrier_class = IR3_BARRIER_BUFFER_W;
474*61046927SAndroid Build Coastguard Worker stg->barrier_conflict = IR3_BARRIER_BUFFER_R | IR3_BARRIER_BUFFER_W;
475*61046927SAndroid Build Coastguard Worker }
476*61046927SAndroid Build Coastguard Worker
477*61046927SAndroid Build Coastguard Worker static struct ir3_instruction *
emit_intrinsic_atomic_global(struct ir3_context * ctx,nir_intrinsic_instr * intr)478*61046927SAndroid Build Coastguard Worker emit_intrinsic_atomic_global(struct ir3_context *ctx, nir_intrinsic_instr *intr)
479*61046927SAndroid Build Coastguard Worker {
480*61046927SAndroid Build Coastguard Worker struct ir3_block *b = ctx->block;
481*61046927SAndroid Build Coastguard Worker struct ir3_instruction *addr, *atomic, *src1;
482*61046927SAndroid Build Coastguard Worker struct ir3_instruction *value = ir3_get_src(ctx, &intr->src[1])[0];
483*61046927SAndroid Build Coastguard Worker nir_atomic_op op = nir_intrinsic_atomic_op(intr);
484*61046927SAndroid Build Coastguard Worker type_t type = nir_atomic_op_type(op) == nir_type_int ? TYPE_S32 : TYPE_U32;
485*61046927SAndroid Build Coastguard Worker
486*61046927SAndroid Build Coastguard Worker addr = ir3_collect(b, ir3_get_src(ctx, &intr->src[0])[0],
487*61046927SAndroid Build Coastguard Worker ir3_get_src(ctx, &intr->src[0])[1]);
488*61046927SAndroid Build Coastguard Worker
489*61046927SAndroid Build Coastguard Worker if (op == nir_atomic_op_cmpxchg) {
490*61046927SAndroid Build Coastguard Worker struct ir3_instruction *compare = ir3_get_src(ctx, &intr->src[2])[0];
491*61046927SAndroid Build Coastguard Worker src1 = ir3_collect(b, compare, value);
492*61046927SAndroid Build Coastguard Worker } else {
493*61046927SAndroid Build Coastguard Worker src1 = value;
494*61046927SAndroid Build Coastguard Worker }
495*61046927SAndroid Build Coastguard Worker
496*61046927SAndroid Build Coastguard Worker switch (op) {
497*61046927SAndroid Build Coastguard Worker case nir_atomic_op_iadd:
498*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_ADD(b, addr, 0, src1, 0);
499*61046927SAndroid Build Coastguard Worker break;
500*61046927SAndroid Build Coastguard Worker case nir_atomic_op_imin:
501*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_MIN(b, addr, 0, src1, 0);
502*61046927SAndroid Build Coastguard Worker type = TYPE_S32;
503*61046927SAndroid Build Coastguard Worker break;
504*61046927SAndroid Build Coastguard Worker case nir_atomic_op_umin:
505*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_MIN(b, addr, 0, src1, 0);
506*61046927SAndroid Build Coastguard Worker break;
507*61046927SAndroid Build Coastguard Worker case nir_atomic_op_imax:
508*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_MAX(b, addr, 0, src1, 0);
509*61046927SAndroid Build Coastguard Worker type = TYPE_S32;
510*61046927SAndroid Build Coastguard Worker break;
511*61046927SAndroid Build Coastguard Worker case nir_atomic_op_umax:
512*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_MAX(b, addr, 0, src1, 0);
513*61046927SAndroid Build Coastguard Worker break;
514*61046927SAndroid Build Coastguard Worker case nir_atomic_op_iand:
515*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_AND(b, addr, 0, src1, 0);
516*61046927SAndroid Build Coastguard Worker break;
517*61046927SAndroid Build Coastguard Worker case nir_atomic_op_ior:
518*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_OR(b, addr, 0, src1, 0);
519*61046927SAndroid Build Coastguard Worker break;
520*61046927SAndroid Build Coastguard Worker case nir_atomic_op_ixor:
521*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_XOR(b, addr, 0, src1, 0);
522*61046927SAndroid Build Coastguard Worker break;
523*61046927SAndroid Build Coastguard Worker case nir_atomic_op_xchg:
524*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_XCHG(b, addr, 0, src1, 0);
525*61046927SAndroid Build Coastguard Worker break;
526*61046927SAndroid Build Coastguard Worker case nir_atomic_op_cmpxchg:
527*61046927SAndroid Build Coastguard Worker atomic = ir3_ATOMIC_G_CMPXCHG(b, addr, 0, src1, 0);
528*61046927SAndroid Build Coastguard Worker break;
529*61046927SAndroid Build Coastguard Worker default:
530*61046927SAndroid Build Coastguard Worker unreachable("Unknown global atomic op");
531*61046927SAndroid Build Coastguard Worker }
532*61046927SAndroid Build Coastguard Worker
533*61046927SAndroid Build Coastguard Worker atomic->cat6.iim_val = 1;
534*61046927SAndroid Build Coastguard Worker atomic->cat6.d = 1;
535*61046927SAndroid Build Coastguard Worker atomic->cat6.type = type;
536*61046927SAndroid Build Coastguard Worker atomic->barrier_class = IR3_BARRIER_BUFFER_W;
537*61046927SAndroid Build Coastguard Worker atomic->barrier_conflict = IR3_BARRIER_BUFFER_R | IR3_BARRIER_BUFFER_W;
538*61046927SAndroid Build Coastguard Worker
539*61046927SAndroid Build Coastguard Worker /* even if nothing consume the result, we can't DCE the instruction: */
540*61046927SAndroid Build Coastguard Worker array_insert(b, b->keeps, atomic);
541*61046927SAndroid Build Coastguard Worker
542*61046927SAndroid Build Coastguard Worker return atomic;
543*61046927SAndroid Build Coastguard Worker }
544*61046927SAndroid Build Coastguard Worker
545*61046927SAndroid Build Coastguard Worker const struct ir3_context_funcs ir3_a6xx_funcs = {
546*61046927SAndroid Build Coastguard Worker .emit_intrinsic_load_ssbo = emit_intrinsic_load_ssbo,
547*61046927SAndroid Build Coastguard Worker .emit_intrinsic_store_ssbo = emit_intrinsic_store_ssbo,
548*61046927SAndroid Build Coastguard Worker .emit_intrinsic_atomic_ssbo = emit_intrinsic_atomic_ssbo,
549*61046927SAndroid Build Coastguard Worker .emit_intrinsic_load_image = emit_intrinsic_load_image,
550*61046927SAndroid Build Coastguard Worker .emit_intrinsic_store_image = emit_intrinsic_store_image,
551*61046927SAndroid Build Coastguard Worker .emit_intrinsic_atomic_image = emit_intrinsic_atomic_image,
552*61046927SAndroid Build Coastguard Worker .emit_intrinsic_image_size = emit_intrinsic_image_size,
553*61046927SAndroid Build Coastguard Worker .emit_intrinsic_load_global_ir3 = emit_intrinsic_load_global_ir3,
554*61046927SAndroid Build Coastguard Worker .emit_intrinsic_store_global_ir3 = emit_intrinsic_store_global_ir3,
555*61046927SAndroid Build Coastguard Worker .emit_intrinsic_atomic_global = emit_intrinsic_atomic_global,
556*61046927SAndroid Build Coastguard Worker };
557