1*61046927SAndroid Build Coastguard Worker /*
2*61046927SAndroid Build Coastguard Worker * Copyright © 2016 Red Hat.
3*61046927SAndroid Build Coastguard Worker * Copyright © 2016 Bas Nieuwenhuizen
4*61046927SAndroid Build Coastguard Worker *
5*61046927SAndroid Build Coastguard Worker * SPDX-License-Identifier: MIT
6*61046927SAndroid Build Coastguard Worker */
7*61046927SAndroid Build Coastguard Worker
8*61046927SAndroid Build Coastguard Worker #ifndef RADV_CS_H
9*61046927SAndroid Build Coastguard Worker #define RADV_CS_H
10*61046927SAndroid Build Coastguard Worker
11*61046927SAndroid Build Coastguard Worker #include <assert.h>
12*61046927SAndroid Build Coastguard Worker #include <stdint.h>
13*61046927SAndroid Build Coastguard Worker #include <string.h>
14*61046927SAndroid Build Coastguard Worker
15*61046927SAndroid Build Coastguard Worker #include "radv_cmd_buffer.h"
16*61046927SAndroid Build Coastguard Worker #include "radv_radeon_winsys.h"
17*61046927SAndroid Build Coastguard Worker #include "sid.h"
18*61046927SAndroid Build Coastguard Worker
19*61046927SAndroid Build Coastguard Worker static inline unsigned
radeon_check_space(struct radeon_winsys * ws,struct radeon_cmdbuf * cs,unsigned needed)20*61046927SAndroid Build Coastguard Worker radeon_check_space(struct radeon_winsys *ws, struct radeon_cmdbuf *cs, unsigned needed)
21*61046927SAndroid Build Coastguard Worker {
22*61046927SAndroid Build Coastguard Worker assert(cs->cdw <= cs->reserved_dw);
23*61046927SAndroid Build Coastguard Worker if (cs->max_dw - cs->cdw < needed)
24*61046927SAndroid Build Coastguard Worker ws->cs_grow(cs, needed);
25*61046927SAndroid Build Coastguard Worker cs->reserved_dw = MAX2(cs->reserved_dw, cs->cdw + needed);
26*61046927SAndroid Build Coastguard Worker return cs->cdw + needed;
27*61046927SAndroid Build Coastguard Worker }
28*61046927SAndroid Build Coastguard Worker
29*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_reg_seq(struct radeon_cmdbuf * cs,unsigned reg,unsigned num,unsigned idx,unsigned base_reg_offset,unsigned packet,bool reset_filter_cam)30*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(struct radeon_cmdbuf *cs, unsigned reg, unsigned num, unsigned idx, unsigned base_reg_offset,
31*61046927SAndroid Build Coastguard Worker unsigned packet, bool reset_filter_cam)
32*61046927SAndroid Build Coastguard Worker {
33*61046927SAndroid Build Coastguard Worker assert(cs->cdw + 2 + num <= cs->reserved_dw);
34*61046927SAndroid Build Coastguard Worker assert(num);
35*61046927SAndroid Build Coastguard Worker radeon_emit(cs, PKT3(packet, num, 0) | PKT3_RESET_FILTER_CAM_S(reset_filter_cam));
36*61046927SAndroid Build Coastguard Worker radeon_emit(cs, ((reg - base_reg_offset) >> 2) | (idx << 28));
37*61046927SAndroid Build Coastguard Worker }
38*61046927SAndroid Build Coastguard Worker
39*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_config_reg_seq(struct radeon_cmdbuf * cs,unsigned reg,unsigned num)40*61046927SAndroid Build Coastguard Worker radeon_set_config_reg_seq(struct radeon_cmdbuf *cs, unsigned reg, unsigned num)
41*61046927SAndroid Build Coastguard Worker {
42*61046927SAndroid Build Coastguard Worker assert(reg >= SI_CONFIG_REG_OFFSET && reg < SI_CONFIG_REG_END);
43*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, num, 0, SI_CONFIG_REG_OFFSET, PKT3_SET_CONFIG_REG, false);
44*61046927SAndroid Build Coastguard Worker }
45*61046927SAndroid Build Coastguard Worker
46*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_config_reg(struct radeon_cmdbuf * cs,unsigned reg,unsigned value)47*61046927SAndroid Build Coastguard Worker radeon_set_config_reg(struct radeon_cmdbuf *cs, unsigned reg, unsigned value)
48*61046927SAndroid Build Coastguard Worker {
49*61046927SAndroid Build Coastguard Worker radeon_set_config_reg_seq(cs, reg, 1);
50*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
51*61046927SAndroid Build Coastguard Worker }
52*61046927SAndroid Build Coastguard Worker
53*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_context_reg_seq(struct radeon_cmdbuf * cs,unsigned reg,unsigned num)54*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_seq(struct radeon_cmdbuf *cs, unsigned reg, unsigned num)
55*61046927SAndroid Build Coastguard Worker {
56*61046927SAndroid Build Coastguard Worker assert(reg >= SI_CONTEXT_REG_OFFSET && reg < SI_CONTEXT_REG_END);
57*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, num, 0, SI_CONTEXT_REG_OFFSET, PKT3_SET_CONTEXT_REG, false);
58*61046927SAndroid Build Coastguard Worker }
59*61046927SAndroid Build Coastguard Worker
60*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_context_reg(struct radeon_cmdbuf * cs,unsigned reg,unsigned value)61*61046927SAndroid Build Coastguard Worker radeon_set_context_reg(struct radeon_cmdbuf *cs, unsigned reg, unsigned value)
62*61046927SAndroid Build Coastguard Worker {
63*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_seq(cs, reg, 1);
64*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
65*61046927SAndroid Build Coastguard Worker }
66*61046927SAndroid Build Coastguard Worker
67*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_context_reg_idx(struct radeon_cmdbuf * cs,unsigned reg,unsigned idx,unsigned value)68*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_idx(struct radeon_cmdbuf *cs, unsigned reg, unsigned idx, unsigned value)
69*61046927SAndroid Build Coastguard Worker {
70*61046927SAndroid Build Coastguard Worker assert(reg >= SI_CONTEXT_REG_OFFSET && reg < SI_CONTEXT_REG_END);
71*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, 1, idx, SI_CONTEXT_REG_OFFSET, PKT3_SET_CONTEXT_REG, false);
72*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
73*61046927SAndroid Build Coastguard Worker }
74*61046927SAndroid Build Coastguard Worker
75*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_sh_reg_seq(struct radeon_cmdbuf * cs,unsigned reg,unsigned num)76*61046927SAndroid Build Coastguard Worker radeon_set_sh_reg_seq(struct radeon_cmdbuf *cs, unsigned reg, unsigned num)
77*61046927SAndroid Build Coastguard Worker {
78*61046927SAndroid Build Coastguard Worker assert(reg >= SI_SH_REG_OFFSET && reg < SI_SH_REG_END);
79*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, num, 0, SI_SH_REG_OFFSET, PKT3_SET_SH_REG, false);
80*61046927SAndroid Build Coastguard Worker }
81*61046927SAndroid Build Coastguard Worker
82*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_sh_reg(struct radeon_cmdbuf * cs,unsigned reg,unsigned value)83*61046927SAndroid Build Coastguard Worker radeon_set_sh_reg(struct radeon_cmdbuf *cs, unsigned reg, unsigned value)
84*61046927SAndroid Build Coastguard Worker {
85*61046927SAndroid Build Coastguard Worker radeon_set_sh_reg_seq(cs, reg, 1);
86*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
87*61046927SAndroid Build Coastguard Worker }
88*61046927SAndroid Build Coastguard Worker
89*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_sh_reg_idx(const struct radeon_info * info,struct radeon_cmdbuf * cs,unsigned reg,unsigned idx,unsigned value)90*61046927SAndroid Build Coastguard Worker radeon_set_sh_reg_idx(const struct radeon_info *info, struct radeon_cmdbuf *cs, unsigned reg, unsigned idx,
91*61046927SAndroid Build Coastguard Worker unsigned value)
92*61046927SAndroid Build Coastguard Worker {
93*61046927SAndroid Build Coastguard Worker assert(reg >= SI_SH_REG_OFFSET && reg < SI_SH_REG_END);
94*61046927SAndroid Build Coastguard Worker assert(idx);
95*61046927SAndroid Build Coastguard Worker
96*61046927SAndroid Build Coastguard Worker unsigned opcode = PKT3_SET_SH_REG_INDEX;
97*61046927SAndroid Build Coastguard Worker if (info->gfx_level < GFX10)
98*61046927SAndroid Build Coastguard Worker opcode = PKT3_SET_SH_REG;
99*61046927SAndroid Build Coastguard Worker
100*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, 1, idx, SI_SH_REG_OFFSET, opcode, false);
101*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
102*61046927SAndroid Build Coastguard Worker }
103*61046927SAndroid Build Coastguard Worker
104*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_uconfig_reg_seq(struct radeon_cmdbuf * cs,unsigned reg,unsigned num)105*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_reg_seq(struct radeon_cmdbuf *cs, unsigned reg, unsigned num)
106*61046927SAndroid Build Coastguard Worker {
107*61046927SAndroid Build Coastguard Worker assert(reg >= CIK_UCONFIG_REG_OFFSET && reg < CIK_UCONFIG_REG_END);
108*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, num, 0, CIK_UCONFIG_REG_OFFSET, PKT3_SET_UCONFIG_REG, false);
109*61046927SAndroid Build Coastguard Worker }
110*61046927SAndroid Build Coastguard Worker
111*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_uconfig_perfctr_reg_seq(enum amd_gfx_level gfx_level,enum radv_queue_family qf,struct radeon_cmdbuf * cs,unsigned reg,unsigned num)112*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_perfctr_reg_seq(enum amd_gfx_level gfx_level, enum radv_queue_family qf, struct radeon_cmdbuf *cs,
113*61046927SAndroid Build Coastguard Worker unsigned reg, unsigned num)
114*61046927SAndroid Build Coastguard Worker {
115*61046927SAndroid Build Coastguard Worker /*
116*61046927SAndroid Build Coastguard Worker * On GFX10, there is a bug with the ME implementation of its content addressable memory (CAM),
117*61046927SAndroid Build Coastguard Worker * that means that it can skip register writes due to not taking correctly into account the
118*61046927SAndroid Build Coastguard Worker * fields from the GRBM_GFX_INDEX. With this bit we can force the write.
119*61046927SAndroid Build Coastguard Worker */
120*61046927SAndroid Build Coastguard Worker const bool filter_cam_workaround = gfx_level >= GFX10 && qf == RADV_QUEUE_GENERAL;
121*61046927SAndroid Build Coastguard Worker
122*61046927SAndroid Build Coastguard Worker assert(reg >= CIK_UCONFIG_REG_OFFSET && reg < CIK_UCONFIG_REG_END);
123*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, num, 0, CIK_UCONFIG_REG_OFFSET, PKT3_SET_UCONFIG_REG, filter_cam_workaround);
124*61046927SAndroid Build Coastguard Worker }
125*61046927SAndroid Build Coastguard Worker
126*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_uconfig_perfctr_reg(enum amd_gfx_level gfx_level,enum radv_queue_family qf,struct radeon_cmdbuf * cs,unsigned reg,unsigned value)127*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_perfctr_reg(enum amd_gfx_level gfx_level, enum radv_queue_family qf, struct radeon_cmdbuf *cs,
128*61046927SAndroid Build Coastguard Worker unsigned reg, unsigned value)
129*61046927SAndroid Build Coastguard Worker {
130*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_perfctr_reg_seq(gfx_level, qf, cs, reg, 1);
131*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
132*61046927SAndroid Build Coastguard Worker }
133*61046927SAndroid Build Coastguard Worker
134*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_uconfig_reg(struct radeon_cmdbuf * cs,unsigned reg,unsigned value)135*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_reg(struct radeon_cmdbuf *cs, unsigned reg, unsigned value)
136*61046927SAndroid Build Coastguard Worker {
137*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_reg_seq(cs, reg, 1);
138*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
139*61046927SAndroid Build Coastguard Worker }
140*61046927SAndroid Build Coastguard Worker
141*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_uconfig_reg_idx(const struct radeon_info * info,struct radeon_cmdbuf * cs,unsigned reg,unsigned idx,unsigned value)142*61046927SAndroid Build Coastguard Worker radeon_set_uconfig_reg_idx(const struct radeon_info *info, struct radeon_cmdbuf *cs, unsigned reg, unsigned idx,
143*61046927SAndroid Build Coastguard Worker unsigned value)
144*61046927SAndroid Build Coastguard Worker {
145*61046927SAndroid Build Coastguard Worker assert(reg >= CIK_UCONFIG_REG_OFFSET && reg < CIK_UCONFIG_REG_END);
146*61046927SAndroid Build Coastguard Worker assert(idx);
147*61046927SAndroid Build Coastguard Worker
148*61046927SAndroid Build Coastguard Worker unsigned opcode = PKT3_SET_UCONFIG_REG_INDEX;
149*61046927SAndroid Build Coastguard Worker if (info->gfx_level < GFX9 || (info->gfx_level == GFX9 && info->me_fw_version < 26))
150*61046927SAndroid Build Coastguard Worker opcode = PKT3_SET_UCONFIG_REG;
151*61046927SAndroid Build Coastguard Worker
152*61046927SAndroid Build Coastguard Worker radeon_set_reg_seq(cs, reg, 1, idx, CIK_UCONFIG_REG_OFFSET, opcode, false);
153*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
154*61046927SAndroid Build Coastguard Worker }
155*61046927SAndroid Build Coastguard Worker
156*61046927SAndroid Build Coastguard Worker static inline void
radeon_set_privileged_config_reg(struct radeon_cmdbuf * cs,unsigned reg,unsigned value)157*61046927SAndroid Build Coastguard Worker radeon_set_privileged_config_reg(struct radeon_cmdbuf *cs, unsigned reg, unsigned value)
158*61046927SAndroid Build Coastguard Worker {
159*61046927SAndroid Build Coastguard Worker assert(reg < CIK_UCONFIG_REG_OFFSET);
160*61046927SAndroid Build Coastguard Worker assert(cs->cdw + 6 <= cs->reserved_dw);
161*61046927SAndroid Build Coastguard Worker
162*61046927SAndroid Build Coastguard Worker radeon_emit(cs, PKT3(PKT3_COPY_DATA, 4, 0));
163*61046927SAndroid Build Coastguard Worker radeon_emit(cs, COPY_DATA_SRC_SEL(COPY_DATA_IMM) | COPY_DATA_DST_SEL(COPY_DATA_PERF));
164*61046927SAndroid Build Coastguard Worker radeon_emit(cs, value);
165*61046927SAndroid Build Coastguard Worker radeon_emit(cs, 0); /* unused */
166*61046927SAndroid Build Coastguard Worker radeon_emit(cs, reg >> 2);
167*61046927SAndroid Build Coastguard Worker radeon_emit(cs, 0); /* unused */
168*61046927SAndroid Build Coastguard Worker }
169*61046927SAndroid Build Coastguard Worker
170*61046927SAndroid Build Coastguard Worker #define radeon_opt_set_context_reg(cmdbuf, reg, reg_enum, value) \
171*61046927SAndroid Build Coastguard Worker do { \
172*61046927SAndroid Build Coastguard Worker struct radv_cmd_buffer *__cmdbuf = (cmdbuf); \
173*61046927SAndroid Build Coastguard Worker struct radv_tracked_regs *__tracked_regs = &__cmdbuf->tracked_regs; \
174*61046927SAndroid Build Coastguard Worker const uint32_t __value = (value); \
175*61046927SAndroid Build Coastguard Worker if (!BITSET_TEST(__tracked_regs->reg_saved_mask, (reg_enum)) || \
176*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] != __value) { \
177*61046927SAndroid Build Coastguard Worker radeon_set_context_reg(__cmdbuf->cs, reg, __value); \
178*61046927SAndroid Build Coastguard Worker BITSET_SET(__tracked_regs->reg_saved_mask, (reg_enum)); \
179*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] = __value; \
180*61046927SAndroid Build Coastguard Worker __cmdbuf->state.context_roll_without_scissor_emitted = true; \
181*61046927SAndroid Build Coastguard Worker } \
182*61046927SAndroid Build Coastguard Worker } while (0)
183*61046927SAndroid Build Coastguard Worker
184*61046927SAndroid Build Coastguard Worker #define radeon_opt_set_context_reg2(cmdbuf, reg, reg_enum, v1, v2) \
185*61046927SAndroid Build Coastguard Worker do { \
186*61046927SAndroid Build Coastguard Worker struct radv_cmd_buffer *__cmdbuf = (cmdbuf); \
187*61046927SAndroid Build Coastguard Worker struct radv_tracked_regs *__tracked_regs = &__cmdbuf->tracked_regs; \
188*61046927SAndroid Build Coastguard Worker const uint32_t __v1 = (v1), __v2 = (v2); \
189*61046927SAndroid Build Coastguard Worker if (!BITSET_TEST_RANGE_INSIDE_WORD(__tracked_regs->reg_saved_mask, (reg_enum), (reg_enum) + 1, 0x3) || \
190*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] != __v1 || __tracked_regs->reg_value[(reg_enum) + 1] != __v2) { \
191*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_seq(cmdbuf->cs, reg, 2); \
192*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v1); \
193*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v2); \
194*61046927SAndroid Build Coastguard Worker BITSET_SET_RANGE_INSIDE_WORD(__tracked_regs->reg_saved_mask, (reg_enum), (reg_enum) + 1); \
195*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] = __v1; \
196*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 1] = __v2; \
197*61046927SAndroid Build Coastguard Worker cmdbuf->state.context_roll_without_scissor_emitted = true; \
198*61046927SAndroid Build Coastguard Worker } \
199*61046927SAndroid Build Coastguard Worker } while (0)
200*61046927SAndroid Build Coastguard Worker
201*61046927SAndroid Build Coastguard Worker #define radeon_opt_set_context_reg3(cmdbuf, reg, reg_enum, v1, v2, v3) \
202*61046927SAndroid Build Coastguard Worker do { \
203*61046927SAndroid Build Coastguard Worker struct radv_cmd_buffer *__cmdbuf = (cmdbuf); \
204*61046927SAndroid Build Coastguard Worker struct radv_tracked_regs *__tracked_regs = &__cmdbuf->tracked_regs; \
205*61046927SAndroid Build Coastguard Worker const uint32_t __v1 = (v1), __v2 = (v2), __v3 = (v3); \
206*61046927SAndroid Build Coastguard Worker if (!BITSET_TEST_RANGE_INSIDE_WORD(__tracked_regs->reg_saved_mask, (reg_enum), (reg_enum) + 2, 0x7) || \
207*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] != __v1 || __tracked_regs->reg_value[(reg_enum) + 1] != __v2 || \
208*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 2] != __v3) { \
209*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_seq(cmdbuf->cs, reg, 3); \
210*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v1); \
211*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v2); \
212*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v3); \
213*61046927SAndroid Build Coastguard Worker BITSET_SET_RANGE_INSIDE_WORD(__tracked_regs->reg_saved_mask, (reg_enum), (reg_enum) + 2); \
214*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] = __v1; \
215*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 1] = __v2; \
216*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 2] = __v3; \
217*61046927SAndroid Build Coastguard Worker cmdbuf->state.context_roll_without_scissor_emitted = true; \
218*61046927SAndroid Build Coastguard Worker } \
219*61046927SAndroid Build Coastguard Worker } while (0)
220*61046927SAndroid Build Coastguard Worker
221*61046927SAndroid Build Coastguard Worker #define radeon_opt_set_context_reg4(cmdbuf, reg, reg_enum, v1, v2, v3, v4) \
222*61046927SAndroid Build Coastguard Worker do { \
223*61046927SAndroid Build Coastguard Worker struct radv_cmd_buffer *__cmdbuf = (cmdbuf); \
224*61046927SAndroid Build Coastguard Worker struct radv_tracked_regs *__tracked_regs = &__cmdbuf->tracked_regs; \
225*61046927SAndroid Build Coastguard Worker const uint32_t __v1 = (v1), __v2 = (v2), __v3 = (v3), __v4 = (v4); \
226*61046927SAndroid Build Coastguard Worker if (!BITSET_TEST_RANGE_INSIDE_WORD(__tracked_regs->reg_saved_mask, (reg_enum), (reg_enum) + 3, 0xf) || \
227*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] != __v1 || __tracked_regs->reg_value[(reg_enum) + 1] != __v2 || \
228*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 2] != __v3 || __tracked_regs->reg_value[(reg_enum) + 3] != __v4) { \
229*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_seq(cmdbuf->cs, reg, 4); \
230*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v1); \
231*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v2); \
232*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v3); \
233*61046927SAndroid Build Coastguard Worker radeon_emit(cmdbuf->cs, __v4); \
234*61046927SAndroid Build Coastguard Worker BITSET_SET_RANGE_INSIDE_WORD(__tracked_regs->reg_saved_mask, (reg_enum), (reg_enum) + 3); \
235*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum)] = __v1; \
236*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 1] = __v2; \
237*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 2] = __v3; \
238*61046927SAndroid Build Coastguard Worker __tracked_regs->reg_value[(reg_enum) + 3] = __v4; \
239*61046927SAndroid Build Coastguard Worker cmdbuf->state.context_roll_without_scissor_emitted = true; \
240*61046927SAndroid Build Coastguard Worker } \
241*61046927SAndroid Build Coastguard Worker } while (0)
242*61046927SAndroid Build Coastguard Worker
243*61046927SAndroid Build Coastguard Worker #define radeon_opt_set_context_regn(cmdbuf, reg, values, saved_values, num) \
244*61046927SAndroid Build Coastguard Worker do { \
245*61046927SAndroid Build Coastguard Worker struct radv_cmd_buffer *__cmdbuf = (cmdbuf); \
246*61046927SAndroid Build Coastguard Worker if (memcmp(values, saved_values, sizeof(uint32_t) * (num))) { \
247*61046927SAndroid Build Coastguard Worker radeon_set_context_reg_seq(cmdbuf->cs, reg, num); \
248*61046927SAndroid Build Coastguard Worker radeon_emit_array(cmdbuf->cs, values, num); \
249*61046927SAndroid Build Coastguard Worker memcpy(saved_values, values, sizeof(uint32_t) * (num)); \
250*61046927SAndroid Build Coastguard Worker __cmdbuf->state.context_roll_without_scissor_emitted = true; \
251*61046927SAndroid Build Coastguard Worker } \
252*61046927SAndroid Build Coastguard Worker } while (0)
253*61046927SAndroid Build Coastguard Worker
254*61046927SAndroid Build Coastguard Worker ALWAYS_INLINE static void
radv_cp_wait_mem(struct radeon_cmdbuf * cs,const enum radv_queue_family qf,const uint32_t op,const uint64_t va,const uint32_t ref,const uint32_t mask)255*61046927SAndroid Build Coastguard Worker radv_cp_wait_mem(struct radeon_cmdbuf *cs, const enum radv_queue_family qf, const uint32_t op, const uint64_t va,
256*61046927SAndroid Build Coastguard Worker const uint32_t ref, const uint32_t mask)
257*61046927SAndroid Build Coastguard Worker {
258*61046927SAndroid Build Coastguard Worker assert(op == WAIT_REG_MEM_EQUAL || op == WAIT_REG_MEM_NOT_EQUAL || op == WAIT_REG_MEM_GREATER_OR_EQUAL);
259*61046927SAndroid Build Coastguard Worker
260*61046927SAndroid Build Coastguard Worker if (qf == RADV_QUEUE_GENERAL || qf == RADV_QUEUE_COMPUTE) {
261*61046927SAndroid Build Coastguard Worker radeon_emit(cs, PKT3(PKT3_WAIT_REG_MEM, 5, false));
262*61046927SAndroid Build Coastguard Worker radeon_emit(cs, op | WAIT_REG_MEM_MEM_SPACE(1));
263*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va);
264*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va >> 32);
265*61046927SAndroid Build Coastguard Worker radeon_emit(cs, ref); /* reference value */
266*61046927SAndroid Build Coastguard Worker radeon_emit(cs, mask); /* mask */
267*61046927SAndroid Build Coastguard Worker radeon_emit(cs, 4); /* poll interval */
268*61046927SAndroid Build Coastguard Worker } else if (qf == RADV_QUEUE_TRANSFER) {
269*61046927SAndroid Build Coastguard Worker radeon_emit(cs, SDMA_PACKET(SDMA_OPCODE_POLL_REGMEM, 0, 0) | op << 28 | SDMA_POLL_MEM);
270*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va);
271*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va >> 32);
272*61046927SAndroid Build Coastguard Worker radeon_emit(cs, ref);
273*61046927SAndroid Build Coastguard Worker radeon_emit(cs, mask);
274*61046927SAndroid Build Coastguard Worker radeon_emit(cs, SDMA_POLL_INTERVAL_160_CLK | SDMA_POLL_RETRY_INDEFINITELY << 16);
275*61046927SAndroid Build Coastguard Worker } else {
276*61046927SAndroid Build Coastguard Worker unreachable("unsupported queue family");
277*61046927SAndroid Build Coastguard Worker }
278*61046927SAndroid Build Coastguard Worker }
279*61046927SAndroid Build Coastguard Worker
280*61046927SAndroid Build Coastguard Worker ALWAYS_INLINE static unsigned
radv_cs_write_data_head(const struct radv_device * device,struct radeon_cmdbuf * cs,const enum radv_queue_family qf,const unsigned engine_sel,const uint64_t va,const unsigned count,const bool predicating)281*61046927SAndroid Build Coastguard Worker radv_cs_write_data_head(const struct radv_device *device, struct radeon_cmdbuf *cs, const enum radv_queue_family qf,
282*61046927SAndroid Build Coastguard Worker const unsigned engine_sel, const uint64_t va, const unsigned count, const bool predicating)
283*61046927SAndroid Build Coastguard Worker {
284*61046927SAndroid Build Coastguard Worker /* Return the correct cdw at the end of the packet so the caller can assert it. */
285*61046927SAndroid Build Coastguard Worker const unsigned cdw_end = radeon_check_space(device->ws, cs, 4 + count);
286*61046927SAndroid Build Coastguard Worker
287*61046927SAndroid Build Coastguard Worker if (qf == RADV_QUEUE_GENERAL || qf == RADV_QUEUE_COMPUTE) {
288*61046927SAndroid Build Coastguard Worker radeon_emit(cs, PKT3(PKT3_WRITE_DATA, 2 + count, predicating));
289*61046927SAndroid Build Coastguard Worker radeon_emit(cs, S_370_DST_SEL(V_370_MEM) | S_370_WR_CONFIRM(1) | S_370_ENGINE_SEL(engine_sel));
290*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va);
291*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va >> 32);
292*61046927SAndroid Build Coastguard Worker } else if (qf == RADV_QUEUE_TRANSFER) {
293*61046927SAndroid Build Coastguard Worker /* Vulkan transfer queues don't support conditional rendering, so we can ignore predication here.
294*61046927SAndroid Build Coastguard Worker * Furthermore, we can ignore the engine selection here, it is meaningless to the SDMA.
295*61046927SAndroid Build Coastguard Worker */
296*61046927SAndroid Build Coastguard Worker radeon_emit(cs, SDMA_PACKET(SDMA_OPCODE_WRITE, SDMA_WRITE_SUB_OPCODE_LINEAR, 0));
297*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va);
298*61046927SAndroid Build Coastguard Worker radeon_emit(cs, va >> 32);
299*61046927SAndroid Build Coastguard Worker radeon_emit(cs, count - 1);
300*61046927SAndroid Build Coastguard Worker } else {
301*61046927SAndroid Build Coastguard Worker unreachable("unsupported queue family");
302*61046927SAndroid Build Coastguard Worker }
303*61046927SAndroid Build Coastguard Worker
304*61046927SAndroid Build Coastguard Worker return cdw_end;
305*61046927SAndroid Build Coastguard Worker }
306*61046927SAndroid Build Coastguard Worker
307*61046927SAndroid Build Coastguard Worker ALWAYS_INLINE static void
radv_cs_write_data(const struct radv_device * device,struct radeon_cmdbuf * cs,const enum radv_queue_family qf,const unsigned engine_sel,const uint64_t va,const unsigned count,const uint32_t * dwords,const bool predicating)308*61046927SAndroid Build Coastguard Worker radv_cs_write_data(const struct radv_device *device, struct radeon_cmdbuf *cs, const enum radv_queue_family qf,
309*61046927SAndroid Build Coastguard Worker const unsigned engine_sel, const uint64_t va, const unsigned count, const uint32_t *dwords,
310*61046927SAndroid Build Coastguard Worker const bool predicating)
311*61046927SAndroid Build Coastguard Worker {
312*61046927SAndroid Build Coastguard Worker ASSERTED const unsigned cdw_end = radv_cs_write_data_head(device, cs, qf, engine_sel, va, count, predicating);
313*61046927SAndroid Build Coastguard Worker radeon_emit_array(cs, dwords, count);
314*61046927SAndroid Build Coastguard Worker assert(cs->cdw == cdw_end);
315*61046927SAndroid Build Coastguard Worker }
316*61046927SAndroid Build Coastguard Worker
317*61046927SAndroid Build Coastguard Worker void radv_cs_emit_write_event_eop(struct radeon_cmdbuf *cs, enum amd_gfx_level gfx_level, enum radv_queue_family qf,
318*61046927SAndroid Build Coastguard Worker unsigned event, unsigned event_flags, unsigned dst_sel, unsigned data_sel,
319*61046927SAndroid Build Coastguard Worker uint64_t va, uint32_t new_fence, uint64_t gfx9_eop_bug_va);
320*61046927SAndroid Build Coastguard Worker
321*61046927SAndroid Build Coastguard Worker void radv_cs_emit_cache_flush(struct radeon_winsys *ws, struct radeon_cmdbuf *cs, enum amd_gfx_level gfx_level,
322*61046927SAndroid Build Coastguard Worker uint32_t *flush_cnt, uint64_t flush_va, enum radv_queue_family qf,
323*61046927SAndroid Build Coastguard Worker enum radv_cmd_flush_bits flush_bits, enum rgp_flush_bits *sqtt_flush_bits,
324*61046927SAndroid Build Coastguard Worker uint64_t gfx9_eop_bug_va);
325*61046927SAndroid Build Coastguard Worker
326*61046927SAndroid Build Coastguard Worker void radv_emit_cond_exec(const struct radv_device *device, struct radeon_cmdbuf *cs, uint64_t va, uint32_t count);
327*61046927SAndroid Build Coastguard Worker
328*61046927SAndroid Build Coastguard Worker void radv_cs_write_data_imm(struct radeon_cmdbuf *cs, unsigned engine_sel, uint64_t va, uint32_t imm);
329*61046927SAndroid Build Coastguard Worker
330*61046927SAndroid Build Coastguard Worker #endif /* RADV_CS_H */
331