xref: /aosp_15_r20/external/mesa3d/src/intel/compiler/elk/elk_shader.h (revision 6104692788411f58d303aa86923a9ff6ecaded22)
1 /*
2  * Copyright © 2010 Intel Corporation
3  *
4  * Permission is hereby granted, free of charge, to any person obtaining a
5  * copy of this software and associated documentation files (the "Software"),
6  * to deal in the Software without restriction, including without limitation
7  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8  * and/or sell copies of the Software, and to permit persons to whom the
9  * Software is furnished to do so, subject to the following conditions:
10  *
11  * The above copyright notice and this permission notice (including the next
12  * paragraph) shall be included in all copies or substantial portions of the
13  * Software.
14  *
15  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
18  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
21  * IN THE SOFTWARE.
22  */
23 
24 #ifndef ELK_SHADER_H
25 #define ELK_SHADER_H
26 
27 #include <stdint.h>
28 #include "elk_cfg.h"
29 #include "elk_compiler.h"
30 #include "compiler/nir/nir.h"
31 
32 #ifdef __cplusplus
33 #include "elk_ir_analysis.h"
34 #include "elk_ir_allocator.h"
35 
/*
 * Modes that can be requested from the instruction scheduler.
 *
 * NOTE(review): the precise meaning of each mode is defined by the
 * scheduler implementation, which is not visible in this header.  The
 * PRE and POST names presumably refer to scheduling before / after register
 * allocation, and SCHEDULE_NONE to skipping scheduling -- confirm.
 */
36 enum instruction_scheduler_mode {
37    SCHEDULE_PRE,
38    SCHEDULE_PRE_NON_LIFO,
39    SCHEDULE_PRE_LIFO,
40    SCHEDULE_POST,
41    SCHEDULE_NONE,
42 };
43 
/*
 * Evaluates to 65532 (0xFFFC), i.e. four below 1 << 16.
 *
 * NOTE(review): the users of this constant are not visible in this header;
 * presumably it is the first index of a range reserved for UBOs -- confirm.
 */
44 #define UBO_START ((1 << 16) - 4)
45 
/**
 * Common state shared by the backend shader compilers (C++ only).
 *
 * The type is abstract: dump_instruction_to_file() is pure virtual and the
 * constructor is protected, so it can only be instantiated through a derived
 * class.
 */
46 struct elk_backend_shader {
47 protected:
48 
      /* Protected so that only derived classes can construct the base. */
49    elk_backend_shader(const struct elk_compiler *compiler,
50                   const struct elk_compile_params *params,
51                   const nir_shader *shader,
52                   struct elk_stage_prog_data *stage_prog_data,
53                   bool debug_enabled);
54 
55 public:
      /* Virtual so derived objects can be destroyed through a base pointer. */
56    virtual ~elk_backend_shader();
57 
58    const struct elk_compiler *compiler;
59    void *log_data; /* Passed to compiler->*_log functions */
60 
      /* devinfo and stage_prog_data are const pointers: they cannot be
       * reseated after construction.
       */
61    const struct intel_device_info * const devinfo;
62    const nir_shader *nir;
63    struct elk_stage_prog_data * const stage_prog_data;
64 
65    /** ralloc context for temporary data used during compile */
66    void *mem_ctx;
67 
68    /**
69     * List of either elk_fs_inst or vec4_instruction (inheriting from
70     * elk_backend_instruction)
71     */
72    exec_list instructions;
73 
      /* NOTE(review): cfg is presumably built by calculate_cfg() and
       * idom_analysis presumably caches the immediate-dominator tree of that
       * CFG -- confirm against the implementation.
       */
74    elk_cfg_t *cfg;
75    elk_analysis<elk::idom_tree, elk_backend_shader> idom_analysis;
76 
77    gl_shader_stage stage;
78    bool debug_enabled;
79 
80    elk::simple_allocator alloc;
81 
      /* Dump hooks: the per-instruction one must be provided by the derived
       * class (pure virtual); the whole-program one may be overridden.
       */
82    virtual void dump_instruction_to_file(const elk_backend_instruction *inst, FILE *file) const = 0;
83    virtual void dump_instructions_to_file(FILE *file) const;
84 
85    /* Convenience functions based on the above. */
      /* Forwards to dump_instruction_to_file(); writes to stderr by default. */
86    void dump_instruction(const elk_backend_instruction *inst, FILE *file = stderr) const {
87       dump_instruction_to_file(inst, file);
88    }
      /* NOTE(review): `name` is presumably an output file name, with nullptr
       * selecting a default destination -- confirm in the definition.
       */
89    void dump_instructions(const char *name = nullptr) const;
90 
91    void calculate_cfg();
92 
      /* Virtual so derived classes can extend which analyses get invalidated
       * for dependency class `c`.
       */
93    virtual void invalidate_analysis(elk::analysis_dependency_class c);
94 };
95 
96 #else
97 struct elk_backend_shader;
98 #endif /* __cplusplus */
99 
/*
 * Backend helpers declared for both C and C++ includers; their definitions
 * are not part of this header.
 *
 * NOTE(review): these prototypes sit before the extern "C" block opened
 * further down, so C++ translation units see them with C++ linkage --
 * presumably intentional because they are defined in C++ sources; confirm.
 *
 * NOTE(review): the three *_immediate() helpers take the register by
 * pointer and return bool; presumably they rewrite the immediate in place
 * and report whether the operation was applied -- confirm.
 */
100 enum elk_reg_type elk_type_for_base_type(const struct glsl_type *type);
101 uint32_t elk_math_function(enum elk_opcode op);
102 const char *elk_instruction_name(const struct elk_isa_info *isa,
103                                  enum elk_opcode op);
104 bool elk_saturate_immediate(enum elk_reg_type type, struct elk_reg *reg);
105 bool elk_negate_immediate(enum elk_reg_type type, struct elk_reg *reg);
106 bool elk_abs_immediate(enum elk_reg_type type, struct elk_reg *reg);
107 
108 bool elk_opt_predicated_break(struct elk_backend_shader *s);
109 
110 #ifdef __cplusplus
111 extern "C" {
112 #endif
113 
/* Declarations grouped by the source file that defines them. */
114 /* elk_fs_reg_allocate.cpp */
115 void elk_fs_alloc_reg_sets(struct elk_compiler *compiler);
116 
117 /* elk_vec4_reg_allocate.cpp */
118 void elk_vec4_alloc_reg_set(struct elk_compiler *compiler);
119 
120 /* elk_disasm.c */
    /* Two read-only tables of 16 C strings each.
     * NOTE(review): presumably indexed by the hardware encoding of the
     * conditional modifier / Align16 predicate control -- confirm.
     */
121 extern const char *const elk_conditional_modifier[16];
122 extern const char *const elk_pred_ctrl_align16[16];
123 
124 /* Per-thread scratch space is a power-of-two multiple of 1KB.
     *
     * Returns the larger of 1024 and util_next_power_of_two(size), so the
     * result is never below 1024.
     *
     * NOTE(review): `size` is a signed int and is not range-checked here;
     * callers are presumably expected to pass a non-negative size -- confirm.
     */
125 static inline unsigned
126 elk_get_scratch_size(int size)
127 {
128    return MAX2(1024, util_next_power_of_two(size));
129 }
130 
131 
/**
 * Compute the set of NIR variable modes that cannot take indirect access
 * for \p stage on \p compiler's device.
 *
 * The mask is assembled as follows:
 *  - nir_var_shader_in for vertex and fragment stages, and for geometry
 *    stages that are not compiled as scalar;
 *  - nir_var_shader_out for every scalar stage except tessellation control;
 *  - nir_var_function_temp for scalar stages when devinfo->verx10 <= 70.
 *
 * \param compiler  supplies devinfo and the per-stage scalar_stage[] flags.
 * \param stage     shader stage; also used to index compiler->scalar_stage.
 * \return the accumulated nir_variable_mode bitmask (0 when nothing applies).
 *
 * NOTE(review): how callers consume the mask (presumably to lower indirect
 * derefs on these modes) is not visible in this header -- confirm.
 */
132 static inline nir_variable_mode
133 elk_nir_no_indirect_mask(const struct elk_compiler *compiler,
134                          gl_shader_stage stage)
135 {
136    const struct intel_device_info *devinfo = compiler->devinfo;
137    const bool is_scalar = compiler->scalar_stage[stage];
138    nir_variable_mode indirect_mask = (nir_variable_mode) 0;
139 
140    switch (stage) {
141    case MESA_SHADER_VERTEX:
142    case MESA_SHADER_FRAGMENT:
143       indirect_mask |= nir_var_shader_in;
144       break;
145 
146    case MESA_SHADER_GEOMETRY:
147       if (!is_scalar)
148          indirect_mask |= nir_var_shader_in;
149       break;
150 
151    default:
152       /* Everything else can handle indirect inputs */
153       break;
154    }
155 
156    if (is_scalar && stage != MESA_SHADER_TESS_CTRL)
157       indirect_mask |= nir_var_shader_out;
158 
159    /* On HSW+, we allow indirects in scalar shaders.  They get implemented
160     * using nir_lower_vars_to_explicit_types and nir_lower_explicit_io in
161     * elk_postprocess_nir.
162     *
163     * We haven't plumbed through the indirect scratch messages on gfx6 or
164     * earlier so doing indirects via scratch doesn't work there. On gfx7 and
165     * earlier the scratch space size is limited to 12kB.  If we allowed
166     * indirects as scratch all the time, we may easily exceed this limit
167     * without having any fallback.
168     */
169    if (is_scalar && devinfo->verx10 <= 70)
170       indirect_mask |= nir_var_function_temp;
171 
172    return indirect_mask;
173 }
174 
/*
 * Declared here, defined elsewhere.  Takes a texture instruction, the index
 * of one of its sources, and an out-pointer for a 32-bit result.
 *
 * NOTE(review): presumably packs a constant texel offset found in source
 * `src` into *offset_bits and returns whether that succeeded -- confirm
 * against the definition.
 */
174 bool elk_texture_offset(const nir_tex_instr *tex, unsigned src,
175                         uint32_t *offset_bits);
177 
178 /**
179  * Scratch data used when compiling a GLSL geometry shader.
180  */
181 struct elk_gs_compile
182 {
183    struct elk_gs_prog_key key;
184    struct intel_vue_map input_vue_map;
185 
186    unsigned control_data_bits_per_vertex;
187    unsigned control_data_header_size_bits;
188 };
189 
190 #ifdef __cplusplus
191 }
192 #endif
193 
194 #endif /* ELK_SHADER_H */
195