/*
 * Copyright © 2010 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 */
23
24 #ifndef ELK_SHADER_H
25 #define ELK_SHADER_H
26
27 #include <stdint.h>
28 #include "elk_cfg.h"
29 #include "elk_compiler.h"
30 #include "compiler/nir/nir.h"
31
32 #ifdef __cplusplus
33 #include "elk_ir_analysis.h"
34 #include "elk_ir_allocator.h"
35
/**
 * Modes the instruction scheduler can be asked to run in.
 *
 * The enumerators carry no explicit values, so they are numbered 0..4 in
 * declaration order.
 *
 * NOTE(review): PRE/POST presumably mean before/after register allocation,
 * and the *_LIFO variants presumably select alternative pre-pass heuristics;
 * confirm against the scheduler implementation.
 */
enum instruction_scheduler_mode {
   SCHEDULE_PRE,
   SCHEDULE_PRE_NON_LIFO,
   SCHEDULE_PRE_LIFO,
   SCHEDULE_POST,
   SCHEDULE_NONE,
};
43
/* Evaluates to 65532 (0xFFFC), i.e. four below 1 << 16.
 * NOTE(review): presumably the first index of a range reserved for UBOs;
 * confirm at the use sites.
 */
#define UBO_START ((1 << 16) - 4)
45
46 struct elk_backend_shader {
47 protected:
48
49 elk_backend_shader(const struct elk_compiler *compiler,
50 const struct elk_compile_params *params,
51 const nir_shader *shader,
52 struct elk_stage_prog_data *stage_prog_data,
53 bool debug_enabled);
54
55 public:
56 virtual ~elk_backend_shader();
57
58 const struct elk_compiler *compiler;
59 void *log_data; /* Passed to compiler->*_log functions */
60
61 const struct intel_device_info * const devinfo;
62 const nir_shader *nir;
63 struct elk_stage_prog_data * const stage_prog_data;
64
65 /** ralloc context for temporary data used during compile */
66 void *mem_ctx;
67
68 /**
69 * List of either elk_fs_inst or vec4_instruction (inheriting from
70 * elk_backend_instruction)
71 */
72 exec_list instructions;
73
74 elk_cfg_t *cfg;
75 elk_analysis<elk::idom_tree, elk_backend_shader> idom_analysis;
76
77 gl_shader_stage stage;
78 bool debug_enabled;
79
80 elk::simple_allocator alloc;
81
82 virtual void dump_instruction_to_file(const elk_backend_instruction *inst, FILE *file) const = 0;
83 virtual void dump_instructions_to_file(FILE *file) const;
84
85 /* Convenience functions based on the above. */
86 void dump_instruction(const elk_backend_instruction *inst, FILE *file = stderr) const {
87 dump_instruction_to_file(inst, file);
88 }
89 void dump_instructions(const char *name = nullptr) const;
90
91 void calculate_cfg();
92
93 virtual void invalidate_analysis(elk::analysis_dependency_class c);
94 };
95
96 #else
97 struct elk_backend_shader;
98 #endif /* __cplusplus */
99
/* Free-function helpers.  Only the prototypes are visible in this header;
 * the definitions live elsewhere.
 */
enum elk_reg_type elk_type_for_base_type(const struct glsl_type *type);
uint32_t elk_math_function(enum elk_opcode op);
const char *elk_instruction_name(const struct elk_isa_info *isa,
                                 enum elk_opcode op);

/* Immediate helpers: each takes the register type and a non-const register.
 * NOTE(review): presumably each rewrites the immediate held in \p reg in
 * place and the bool result reports whether it did so; confirm against the
 * definitions.
 */
bool elk_saturate_immediate(enum elk_reg_type type, struct elk_reg *reg);
bool elk_negate_immediate(enum elk_reg_type type, struct elk_reg *reg);
bool elk_abs_immediate(enum elk_reg_type type, struct elk_reg *reg);

bool elk_opt_predicated_break(struct elk_backend_shader *s);
109
110 #ifdef __cplusplus
111 extern "C" {
112 #endif
113
/* elk_fs_reg_allocate.cpp */
void elk_fs_alloc_reg_sets(struct elk_compiler *compiler);

/* elk_vec4_reg_allocate.cpp */
void elk_vec4_alloc_reg_set(struct elk_compiler *compiler);

/* elk_disasm.c: 16-entry string tables, declared here and defined there. */
extern const char *const elk_conditional_modifier[16];
extern const char *const elk_pred_ctrl_align16[16];
123
/**
 * Round a requested per-thread scratch size up to an allocatable size.
 *
 * Per-thread scratch space is a power-of-two multiple of 1KB, so the result
 * is util_next_power_of_two(size) with a lower bound of 1024.
 *
 * \param size  requested scratch size
 * \return the larger of 1024 and the next power of two for \p size
 */
static inline unsigned
elk_get_scratch_size(int size)
{
   return MAX2(1024, util_next_power_of_two(size));
}
130
131
132 static inline nir_variable_mode
elk_nir_no_indirect_mask(const struct elk_compiler * compiler,gl_shader_stage stage)133 elk_nir_no_indirect_mask(const struct elk_compiler *compiler,
134 gl_shader_stage stage)
135 {
136 const struct intel_device_info *devinfo = compiler->devinfo;
137 const bool is_scalar = compiler->scalar_stage[stage];
138 nir_variable_mode indirect_mask = (nir_variable_mode) 0;
139
140 switch (stage) {
141 case MESA_SHADER_VERTEX:
142 case MESA_SHADER_FRAGMENT:
143 indirect_mask |= nir_var_shader_in;
144 break;
145
146 case MESA_SHADER_GEOMETRY:
147 if (!is_scalar)
148 indirect_mask |= nir_var_shader_in;
149 break;
150
151 default:
152 /* Everything else can handle indirect inputs */
153 break;
154 }
155
156 if (is_scalar && stage != MESA_SHADER_TESS_CTRL)
157 indirect_mask |= nir_var_shader_out;
158
159 /* On HSW+, we allow indirects in scalar shaders. They get implemented
160 * using nir_lower_vars_to_explicit_types and nir_lower_explicit_io in
161 * elk_postprocess_nir.
162 *
163 * We haven't plumbed through the indirect scratch messages on gfx6 or
164 * earlier so doing indirects via scratch doesn't work there. On gfx7 and
165 * earlier the scratch space size is limited to 12kB. If we allowed
166 * indirects as scratch all the time, we may easily exceed this limit
167 * without having any fallback.
168 */
169 if (is_scalar && devinfo->verx10 <= 70)
170 indirect_mask |= nir_var_function_temp;
171
172 return indirect_mask;
173 }
174
175 bool elk_texture_offset(const nir_tex_instr *tex, unsigned src,
176 uint32_t *offset_bits);
177
178 /**
179 * Scratch data used when compiling a GLSL geometry shader.
180 */
181 struct elk_gs_compile
182 {
183 struct elk_gs_prog_key key;
184 struct intel_vue_map input_vue_map;
185
186 unsigned control_data_bits_per_vertex;
187 unsigned control_data_header_size_bits;
188 };
189
190 #ifdef __cplusplus
191 }
192 #endif
193
194 #endif /* ELK_SHADER_H */
195