xref: /aosp_15_r20/external/mesa3d/src/compiler/spirv/vtn_amd.c (revision 6104692788411f58d303aa86923a9ff6ecaded22)
1*61046927SAndroid Build Coastguard Worker /*
2*61046927SAndroid Build Coastguard Worker  * Copyright © 2018 Valve Corporation
3*61046927SAndroid Build Coastguard Worker  * Copyright © 2017 Red Hat
4*61046927SAndroid Build Coastguard Worker  *
5*61046927SAndroid Build Coastguard Worker  * Permission is hereby granted, free of charge, to any person obtaining a
6*61046927SAndroid Build Coastguard Worker  * copy of this software and associated documentation files (the "Software"),
7*61046927SAndroid Build Coastguard Worker  * to deal in the Software without restriction, including without limitation
8*61046927SAndroid Build Coastguard Worker  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
9*61046927SAndroid Build Coastguard Worker  * and/or sell copies of the Software, and to permit persons to whom the
10*61046927SAndroid Build Coastguard Worker  * Software is furnished to do so, subject to the following conditions:
11*61046927SAndroid Build Coastguard Worker  *
12*61046927SAndroid Build Coastguard Worker  * The above copyright notice and this permission notice (including the next
13*61046927SAndroid Build Coastguard Worker  * paragraph) shall be included in all copies or substantial portions of the
14*61046927SAndroid Build Coastguard Worker  * Software.
15*61046927SAndroid Build Coastguard Worker  *
16*61046927SAndroid Build Coastguard Worker  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17*61046927SAndroid Build Coastguard Worker  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18*61046927SAndroid Build Coastguard Worker  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
19*61046927SAndroid Build Coastguard Worker  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20*61046927SAndroid Build Coastguard Worker  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21*61046927SAndroid Build Coastguard Worker  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22*61046927SAndroid Build Coastguard Worker  * IN THE SOFTWARE.
23*61046927SAndroid Build Coastguard Worker  *
24*61046927SAndroid Build Coastguard Worker  */
25*61046927SAndroid Build Coastguard Worker 
26*61046927SAndroid Build Coastguard Worker #include "vtn_private.h"
27*61046927SAndroid Build Coastguard Worker #include "GLSL.ext.AMD.h"
28*61046927SAndroid Build Coastguard Worker 
29*61046927SAndroid Build Coastguard Worker bool
vtn_handle_amd_gcn_shader_instruction(struct vtn_builder * b,SpvOp ext_opcode,const uint32_t * w,unsigned count)30*61046927SAndroid Build Coastguard Worker vtn_handle_amd_gcn_shader_instruction(struct vtn_builder *b, SpvOp ext_opcode,
31*61046927SAndroid Build Coastguard Worker                                       const uint32_t *w, unsigned count)
32*61046927SAndroid Build Coastguard Worker {
33*61046927SAndroid Build Coastguard Worker    nir_def *def;
34*61046927SAndroid Build Coastguard Worker    switch ((enum GcnShaderAMD)ext_opcode) {
35*61046927SAndroid Build Coastguard Worker    case CubeFaceIndexAMD:
36*61046927SAndroid Build Coastguard Worker       def = nir_channel(&b->nb, nir_cube_amd(&b->nb, vtn_get_nir_ssa(b, w[5])), 3);
37*61046927SAndroid Build Coastguard Worker       break;
38*61046927SAndroid Build Coastguard Worker    case CubeFaceCoordAMD: {
39*61046927SAndroid Build Coastguard Worker       def = nir_cube_amd(&b->nb, vtn_get_nir_ssa(b, w[5]));
40*61046927SAndroid Build Coastguard Worker       nir_def *st = nir_swizzle(&b->nb, def, (unsigned[]){1, 0}, 2);
41*61046927SAndroid Build Coastguard Worker       nir_def *invma = nir_frcp(&b->nb, nir_channel(&b->nb, def, 2));
42*61046927SAndroid Build Coastguard Worker       def = nir_ffma_imm2(&b->nb, st, invma, 0.5);
43*61046927SAndroid Build Coastguard Worker       break;
44*61046927SAndroid Build Coastguard Worker    }
45*61046927SAndroid Build Coastguard Worker    case TimeAMD: {
46*61046927SAndroid Build Coastguard Worker       def = nir_pack_64_2x32(&b->nb, nir_shader_clock(&b->nb, SCOPE_SUBGROUP));
47*61046927SAndroid Build Coastguard Worker       break;
48*61046927SAndroid Build Coastguard Worker    }
49*61046927SAndroid Build Coastguard Worker    default:
50*61046927SAndroid Build Coastguard Worker       unreachable("Invalid opcode");
51*61046927SAndroid Build Coastguard Worker    }
52*61046927SAndroid Build Coastguard Worker 
53*61046927SAndroid Build Coastguard Worker    vtn_push_nir_ssa(b, w[2], def);
54*61046927SAndroid Build Coastguard Worker 
55*61046927SAndroid Build Coastguard Worker    return true;
56*61046927SAndroid Build Coastguard Worker }
57*61046927SAndroid Build Coastguard Worker 
58*61046927SAndroid Build Coastguard Worker bool
vtn_handle_amd_shader_ballot_instruction(struct vtn_builder * b,SpvOp ext_opcode,const uint32_t * w,unsigned count)59*61046927SAndroid Build Coastguard Worker vtn_handle_amd_shader_ballot_instruction(struct vtn_builder *b, SpvOp ext_opcode,
60*61046927SAndroid Build Coastguard Worker                                          const uint32_t *w, unsigned count)
61*61046927SAndroid Build Coastguard Worker {
62*61046927SAndroid Build Coastguard Worker    unsigned num_args;
63*61046927SAndroid Build Coastguard Worker    nir_intrinsic_op op;
64*61046927SAndroid Build Coastguard Worker    switch ((enum ShaderBallotAMD)ext_opcode) {
65*61046927SAndroid Build Coastguard Worker    case SwizzleInvocationsAMD:
66*61046927SAndroid Build Coastguard Worker       num_args = 1;
67*61046927SAndroid Build Coastguard Worker       op = nir_intrinsic_quad_swizzle_amd;
68*61046927SAndroid Build Coastguard Worker       break;
69*61046927SAndroid Build Coastguard Worker    case SwizzleInvocationsMaskedAMD:
70*61046927SAndroid Build Coastguard Worker       num_args = 1;
71*61046927SAndroid Build Coastguard Worker       op = nir_intrinsic_masked_swizzle_amd;
72*61046927SAndroid Build Coastguard Worker       break;
73*61046927SAndroid Build Coastguard Worker    case WriteInvocationAMD:
74*61046927SAndroid Build Coastguard Worker       num_args = 3;
75*61046927SAndroid Build Coastguard Worker       op = nir_intrinsic_write_invocation_amd;
76*61046927SAndroid Build Coastguard Worker       break;
77*61046927SAndroid Build Coastguard Worker    case MbcntAMD:
78*61046927SAndroid Build Coastguard Worker       num_args = 1;
79*61046927SAndroid Build Coastguard Worker       op = nir_intrinsic_mbcnt_amd;
80*61046927SAndroid Build Coastguard Worker       break;
81*61046927SAndroid Build Coastguard Worker    default:
82*61046927SAndroid Build Coastguard Worker       unreachable("Invalid opcode");
83*61046927SAndroid Build Coastguard Worker    }
84*61046927SAndroid Build Coastguard Worker 
85*61046927SAndroid Build Coastguard Worker    const struct glsl_type *dest_type = vtn_get_type(b, w[1])->type;
86*61046927SAndroid Build Coastguard Worker    nir_intrinsic_instr *intrin = nir_intrinsic_instr_create(b->nb.shader, op);
87*61046927SAndroid Build Coastguard Worker    nir_def_init_for_type(&intrin->instr, &intrin->def, dest_type);
88*61046927SAndroid Build Coastguard Worker    if (nir_intrinsic_infos[op].src_components[0] == 0)
89*61046927SAndroid Build Coastguard Worker       intrin->num_components = intrin->def.num_components;
90*61046927SAndroid Build Coastguard Worker 
91*61046927SAndroid Build Coastguard Worker    for (unsigned i = 0; i < num_args; i++)
92*61046927SAndroid Build Coastguard Worker       intrin->src[i] = nir_src_for_ssa(vtn_get_nir_ssa(b, w[i + 5]));
93*61046927SAndroid Build Coastguard Worker 
94*61046927SAndroid Build Coastguard Worker    if (intrin->intrinsic == nir_intrinsic_quad_swizzle_amd) {
95*61046927SAndroid Build Coastguard Worker       struct vtn_value *val = vtn_value(b, w[6], vtn_value_type_constant);
96*61046927SAndroid Build Coastguard Worker       unsigned mask = val->constant->values[0].u32 |
97*61046927SAndroid Build Coastguard Worker                       val->constant->values[1].u32 << 2 |
98*61046927SAndroid Build Coastguard Worker                       val->constant->values[2].u32 << 4 |
99*61046927SAndroid Build Coastguard Worker                       val->constant->values[3].u32 << 6;
100*61046927SAndroid Build Coastguard Worker       nir_intrinsic_set_swizzle_mask(intrin, mask);
101*61046927SAndroid Build Coastguard Worker 
102*61046927SAndroid Build Coastguard Worker    } else if (intrin->intrinsic == nir_intrinsic_masked_swizzle_amd) {
103*61046927SAndroid Build Coastguard Worker       struct vtn_value *val = vtn_value(b, w[6], vtn_value_type_constant);
104*61046927SAndroid Build Coastguard Worker       unsigned mask = val->constant->values[0].u32 |
105*61046927SAndroid Build Coastguard Worker                       val->constant->values[1].u32 << 5 |
106*61046927SAndroid Build Coastguard Worker                       val->constant->values[2].u32 << 10;
107*61046927SAndroid Build Coastguard Worker       nir_intrinsic_set_swizzle_mask(intrin, mask);
108*61046927SAndroid Build Coastguard Worker    } else if (intrin->intrinsic == nir_intrinsic_mbcnt_amd) {
109*61046927SAndroid Build Coastguard Worker       /* The v_mbcnt instruction has an additional source that is added to the result.
110*61046927SAndroid Build Coastguard Worker        * This is exposed by the NIR intrinsic but not by SPIR-V, so we add zero here.
111*61046927SAndroid Build Coastguard Worker        */
112*61046927SAndroid Build Coastguard Worker       intrin->src[1] = nir_src_for_ssa(nir_imm_int(&b->nb, 0));
113*61046927SAndroid Build Coastguard Worker    }
114*61046927SAndroid Build Coastguard Worker 
115*61046927SAndroid Build Coastguard Worker    nir_builder_instr_insert(&b->nb, &intrin->instr);
116*61046927SAndroid Build Coastguard Worker    vtn_push_nir_ssa(b, w[2], &intrin->def);
117*61046927SAndroid Build Coastguard Worker 
118*61046927SAndroid Build Coastguard Worker    return true;
119*61046927SAndroid Build Coastguard Worker }
120*61046927SAndroid Build Coastguard Worker 
121*61046927SAndroid Build Coastguard Worker bool
vtn_handle_amd_shader_trinary_minmax_instruction(struct vtn_builder * b,SpvOp ext_opcode,const uint32_t * w,unsigned count)122*61046927SAndroid Build Coastguard Worker vtn_handle_amd_shader_trinary_minmax_instruction(struct vtn_builder *b, SpvOp ext_opcode,
123*61046927SAndroid Build Coastguard Worker                                                  const uint32_t *w, unsigned count)
124*61046927SAndroid Build Coastguard Worker {
125*61046927SAndroid Build Coastguard Worker    struct nir_builder *nb = &b->nb;
126*61046927SAndroid Build Coastguard Worker 
127*61046927SAndroid Build Coastguard Worker    unsigned num_inputs = count - 5;
128*61046927SAndroid Build Coastguard Worker    assert(num_inputs == 3);
129*61046927SAndroid Build Coastguard Worker    nir_def *src[3] = { NULL, };
130*61046927SAndroid Build Coastguard Worker    for (unsigned i = 0; i < num_inputs; i++)
131*61046927SAndroid Build Coastguard Worker       src[i] = vtn_get_nir_ssa(b, w[i + 5]);
132*61046927SAndroid Build Coastguard Worker 
133*61046927SAndroid Build Coastguard Worker    /* place constants at src[1-2] for easier constant-folding */
134*61046927SAndroid Build Coastguard Worker    for (unsigned i = 1; i <= 2; i++) {
135*61046927SAndroid Build Coastguard Worker       if (nir_src_as_const_value(nir_src_for_ssa(src[0]))) {
136*61046927SAndroid Build Coastguard Worker          nir_def* tmp = src[i];
137*61046927SAndroid Build Coastguard Worker          src[i] = src[0];
138*61046927SAndroid Build Coastguard Worker          src[0] = tmp;
139*61046927SAndroid Build Coastguard Worker       }
140*61046927SAndroid Build Coastguard Worker    }
141*61046927SAndroid Build Coastguard Worker    nir_def *def;
142*61046927SAndroid Build Coastguard Worker    switch ((enum ShaderTrinaryMinMaxAMD)ext_opcode) {
143*61046927SAndroid Build Coastguard Worker    case FMin3AMD:
144*61046927SAndroid Build Coastguard Worker       def = nir_fmin(nb, src[0], nir_fmin(nb, src[1], src[2]));
145*61046927SAndroid Build Coastguard Worker       break;
146*61046927SAndroid Build Coastguard Worker    case UMin3AMD:
147*61046927SAndroid Build Coastguard Worker       def = nir_umin(nb, src[0], nir_umin(nb, src[1], src[2]));
148*61046927SAndroid Build Coastguard Worker       break;
149*61046927SAndroid Build Coastguard Worker    case SMin3AMD:
150*61046927SAndroid Build Coastguard Worker       def = nir_imin(nb, src[0], nir_imin(nb, src[1], src[2]));
151*61046927SAndroid Build Coastguard Worker       break;
152*61046927SAndroid Build Coastguard Worker    case FMax3AMD:
153*61046927SAndroid Build Coastguard Worker       def = nir_fmax(nb, src[0], nir_fmax(nb, src[1], src[2]));
154*61046927SAndroid Build Coastguard Worker       break;
155*61046927SAndroid Build Coastguard Worker    case UMax3AMD:
156*61046927SAndroid Build Coastguard Worker       def = nir_umax(nb, src[0], nir_umax(nb, src[1], src[2]));
157*61046927SAndroid Build Coastguard Worker       break;
158*61046927SAndroid Build Coastguard Worker    case SMax3AMD:
159*61046927SAndroid Build Coastguard Worker       def = nir_imax(nb, src[0], nir_imax(nb, src[1], src[2]));
160*61046927SAndroid Build Coastguard Worker       break;
161*61046927SAndroid Build Coastguard Worker    case FMid3AMD:
162*61046927SAndroid Build Coastguard Worker       def = nir_fmin(nb, nir_fmax(nb, src[0], nir_fmin(nb, src[1], src[2])),
163*61046927SAndroid Build Coastguard Worker                      nir_fmax(nb, src[1], src[2]));
164*61046927SAndroid Build Coastguard Worker       break;
165*61046927SAndroid Build Coastguard Worker    case UMid3AMD:
166*61046927SAndroid Build Coastguard Worker       def = nir_umin(nb, nir_umax(nb, src[0], nir_umin(nb, src[1], src[2])),
167*61046927SAndroid Build Coastguard Worker                      nir_umax(nb, src[1], src[2]));
168*61046927SAndroid Build Coastguard Worker       break;
169*61046927SAndroid Build Coastguard Worker    case SMid3AMD:
170*61046927SAndroid Build Coastguard Worker       def = nir_imin(nb, nir_imax(nb, src[0], nir_imin(nb, src[1], src[2])),
171*61046927SAndroid Build Coastguard Worker                      nir_imax(nb, src[1], src[2]));
172*61046927SAndroid Build Coastguard Worker       break;
173*61046927SAndroid Build Coastguard Worker    default:
174*61046927SAndroid Build Coastguard Worker       unreachable("unknown opcode\n");
175*61046927SAndroid Build Coastguard Worker       break;
176*61046927SAndroid Build Coastguard Worker    }
177*61046927SAndroid Build Coastguard Worker 
178*61046927SAndroid Build Coastguard Worker    vtn_push_nir_ssa(b, w[2], def);
179*61046927SAndroid Build Coastguard Worker 
180*61046927SAndroid Build Coastguard Worker    return true;
181*61046927SAndroid Build Coastguard Worker }
182*61046927SAndroid Build Coastguard Worker 
183*61046927SAndroid Build Coastguard Worker bool
vtn_handle_amd_shader_explicit_vertex_parameter_instruction(struct vtn_builder * b,SpvOp ext_opcode,const uint32_t * w,unsigned count)184*61046927SAndroid Build Coastguard Worker vtn_handle_amd_shader_explicit_vertex_parameter_instruction(struct vtn_builder *b, SpvOp ext_opcode,
185*61046927SAndroid Build Coastguard Worker                                                             const uint32_t *w, unsigned count)
186*61046927SAndroid Build Coastguard Worker {
187*61046927SAndroid Build Coastguard Worker    nir_intrinsic_op op;
188*61046927SAndroid Build Coastguard Worker    switch ((enum ShaderExplicitVertexParameterAMD)ext_opcode) {
189*61046927SAndroid Build Coastguard Worker    case InterpolateAtVertexAMD:
190*61046927SAndroid Build Coastguard Worker       op = nir_intrinsic_interp_deref_at_vertex;
191*61046927SAndroid Build Coastguard Worker       break;
192*61046927SAndroid Build Coastguard Worker    default:
193*61046927SAndroid Build Coastguard Worker       unreachable("unknown opcode");
194*61046927SAndroid Build Coastguard Worker    }
195*61046927SAndroid Build Coastguard Worker 
196*61046927SAndroid Build Coastguard Worker    nir_intrinsic_instr *intrin = nir_intrinsic_instr_create(b->nb.shader, op);
197*61046927SAndroid Build Coastguard Worker 
198*61046927SAndroid Build Coastguard Worker    struct vtn_pointer *ptr =
199*61046927SAndroid Build Coastguard Worker       vtn_value(b, w[5], vtn_value_type_pointer)->pointer;
200*61046927SAndroid Build Coastguard Worker    nir_deref_instr *deref = vtn_pointer_to_deref(b, ptr);
201*61046927SAndroid Build Coastguard Worker 
202*61046927SAndroid Build Coastguard Worker    /* If the value we are interpolating has an index into a vector then
203*61046927SAndroid Build Coastguard Worker     * interpolate the vector and index the result of that instead. This is
204*61046927SAndroid Build Coastguard Worker     * necessary because the index will get generated as a series of nir_bcsel
205*61046927SAndroid Build Coastguard Worker     * instructions so it would no longer be an input variable.
206*61046927SAndroid Build Coastguard Worker     */
207*61046927SAndroid Build Coastguard Worker    const bool vec_array_deref = deref->deref_type == nir_deref_type_array &&
208*61046927SAndroid Build Coastguard Worker       glsl_type_is_vector(nir_deref_instr_parent(deref)->type);
209*61046927SAndroid Build Coastguard Worker 
210*61046927SAndroid Build Coastguard Worker    nir_deref_instr *vec_deref = NULL;
211*61046927SAndroid Build Coastguard Worker    if (vec_array_deref) {
212*61046927SAndroid Build Coastguard Worker       vec_deref = deref;
213*61046927SAndroid Build Coastguard Worker       deref = nir_deref_instr_parent(deref);
214*61046927SAndroid Build Coastguard Worker    }
215*61046927SAndroid Build Coastguard Worker    intrin->src[0] = nir_src_for_ssa(&deref->def);
216*61046927SAndroid Build Coastguard Worker    intrin->src[1] = nir_src_for_ssa(vtn_get_nir_ssa(b, w[6]));
217*61046927SAndroid Build Coastguard Worker 
218*61046927SAndroid Build Coastguard Worker    intrin->num_components = glsl_get_vector_elements(deref->type);
219*61046927SAndroid Build Coastguard Worker    nir_def_init(&intrin->instr, &intrin->def,
220*61046927SAndroid Build Coastguard Worker                 glsl_get_vector_elements(deref->type),
221*61046927SAndroid Build Coastguard Worker                 glsl_get_bit_size(deref->type));
222*61046927SAndroid Build Coastguard Worker 
223*61046927SAndroid Build Coastguard Worker    nir_builder_instr_insert(&b->nb, &intrin->instr);
224*61046927SAndroid Build Coastguard Worker 
225*61046927SAndroid Build Coastguard Worker    nir_def *def;
226*61046927SAndroid Build Coastguard Worker    if (vec_array_deref) {
227*61046927SAndroid Build Coastguard Worker       assert(vec_deref);
228*61046927SAndroid Build Coastguard Worker       def = nir_vector_extract(&b->nb, &intrin->def,
229*61046927SAndroid Build Coastguard Worker                                vec_deref->arr.index.ssa);
230*61046927SAndroid Build Coastguard Worker    } else {
231*61046927SAndroid Build Coastguard Worker       def = &intrin->def;
232*61046927SAndroid Build Coastguard Worker    }
233*61046927SAndroid Build Coastguard Worker    vtn_push_nir_ssa(b, w[2], def);
234*61046927SAndroid Build Coastguard Worker 
235*61046927SAndroid Build Coastguard Worker    return true;
236*61046927SAndroid Build Coastguard Worker }
237