1*61046927SAndroid Build Coastguard Worker /*
2*61046927SAndroid Build Coastguard Worker * Copyright (C) 2019 Collabora, Ltd.
3*61046927SAndroid Build Coastguard Worker *
4*61046927SAndroid Build Coastguard Worker * Permission is hereby granted, free of charge, to any person obtaining a
5*61046927SAndroid Build Coastguard Worker * copy of this software and associated documentation files (the "Software"),
6*61046927SAndroid Build Coastguard Worker * to deal in the Software without restriction, including without limitation
7*61046927SAndroid Build Coastguard Worker * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8*61046927SAndroid Build Coastguard Worker * and/or sell copies of the Software, and to permit persons to whom the
9*61046927SAndroid Build Coastguard Worker * Software is furnished to do so, subject to the following conditions:
10*61046927SAndroid Build Coastguard Worker *
11*61046927SAndroid Build Coastguard Worker * The above copyright notice and this permission notice (including the next
12*61046927SAndroid Build Coastguard Worker * paragraph) shall be included in all copies or substantial portions of the
13*61046927SAndroid Build Coastguard Worker * Software.
14*61046927SAndroid Build Coastguard Worker *
15*61046927SAndroid Build Coastguard Worker * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16*61046927SAndroid Build Coastguard Worker * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17*61046927SAndroid Build Coastguard Worker * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18*61046927SAndroid Build Coastguard Worker * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19*61046927SAndroid Build Coastguard Worker * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20*61046927SAndroid Build Coastguard Worker * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21*61046927SAndroid Build Coastguard Worker * SOFTWARE.
22*61046927SAndroid Build Coastguard Worker *
23*61046927SAndroid Build Coastguard Worker */
24*61046927SAndroid Build Coastguard Worker
25*61046927SAndroid Build Coastguard Worker #include "util/u_math.h"
26*61046927SAndroid Build Coastguard Worker #include "pan_encoder.h"
27*61046927SAndroid Build Coastguard Worker
28*61046927SAndroid Build Coastguard Worker /* This file handles attribute descriptors. The
29*61046927SAndroid Build Coastguard Worker * bulk of the complexity is from instancing. See mali_job for
30*61046927SAndroid Build Coastguard Worker * notes on how this works. But basically, for small vertex
31*61046927SAndroid Build Coastguard Worker * counts, we have a lookup table, and for large vertex counts,
32*61046927SAndroid Build Coastguard Worker * we look at the high bits as a heuristic. This has to match
33*61046927SAndroid Build Coastguard Worker * exactly how the hardware calculates this (which is why the
34*61046927SAndroid Build Coastguard Worker * algorithm is so weird) or else instancing will break. */
35*61046927SAndroid Build Coastguard Worker
/* Given an odd number (of the form 2k + 1), compute k. The argument is
 * parenthesised so that expressions built from low-precedence operators
 * (e.g. ODD(a | b)) are evaluated as a whole before the subtraction. */
#define ODD(odd) (((odd) - 1) >> 1)
38*61046927SAndroid Build Coastguard Worker
/* Padded vertex count for small draws: counts below 10 are returned as-is,
 * every other count is rounded up to the next even number. */
static unsigned
panfrost_small_padded_vertex_count(unsigned idx)
{
   const unsigned rounded_to_even = (idx + 1) & ~1u;

   return (idx < 10) ? idx : rounded_to_even;
}
47*61046927SAndroid Build Coastguard Worker
/* Padded vertex count for large draws, chosen from the four most significant
 * bits of the count.
 *
 * With n = (index of the highest set bit) - 3, the top nibble 1xyz selects
 * the result:
 *
 *    1000 -> 9 << n
 *    1001 -> 5 << (n + 1)
 *    101z -> 3 << (n + 2)
 *    110z -> 7 << (n + 1)
 *    111z -> 1 << (n + 4)
 *
 * vertex_count must be at least 8 so that a full nibble exists at and below
 * the highest set bit. Counts of 0xE0000000 and above would pad to 2^32,
 * which does not fit in the return type. */
static unsigned
panfrost_large_padded_vertex_count(uint32_t vertex_count)
{
   assert(vertex_count >= 8);

   /* One past the index of the highest set bit */
   unsigned highest = 32 - __builtin_clz(vertex_count);

   /* Using that, we extract the highest 4 bits */
   unsigned n = highest - 4;
   unsigned nibble = (vertex_count >> n) & 0xF;

   /* Great, we have the nibble. Now we can just try possibilities. Note
    * that we don't care about the bottom most bit in most cases, and we
    * know the top bit must be 1 */
   unsigned middle_two = (nibble >> 1) & 0x3;

   /* The shifts below operate on unsigned constants: the results can reach
    * bit 31, which would overflow a signed int. */
   switch (middle_two) {
   case 0: /* 100z */
      if (!(nibble & 1))
         return 9u << n;
      else
         return 5u << (n + 1);
   case 1: /* 101z */
      return 3u << (n + 2);
   case 2: /* 110z */
      return 7u << (n + 1);
   case 3: /* 111z: n + 4 == highest */
      assert(highest < 32);
      return 1u << highest;
   default:
      return 0; /* unreachable */
   }
}
80*61046927SAndroid Build Coastguard Worker
/* Compute the padded vertex count for a draw. Counts below 20 go through
 * the small-count helper; everything else goes through the large-count
 * helper. */
unsigned
panfrost_padded_vertex_count(unsigned vertex_count)
{
   return (vertex_count >= 20)
             ? panfrost_large_padded_vertex_count(vertex_count)
             : panfrost_small_padded_vertex_count(vertex_count);
}
89*61046927SAndroid Build Coastguard Worker
/* The much, much more irritating case -- instancing is enabled. See
 * panfrost_job.h for notes on how this works.
 *
 * Computes the constants needed to divide by a non-power-of-two hw_divisor
 * by multiplying by the inverse and shifting:
 *
 *    shift = floor(log2(hw_divisor))
 *    m     = ceil(2^(32 + shift) / hw_divisor)
 *
 * If 2^(32 + shift) % hw_divisor <= 2^shift, the round-down variant is
 * selected instead: the multiplier becomes m - 1 and *extra_flags is set
 * to 1. *extra_flags is left untouched otherwise, so the caller must
 * initialise it before the call.
 *
 * *o_shift receives shift. The return value is the selected multiplier with
 * bit 31 cleared; that bit is asserted to be set and is implicit.
 *
 * hw_divisor must be nonzero. */
unsigned
panfrost_compute_magic_divisor(unsigned hw_divisor, unsigned *o_shift,
                               unsigned *extra_flags)
{
   /* We have a NPOT divisor. Here's the fun one (multiplying by
    * the inverse and shifting) */

   /* floor(log2(d)) */
   unsigned shift = util_logbase2(hw_divisor);

   /* t = 2^(32 + shift). The exponent can reach 63, so the value being
    * shifted has to be an unsigned 64-bit one; a signed 1ll << 63 would
    * overflow. */
   uint64_t t = (uint64_t)1 << (32 + shift);

   /* e = 2^(shift + 32) % d */
   uint64_t e = t % hw_divisor;

   /* m = ceil(2^(32 + shift) / d), computed exactly with integers. Going
    * through double loses the fractional part for large divisors (the
    * quotient is around 2^31, leaving only ~21 fractional bits), which
    * makes ceil() come out one too small. */
   uint64_t m = (t / hw_divisor) + (e != 0);

   /* Default case */
   uint32_t magic_divisor = (uint32_t)m;

   /* Apply round-down algorithm? e <= 2^shift?. XXX: The blob
    * seems to use a different condition */
   if (e <= ((uint64_t)1 << shift)) {
      magic_divisor = (uint32_t)(m - 1);
      *extra_flags = 1;
   }

   /* Top flag implicitly set */
   assert(magic_divisor & (1u << 31));
   magic_divisor &= ~(1u << 31);
   *o_shift = shift;

   return magic_divisor;
}
131