/*
 * Copyright (C) 2019 Collabora, Ltd.
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 * SOFTWARE.
 *
 * Authors:
 *   Alyssa Rosenzweig <[email protected]>
 */
26*61046927SAndroid Build Coastguard Worker
27*61046927SAndroid Build Coastguard Worker #include "util/macros.h"
28*61046927SAndroid Build Coastguard Worker
29*61046927SAndroid Build Coastguard Worker #include "kmod/pan_kmod.h"
30*61046927SAndroid Build Coastguard Worker #include "panfrost/util/pan_ir.h"
31*61046927SAndroid Build Coastguard Worker #include "pan_props.h"
32*61046927SAndroid Build Coastguard Worker
33*61046927SAndroid Build Coastguard Worker #include <genxml/gen_macros.h>
34*61046927SAndroid Build Coastguard Worker
35*61046927SAndroid Build Coastguard Worker /* Fixed "minimum revisions" */
36*61046927SAndroid Build Coastguard Worker #define NO_ANISO (~0)
37*61046927SAndroid Build Coastguard Worker #define HAS_ANISO (0)
38*61046927SAndroid Build Coastguard Worker
39*61046927SAndroid Build Coastguard Worker #define MODEL(gpu_id_, gpu_variant_, shortname, counters_, \
40*61046927SAndroid Build Coastguard Worker min_rev_anisotropic_, tib_size_, quirks_) \
41*61046927SAndroid Build Coastguard Worker { \
42*61046927SAndroid Build Coastguard Worker .gpu_id = gpu_id_, .gpu_variant = gpu_variant_, \
43*61046927SAndroid Build Coastguard Worker .name = "Mali-" shortname " (Panfrost)", \
44*61046927SAndroid Build Coastguard Worker .performance_counters = counters_, \
45*61046927SAndroid Build Coastguard Worker .min_rev_anisotropic = min_rev_anisotropic_, \
46*61046927SAndroid Build Coastguard Worker .tilebuffer_size = tib_size_, .quirks = quirks_, \
47*61046927SAndroid Build Coastguard Worker }
48*61046927SAndroid Build Coastguard Worker
49*61046927SAndroid Build Coastguard Worker /* Table of supported Mali GPUs */
50*61046927SAndroid Build Coastguard Worker /* clang-format off */
51*61046927SAndroid Build Coastguard Worker const struct panfrost_model panfrost_model_list[] = {
52*61046927SAndroid Build Coastguard Worker MODEL(0x600, 0, "T600", "T60x", NO_ANISO, 8192, {}),
53*61046927SAndroid Build Coastguard Worker MODEL(0x620, 0, "T620", "T62x", NO_ANISO, 8192, {}),
54*61046927SAndroid Build Coastguard Worker MODEL(0x720, 0, "T720", "T72x", NO_ANISO, 8192, { .no_hierarchical_tiling = true }),
55*61046927SAndroid Build Coastguard Worker MODEL(0x750, 0, "T760", "T76x", NO_ANISO, 8192, {}),
56*61046927SAndroid Build Coastguard Worker MODEL(0x820, 0, "T820", "T82x", NO_ANISO, 8192, { .no_hierarchical_tiling = true }),
57*61046927SAndroid Build Coastguard Worker MODEL(0x830, 0, "T830", "T83x", NO_ANISO, 8192, { .no_hierarchical_tiling = true }),
58*61046927SAndroid Build Coastguard Worker MODEL(0x860, 0, "T860", "T86x", NO_ANISO, 8192, {}),
59*61046927SAndroid Build Coastguard Worker MODEL(0x880, 0, "T880", "T88x", NO_ANISO, 8192, {}),
60*61046927SAndroid Build Coastguard Worker
61*61046927SAndroid Build Coastguard Worker MODEL(0x6000, 0, "G71", "TMIx", NO_ANISO, 8192, {}),
62*61046927SAndroid Build Coastguard Worker MODEL(0x6221, 0, "G72", "THEx", 0x0030 /* r0p3 */, 16384, {}),
63*61046927SAndroid Build Coastguard Worker MODEL(0x7090, 0, "G51", "TSIx", 0x1010 /* r1p1 */, 16384, {}),
64*61046927SAndroid Build Coastguard Worker MODEL(0x7093, 0, "G31", "TDVx", HAS_ANISO, 16384, {}),
65*61046927SAndroid Build Coastguard Worker MODEL(0x7211, 0, "G76", "TNOx", HAS_ANISO, 16384, {}),
66*61046927SAndroid Build Coastguard Worker MODEL(0x7212, 0, "G52", "TGOx", HAS_ANISO, 16384, {}),
67*61046927SAndroid Build Coastguard Worker MODEL(0x7402, 0, "G52 r1", "TGOx", HAS_ANISO, 16384, {}),
68*61046927SAndroid Build Coastguard Worker MODEL(0x9091, 0, "G57", "TNAx", HAS_ANISO, 16384, {}),
69*61046927SAndroid Build Coastguard Worker MODEL(0x9093, 0, "G57", "TNAx", HAS_ANISO, 16384, {}),
70*61046927SAndroid Build Coastguard Worker
71*61046927SAndroid Build Coastguard Worker MODEL(0xa867, 0, "G610", "TVIx", HAS_ANISO, 32768, {}),
72*61046927SAndroid Build Coastguard Worker MODEL(0xac74, 0, "G310", "TVAx", HAS_ANISO, 16384, {}),
73*61046927SAndroid Build Coastguard Worker MODEL(0xac74, 1, "G310", "TVAx", HAS_ANISO, 16384, {}),
74*61046927SAndroid Build Coastguard Worker MODEL(0xac74, 2, "G310", "TVAx", HAS_ANISO, 16384, {}),
75*61046927SAndroid Build Coastguard Worker MODEL(0xac74, 3, "G310", "TVAx", HAS_ANISO, 32768, {}),
76*61046927SAndroid Build Coastguard Worker MODEL(0xac74, 4, "G310", "TVAx", HAS_ANISO, 32768, {}),
77*61046927SAndroid Build Coastguard Worker };
78*61046927SAndroid Build Coastguard Worker /* clang-format on */
79*61046927SAndroid Build Coastguard Worker
80*61046927SAndroid Build Coastguard Worker #undef NO_ANISO
81*61046927SAndroid Build Coastguard Worker #undef HAS_ANISO
82*61046927SAndroid Build Coastguard Worker #undef MODEL
83*61046927SAndroid Build Coastguard Worker
84*61046927SAndroid Build Coastguard Worker /*
85*61046927SAndroid Build Coastguard Worker * Look up a supported model by its GPU ID, or return NULL if the model is not
86*61046927SAndroid Build Coastguard Worker * supported at this time.
87*61046927SAndroid Build Coastguard Worker */
88*61046927SAndroid Build Coastguard Worker const struct panfrost_model *
panfrost_get_model(uint32_t gpu_id,uint32_t gpu_variant)89*61046927SAndroid Build Coastguard Worker panfrost_get_model(uint32_t gpu_id, uint32_t gpu_variant)
90*61046927SAndroid Build Coastguard Worker {
91*61046927SAndroid Build Coastguard Worker for (unsigned i = 0; i < ARRAY_SIZE(panfrost_model_list); ++i) {
92*61046927SAndroid Build Coastguard Worker if (panfrost_model_list[i].gpu_id == gpu_id &&
93*61046927SAndroid Build Coastguard Worker panfrost_model_list[i].gpu_variant == gpu_variant)
94*61046927SAndroid Build Coastguard Worker return &panfrost_model_list[i];
95*61046927SAndroid Build Coastguard Worker }
96*61046927SAndroid Build Coastguard Worker
97*61046927SAndroid Build Coastguard Worker return NULL;
98*61046927SAndroid Build Coastguard Worker }
99*61046927SAndroid Build Coastguard Worker
100*61046927SAndroid Build Coastguard Worker unsigned
panfrost_query_l2_slices(const struct pan_kmod_dev_props * props)101*61046927SAndroid Build Coastguard Worker panfrost_query_l2_slices(const struct pan_kmod_dev_props *props)
102*61046927SAndroid Build Coastguard Worker {
103*61046927SAndroid Build Coastguard Worker /* L2_SLICES is MEM_FEATURES[11:8] minus(1) */
104*61046927SAndroid Build Coastguard Worker return ((props->mem_features >> 8) & 0xF) + 1;
105*61046927SAndroid Build Coastguard Worker }
106*61046927SAndroid Build Coastguard Worker
107*61046927SAndroid Build Coastguard Worker struct panfrost_tiler_features
panfrost_query_tiler_features(const struct pan_kmod_dev_props * props)108*61046927SAndroid Build Coastguard Worker panfrost_query_tiler_features(const struct pan_kmod_dev_props *props)
109*61046927SAndroid Build Coastguard Worker {
110*61046927SAndroid Build Coastguard Worker /* Default value (2^9 bytes and 8 levels) to match old behaviour */
111*61046927SAndroid Build Coastguard Worker uint32_t raw = props->tiler_features;
112*61046927SAndroid Build Coastguard Worker
113*61046927SAndroid Build Coastguard Worker /* Bin size is log2 in the first byte, max levels in the second byte */
114*61046927SAndroid Build Coastguard Worker return (struct panfrost_tiler_features){
115*61046927SAndroid Build Coastguard Worker .bin_size = (1 << (raw & BITFIELD_MASK(5))),
116*61046927SAndroid Build Coastguard Worker .max_levels = (raw >> 8) & BITFIELD_MASK(4),
117*61046927SAndroid Build Coastguard Worker };
118*61046927SAndroid Build Coastguard Worker }
119*61046927SAndroid Build Coastguard Worker
120*61046927SAndroid Build Coastguard Worker unsigned
panfrost_query_core_count(const struct pan_kmod_dev_props * props,unsigned * core_id_range)121*61046927SAndroid Build Coastguard Worker panfrost_query_core_count(const struct pan_kmod_dev_props *props,
122*61046927SAndroid Build Coastguard Worker unsigned *core_id_range)
123*61046927SAndroid Build Coastguard Worker {
124*61046927SAndroid Build Coastguard Worker /* On older kernels, worst-case to 16 cores */
125*61046927SAndroid Build Coastguard Worker
126*61046927SAndroid Build Coastguard Worker unsigned mask = props->shader_present;
127*61046927SAndroid Build Coastguard Worker
128*61046927SAndroid Build Coastguard Worker /* Some cores might be absent. In some cases, we care
129*61046927SAndroid Build Coastguard Worker * about the range of core IDs (that is, the greatest core ID + 1). If
130*61046927SAndroid Build Coastguard Worker * the core mask is contiguous, this equals the core count.
131*61046927SAndroid Build Coastguard Worker */
132*61046927SAndroid Build Coastguard Worker *core_id_range = util_last_bit(mask);
133*61046927SAndroid Build Coastguard Worker
134*61046927SAndroid Build Coastguard Worker /* The actual core count skips overs the gaps */
135*61046927SAndroid Build Coastguard Worker return util_bitcount(mask);
136*61046927SAndroid Build Coastguard Worker }
137*61046927SAndroid Build Coastguard Worker
138*61046927SAndroid Build Coastguard Worker unsigned
panfrost_query_thread_tls_alloc(const struct pan_kmod_dev_props * props)139*61046927SAndroid Build Coastguard Worker panfrost_query_thread_tls_alloc(const struct pan_kmod_dev_props *props)
140*61046927SAndroid Build Coastguard Worker {
141*61046927SAndroid Build Coastguard Worker return props->max_tls_instance_per_core ?: props->max_threads_per_core;
142*61046927SAndroid Build Coastguard Worker }
143*61046927SAndroid Build Coastguard Worker
144*61046927SAndroid Build Coastguard Worker unsigned
panfrost_compute_max_thread_count(const struct pan_kmod_dev_props * props,unsigned work_reg_count)145*61046927SAndroid Build Coastguard Worker panfrost_compute_max_thread_count(const struct pan_kmod_dev_props *props,
146*61046927SAndroid Build Coastguard Worker unsigned work_reg_count)
147*61046927SAndroid Build Coastguard Worker {
148*61046927SAndroid Build Coastguard Worker unsigned aligned_reg_count;
149*61046927SAndroid Build Coastguard Worker
150*61046927SAndroid Build Coastguard Worker /* 4, 8 or 16 registers per shader on Midgard
151*61046927SAndroid Build Coastguard Worker * 32 or 64 registers per shader on Bifrost
152*61046927SAndroid Build Coastguard Worker */
153*61046927SAndroid Build Coastguard Worker if (pan_arch(props->gpu_prod_id) <= 5) {
154*61046927SAndroid Build Coastguard Worker aligned_reg_count = util_next_power_of_two(MAX2(work_reg_count, 4));
155*61046927SAndroid Build Coastguard Worker assert(aligned_reg_count <= 16);
156*61046927SAndroid Build Coastguard Worker } else {
157*61046927SAndroid Build Coastguard Worker aligned_reg_count = work_reg_count <= 32 ? 32 : 64;
158*61046927SAndroid Build Coastguard Worker }
159*61046927SAndroid Build Coastguard Worker
160*61046927SAndroid Build Coastguard Worker return MIN3(props->max_threads_per_wg, props->max_threads_per_core,
161*61046927SAndroid Build Coastguard Worker props->num_registers_per_core / aligned_reg_count);
162*61046927SAndroid Build Coastguard Worker }
163*61046927SAndroid Build Coastguard Worker
164*61046927SAndroid Build Coastguard Worker uint32_t
panfrost_query_compressed_formats(const struct pan_kmod_dev_props * props)165*61046927SAndroid Build Coastguard Worker panfrost_query_compressed_formats(const struct pan_kmod_dev_props *props)
166*61046927SAndroid Build Coastguard Worker {
167*61046927SAndroid Build Coastguard Worker return props->texture_features[0];
168*61046927SAndroid Build Coastguard Worker }
169*61046927SAndroid Build Coastguard Worker
170*61046927SAndroid Build Coastguard Worker /* Check for AFBC hardware support. AFBC is introduced in v5. Implementations
171*61046927SAndroid Build Coastguard Worker * may omit it, signaled as a nonzero value in the AFBC_FEATURES property. */
172*61046927SAndroid Build Coastguard Worker
173*61046927SAndroid Build Coastguard Worker bool
panfrost_query_afbc(const struct pan_kmod_dev_props * props)174*61046927SAndroid Build Coastguard Worker panfrost_query_afbc(const struct pan_kmod_dev_props *props)
175*61046927SAndroid Build Coastguard Worker {
176*61046927SAndroid Build Coastguard Worker unsigned reg = props->afbc_features;
177*61046927SAndroid Build Coastguard Worker
178*61046927SAndroid Build Coastguard Worker return (pan_arch(props->gpu_prod_id) >= 5) && (reg == 0);
179*61046927SAndroid Build Coastguard Worker }
180*61046927SAndroid Build Coastguard Worker
181*61046927SAndroid Build Coastguard Worker /* Check for AFRC hardware support. AFRC is introduced in v10. Implementations
182*61046927SAndroid Build Coastguard Worker * may omit it, signaled in bit 25 of TEXTURE_FEATURES_0 property. */
183*61046927SAndroid Build Coastguard Worker
184*61046927SAndroid Build Coastguard Worker bool
panfrost_query_afrc(const struct pan_kmod_dev_props * props)185*61046927SAndroid Build Coastguard Worker panfrost_query_afrc(const struct pan_kmod_dev_props *props)
186*61046927SAndroid Build Coastguard Worker {
187*61046927SAndroid Build Coastguard Worker return (pan_arch(props->gpu_prod_id) >= 10) &&
188*61046927SAndroid Build Coastguard Worker (props->texture_features[0] & (1 << 25));
189*61046927SAndroid Build Coastguard Worker }
190*61046927SAndroid Build Coastguard Worker
191*61046927SAndroid Build Coastguard Worker /*
192*61046927SAndroid Build Coastguard Worker * To pipeline multiple tiles, a given tile may use at most half of the tile
193*61046927SAndroid Build Coastguard Worker * buffer. This function returns the optimal size (assuming pipelining).
194*61046927SAndroid Build Coastguard Worker *
195*61046927SAndroid Build Coastguard Worker * For Mali-G510 and Mali-G310, we will need extra logic to query the tilebuffer
196*61046927SAndroid Build Coastguard Worker * size for the particular variant. The CORE_FEATURES register might help.
197*61046927SAndroid Build Coastguard Worker */
198*61046927SAndroid Build Coastguard Worker unsigned
panfrost_query_optimal_tib_size(const struct panfrost_model * model)199*61046927SAndroid Build Coastguard Worker panfrost_query_optimal_tib_size(const struct panfrost_model *model)
200*61046927SAndroid Build Coastguard Worker {
201*61046927SAndroid Build Coastguard Worker /* Preconditions ensure the returned value is a multiple of 1 KiB, the
202*61046927SAndroid Build Coastguard Worker * granularity of the colour buffer allocation field.
203*61046927SAndroid Build Coastguard Worker */
204*61046927SAndroid Build Coastguard Worker assert(model->tilebuffer_size >= 2048);
205*61046927SAndroid Build Coastguard Worker assert(util_is_power_of_two_nonzero(model->tilebuffer_size));
206*61046927SAndroid Build Coastguard Worker
207*61046927SAndroid Build Coastguard Worker return model->tilebuffer_size / 2;
208*61046927SAndroid Build Coastguard Worker }
209*61046927SAndroid Build Coastguard Worker
210*61046927SAndroid Build Coastguard Worker uint64_t
panfrost_clamp_to_usable_va_range(const struct pan_kmod_dev * dev,uint64_t va)211*61046927SAndroid Build Coastguard Worker panfrost_clamp_to_usable_va_range(const struct pan_kmod_dev *dev, uint64_t va)
212*61046927SAndroid Build Coastguard Worker {
213*61046927SAndroid Build Coastguard Worker struct pan_kmod_va_range user_va_range =
214*61046927SAndroid Build Coastguard Worker pan_kmod_dev_query_user_va_range(dev);
215*61046927SAndroid Build Coastguard Worker
216*61046927SAndroid Build Coastguard Worker if (va < user_va_range.start)
217*61046927SAndroid Build Coastguard Worker return user_va_range.start;
218*61046927SAndroid Build Coastguard Worker else if (va > user_va_range.start + user_va_range.size)
219*61046927SAndroid Build Coastguard Worker return user_va_range.start + user_va_range.size;
220*61046927SAndroid Build Coastguard Worker
221*61046927SAndroid Build Coastguard Worker return va;
222*61046927SAndroid Build Coastguard Worker }
223