Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
PojavLauncherTeam
GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/gallium/drivers/panfrost/pan_screen.c
4570 views
1
/*
2
* Copyright (C) 2008 VMware, Inc.
3
* Copyright (C) 2014 Broadcom
4
* Copyright (C) 2018 Alyssa Rosenzweig
5
* Copyright (C) 2019 Collabora, Ltd.
6
* Copyright (C) 2012 Rob Clark <[email protected]>
7
*
8
* Permission is hereby granted, free of charge, to any person obtaining a
9
* copy of this software and associated documentation files (the "Software"),
10
* to deal in the Software without restriction, including without limitation
11
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
12
* and/or sell copies of the Software, and to permit persons to whom the
13
* Software is furnished to do so, subject to the following conditions:
14
*
15
* The above copyright notice and this permission notice (including the next
16
* paragraph) shall be included in all copies or substantial portions of the
17
* Software.
18
*
19
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
23
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
24
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
25
* SOFTWARE.
26
*
27
*/
28
29
#include "util/u_debug.h"
30
#include "util/u_memory.h"
31
#include "util/format/u_format.h"
32
#include "util/format/u_format_s3tc.h"
33
#include "util/u_video.h"
34
#include "util/u_screen.h"
35
#include "util/os_time.h"
36
#include "util/u_process.h"
37
#include "pipe/p_defines.h"
38
#include "pipe/p_screen.h"
39
#include "draw/draw_context.h"
40
41
#include <fcntl.h>
42
43
#include "drm-uapi/drm_fourcc.h"
44
#include "drm-uapi/panfrost_drm.h"
45
46
#include "pan_bo.h"
47
#include "pan_shader.h"
48
#include "pan_screen.h"
49
#include "pan_resource.h"
50
#include "pan_public.h"
51
#include "pan_util.h"
52
#include "pan_indirect_dispatch.h"
53
#include "pan_indirect_draw.h"
54
#include "decode.h"
55
56
#include "pan_context.h"
57
#include "panfrost-quirks.h"
58
59
static const struct debug_named_value panfrost_debug_options[] = {
60
{"trace", PAN_DBG_TRACE, "Trace the command stream"},
61
{"deqp", PAN_DBG_DEQP, "Hacks for dEQP"},
62
{"dirty", PAN_DBG_DIRTY, "Always re-emit all state"},
63
{"sync", PAN_DBG_SYNC, "Wait for each job's completion and abort on GPU faults"},
64
{"precompile", PAN_DBG_PRECOMPILE, "Precompile shaders for shader-db"},
65
{"nofp16", PAN_DBG_NOFP16, "Disable 16-bit support"},
66
{"gl3", PAN_DBG_GL3, "Enable experimental GL 3.x implementation, up to 3.3"},
67
{"noafbc", PAN_DBG_NO_AFBC, "Disable AFBC support"},
68
{"nocrc", PAN_DBG_NO_CRC, "Disable transaction elimination"},
69
{"msaa16", PAN_DBG_MSAA16, "Enable MSAA 8x and 16x support"},
70
{"noindirect", PAN_DBG_NOINDIRECT, "Emulate indirect draws on the CPU"},
71
DEBUG_NAMED_VALUE_END
72
};
73
74
static const char *
75
panfrost_get_name(struct pipe_screen *screen)
76
{
77
return panfrost_model_name(pan_device(screen)->gpu_id);
78
}
79
80
static const char *
81
panfrost_get_vendor(struct pipe_screen *screen)
82
{
83
return "Panfrost";
84
}
85
86
static const char *
87
panfrost_get_device_vendor(struct pipe_screen *screen)
88
{
89
return "Arm";
90
}
91
92
static int
93
panfrost_get_param(struct pipe_screen *screen, enum pipe_cap param)
94
{
95
struct panfrost_device *dev = pan_device(screen);
96
97
/* Our GL 3.x implementation is WIP */
98
bool is_gl3 = dev->debug & (PAN_DBG_GL3 | PAN_DBG_DEQP);
99
100
/* Don't expose MRT related CAPs on GPUs that don't implement them */
101
bool has_mrt = !(dev->quirks & MIDGARD_SFBD);
102
103
/* Only kernel drivers >= 1.1 can allocate HEAP BOs */
104
bool has_heap = dev->kernel_version->version_major > 1 ||
105
dev->kernel_version->version_minor >= 1;
106
107
/* Bifrost is WIP */
108
switch (param) {
109
case PIPE_CAP_NPOT_TEXTURES:
110
case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
111
case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
112
case PIPE_CAP_VERTEX_SHADER_SATURATE:
113
case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
114
case PIPE_CAP_POINT_SPRITE:
115
case PIPE_CAP_DEPTH_CLIP_DISABLE:
116
case PIPE_CAP_DEPTH_CLIP_DISABLE_SEPARATE:
117
case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
118
case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
119
case PIPE_CAP_FRONTEND_NOOP:
120
case PIPE_CAP_SAMPLE_SHADING:
121
case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
122
case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
123
return 1;
124
125
case PIPE_CAP_MAX_RENDER_TARGETS:
126
case PIPE_CAP_FBFETCH:
127
case PIPE_CAP_FBFETCH_COHERENT:
128
return has_mrt ? 8 : 1;
129
130
case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
131
return 1;
132
133
case PIPE_CAP_OCCLUSION_QUERY:
134
case PIPE_CAP_PRIMITIVE_RESTART:
135
case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
136
return true;
137
138
case PIPE_CAP_ANISOTROPIC_FILTER:
139
return !!(dev->quirks & HAS_ANISOTROPIC);
140
141
/* Compile side is done for Bifrost, Midgard TODO. Needs some kernel
142
* work to turn on, since CYCLE_COUNT_START needs to be issued. In
143
* kbase, userspace requests this via BASE_JD_REQ_PERMON. There is not
144
* yet way to request this with mainline TODO */
145
case PIPE_CAP_TGSI_CLOCK:
146
return 0;
147
148
case PIPE_CAP_TGSI_INSTANCEID:
149
case PIPE_CAP_TEXTURE_MULTISAMPLE:
150
case PIPE_CAP_SURFACE_SAMPLE_COUNT:
151
return true;
152
153
case PIPE_CAP_SAMPLER_VIEW_TARGET:
154
case PIPE_CAP_TEXTURE_SWIZZLE:
155
case PIPE_CAP_TEXTURE_MIRROR_CLAMP:
156
case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
157
case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
158
case PIPE_CAP_BLEND_EQUATION_SEPARATE:
159
case PIPE_CAP_INDEP_BLEND_ENABLE:
160
case PIPE_CAP_INDEP_BLEND_FUNC:
161
case PIPE_CAP_GENERATE_MIPMAP:
162
case PIPE_CAP_ACCELERATED:
163
case PIPE_CAP_UMA:
164
case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
165
case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
166
case PIPE_CAP_TGSI_ARRAY_COMPONENTS:
167
case PIPE_CAP_CS_DERIVED_SYSTEM_VALUES_SUPPORTED:
168
case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
169
case PIPE_CAP_TEXTURE_BUFFER_SAMPLER:
170
case PIPE_CAP_PACKED_UNIFORMS:
171
case PIPE_CAP_IMAGE_LOAD_FORMATTED:
172
case PIPE_CAP_CUBE_MAP_ARRAY:
173
case PIPE_CAP_COMPUTE:
174
return 1;
175
176
/* We need this for OES_copy_image, but currently there are some awful
177
* interactions with AFBC that need to be worked out. */
178
case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
179
return 0;
180
181
case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
182
return PIPE_MAX_SO_BUFFERS;
183
184
case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
185
case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
186
return PIPE_MAX_SO_OUTPUTS;
187
188
case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
189
case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
190
return 1;
191
192
case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
193
return 256;
194
195
case PIPE_CAP_GLSL_FEATURE_LEVEL:
196
case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
197
return is_gl3 ? 330 : 140;
198
case PIPE_CAP_ESSL_FEATURE_LEVEL:
199
return pan_is_bifrost(dev) ? 320 : 310;
200
201
case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
202
return 16;
203
204
case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
205
return 65536;
206
207
/* Must be at least 64 for correct behaviour */
208
case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
209
return 64;
210
211
case PIPE_CAP_QUERY_TIMESTAMP:
212
return is_gl3;
213
214
/* TODO: Where does this req come from in practice? */
215
case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:
216
return 1;
217
218
case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
219
return 4096;
220
case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
221
return 13;
222
case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
223
return 13;
224
225
case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
226
/* Hardware is natively upper left */
227
return 0;
228
229
case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
230
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
231
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
232
case PIPE_CAP_TGSI_TEXCOORD:
233
return 1;
234
235
/* We would prefer varyings on Midgard, but proper sysvals on Bifrost */
236
case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
237
case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
238
case PIPE_CAP_TGSI_FS_POINT_IS_SYSVAL:
239
return pan_is_bifrost(dev);
240
241
case PIPE_CAP_SEAMLESS_CUBE_MAP:
242
case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
243
return true;
244
245
case PIPE_CAP_MAX_VERTEX_ELEMENT_SRC_OFFSET:
246
return 0xffff;
247
248
case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
249
return 0;
250
251
case PIPE_CAP_ENDIANNESS:
252
return PIPE_ENDIAN_NATIVE;
253
254
case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
255
return 4;
256
257
case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
258
return -8;
259
260
case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
261
return 7;
262
263
case PIPE_CAP_VIDEO_MEMORY: {
264
uint64_t system_memory;
265
266
if (!os_get_total_physical_memory(&system_memory))
267
return 0;
268
269
return (int)(system_memory >> 20);
270
}
271
272
case PIPE_CAP_SHADER_STENCIL_EXPORT:
273
case PIPE_CAP_CONDITIONAL_RENDER:
274
case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
275
return true;
276
277
case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
278
return 4;
279
280
case PIPE_CAP_MAX_VARYINGS:
281
return PIPE_MAX_ATTRIBS;
282
283
/* Removed in v6 (Bifrost) */
284
case PIPE_CAP_ALPHA_TEST:
285
return dev->arch <= 5;
286
287
case PIPE_CAP_FLATSHADE:
288
case PIPE_CAP_TWO_SIDED_COLOR:
289
case PIPE_CAP_CLIP_PLANES:
290
return 0;
291
292
case PIPE_CAP_PACKED_STREAM_OUTPUT:
293
return 0;
294
295
case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:
296
case PIPE_CAP_PSIZ_CLAMPED:
297
return 1;
298
299
case PIPE_CAP_NIR_IMAGES_AS_DEREF:
300
return 0;
301
302
case PIPE_CAP_DRAW_INDIRECT:
303
return has_heap;
304
305
case PIPE_CAP_START_INSTANCE:
306
case PIPE_CAP_DRAW_PARAMETERS:
307
return pan_is_bifrost(dev);
308
309
default:
310
return u_pipe_screen_get_param_defaults(screen, param);
311
}
312
}
313
314
static int
315
panfrost_get_shader_param(struct pipe_screen *screen,
316
enum pipe_shader_type shader,
317
enum pipe_shader_cap param)
318
{
319
struct panfrost_device *dev = pan_device(screen);
320
bool is_nofp16 = dev->debug & PAN_DBG_NOFP16;
321
bool is_deqp = dev->debug & PAN_DBG_DEQP;
322
323
switch (shader) {
324
case PIPE_SHADER_VERTEX:
325
case PIPE_SHADER_FRAGMENT:
326
case PIPE_SHADER_COMPUTE:
327
break;
328
default:
329
return 0;
330
}
331
332
switch (param) {
333
case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
334
case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
335
case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
336
case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
337
return 16384; /* arbitrary */
338
339
case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
340
return 1024; /* arbitrary */
341
342
case PIPE_SHADER_CAP_MAX_INPUTS:
343
/* Used as ABI on Midgard */
344
return 16;
345
346
case PIPE_SHADER_CAP_MAX_OUTPUTS:
347
return shader == PIPE_SHADER_FRAGMENT ? 8 : PIPE_MAX_ATTRIBS;
348
349
case PIPE_SHADER_CAP_MAX_TEMPS:
350
return 256; /* arbitrary */
351
352
case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
353
return 16 * 1024 * sizeof(float);
354
355
case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
356
STATIC_ASSERT(PAN_MAX_CONST_BUFFERS < 0x100);
357
return PAN_MAX_CONST_BUFFERS;
358
359
case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
360
return 0;
361
362
case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
363
return 1;
364
case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
365
return 0;
366
367
case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
368
return pan_is_bifrost(dev);
369
370
case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
371
return 1;
372
373
case PIPE_SHADER_CAP_SUBROUTINES:
374
return 0;
375
376
case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
377
return 0;
378
379
case PIPE_SHADER_CAP_INTEGERS:
380
return 1;
381
382
/* The Bifrost compiler supports full 16-bit. Midgard could but int16
383
* support is untested, so restrict INT16 to Bifrost. Midgard
384
* architecturally cannot support fp16 derivatives. */
385
386
case PIPE_SHADER_CAP_FP16:
387
case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
388
return !is_nofp16;
389
case PIPE_SHADER_CAP_FP16_DERIVATIVES:
390
case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
391
return pan_is_bifrost(dev) && !is_nofp16;
392
case PIPE_SHADER_CAP_INT16:
393
/* XXX: Advertise this CAP when a proper fix to lower_precision
394
* lands. GLSL IR validation failure in glmark2 -bterrain */
395
return pan_is_bifrost(dev) && !is_nofp16 && is_deqp;
396
397
case PIPE_SHADER_CAP_INT64_ATOMICS:
398
case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
399
case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
400
case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
401
case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
402
case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
403
return 0;
404
405
case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
406
STATIC_ASSERT(PIPE_MAX_SAMPLERS < 0x10000);
407
return PIPE_MAX_SAMPLERS;
408
409
case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
410
STATIC_ASSERT(PIPE_MAX_SHADER_SAMPLER_VIEWS < 0x10000);
411
return PIPE_MAX_SHADER_SAMPLER_VIEWS;
412
413
case PIPE_SHADER_CAP_PREFERRED_IR:
414
return PIPE_SHADER_IR_NIR;
415
416
case PIPE_SHADER_CAP_SUPPORTED_IRS:
417
return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_NIR_SERIALIZED);
418
419
case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
420
return 16;
421
422
case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
423
return PIPE_MAX_SHADER_IMAGES;
424
425
case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
426
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
427
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
428
case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
429
case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
430
return 0;
431
432
default:
433
return 0;
434
}
435
436
return 0;
437
}
438
439
static float
440
panfrost_get_paramf(struct pipe_screen *screen, enum pipe_capf param)
441
{
442
switch (param) {
443
case PIPE_CAPF_MAX_LINE_WIDTH:
444
445
FALLTHROUGH;
446
case PIPE_CAPF_MAX_LINE_WIDTH_AA:
447
return 255.0; /* arbitrary */
448
449
case PIPE_CAPF_MAX_POINT_WIDTH:
450
451
FALLTHROUGH;
452
case PIPE_CAPF_MAX_POINT_WIDTH_AA:
453
return 1024.0;
454
455
case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
456
return 16.0;
457
458
case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
459
return 16.0; /* arbitrary */
460
461
case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
462
case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
463
case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
464
return 0.0f;
465
466
default:
467
debug_printf("Unexpected PIPE_CAPF %d query\n", param);
468
return 0.0;
469
}
470
}
471
472
/**
473
* Query format support for creating a texture, drawing surface, etc.
474
* \param format the format to test
475
* \param type one of PIPE_TEXTURE, PIPE_SURFACE
476
*/
477
static bool
478
panfrost_is_format_supported( struct pipe_screen *screen,
479
enum pipe_format format,
480
enum pipe_texture_target target,
481
unsigned sample_count,
482
unsigned storage_sample_count,
483
unsigned bind)
484
{
485
struct panfrost_device *dev = pan_device(screen);
486
const struct util_format_description *format_desc;
487
488
assert(target == PIPE_BUFFER ||
489
target == PIPE_TEXTURE_1D ||
490
target == PIPE_TEXTURE_1D_ARRAY ||
491
target == PIPE_TEXTURE_2D ||
492
target == PIPE_TEXTURE_2D_ARRAY ||
493
target == PIPE_TEXTURE_RECT ||
494
target == PIPE_TEXTURE_3D ||
495
target == PIPE_TEXTURE_CUBE ||
496
target == PIPE_TEXTURE_CUBE_ARRAY);
497
498
format_desc = util_format_description(format);
499
500
if (!format_desc)
501
return false;
502
503
/* MSAA 2x gets rounded up to 4x. MSAA 8x/16x only supported on v5+.
504
* TODO: debug MSAA 8x/16x */
505
506
switch (sample_count) {
507
case 0:
508
case 1:
509
case 4:
510
break;
511
case 8:
512
case 16:
513
if (dev->debug & PAN_DBG_MSAA16)
514
break;
515
else
516
return false;
517
default:
518
return false;
519
}
520
521
if (MAX2(sample_count, 1) != MAX2(storage_sample_count, 1))
522
return false;
523
524
/* Z16 causes dEQP failures on t720 */
525
if (format == PIPE_FORMAT_Z16_UNORM && dev->quirks & MIDGARD_SFBD)
526
return false;
527
528
/* Check we support the format with the given bind */
529
530
unsigned relevant_bind = bind &
531
( PIPE_BIND_DEPTH_STENCIL | PIPE_BIND_RENDER_TARGET
532
| PIPE_BIND_VERTEX_BUFFER | PIPE_BIND_SAMPLER_VIEW);
533
534
struct panfrost_format fmt = dev->formats[format];
535
536
/* Also check that compressed texture formats are supported on this
537
* particular chip. They may not be depending on system integration
538
* differences. RGTC can be emulated so is always supported. */
539
540
bool is_rgtc = format_desc->layout == UTIL_FORMAT_LAYOUT_RGTC;
541
bool supported = panfrost_supports_compressed_format(dev,
542
MALI_EXTRACT_INDEX(fmt.hw));
543
544
if (!is_rgtc && !supported)
545
return false;
546
547
return MALI_EXTRACT_INDEX(fmt.hw) && ((relevant_bind & ~fmt.bind) == 0);
548
}
549
550
/* We always support linear and tiled operations, both external and internal.
551
* We support AFBC for a subset of formats, and colourspace transform for a
552
* subset of those. */
553
554
static void
555
panfrost_walk_dmabuf_modifiers(struct pipe_screen *screen,
556
enum pipe_format format, int max, uint64_t *modifiers, unsigned
557
int *external_only, int *out_count, uint64_t test_modifier)
558
{
559
/* Query AFBC status */
560
struct panfrost_device *dev = pan_device(screen);
561
bool afbc = panfrost_format_supports_afbc(dev, format);
562
bool ytr = panfrost_afbc_can_ytr(format);
563
564
/* Don't advertise AFBC before T760 */
565
afbc &= !(dev->quirks & MIDGARD_NO_AFBC);
566
567
unsigned count = 0;
568
569
for (unsigned i = 0; i < PAN_MODIFIER_COUNT; ++i) {
570
if (drm_is_afbc(pan_best_modifiers[i]) && !afbc)
571
continue;
572
573
if ((pan_best_modifiers[i] & AFBC_FORMAT_MOD_YTR) && !ytr)
574
continue;
575
576
if (test_modifier != DRM_FORMAT_MOD_INVALID &&
577
test_modifier != pan_best_modifiers[i])
578
continue;
579
580
count++;
581
582
if (max > (int) count) {
583
modifiers[count] = pan_best_modifiers[i];
584
585
if (external_only)
586
external_only[count] = false;
587
}
588
}
589
590
*out_count = count;
591
}
592
593
static void
594
panfrost_query_dmabuf_modifiers(struct pipe_screen *screen,
595
enum pipe_format format, int max, uint64_t *modifiers, unsigned
596
int *external_only, int *out_count)
597
{
598
panfrost_walk_dmabuf_modifiers(screen, format, max, modifiers,
599
external_only, out_count, DRM_FORMAT_MOD_INVALID);
600
}
601
602
static bool
603
panfrost_is_dmabuf_modifier_supported(struct pipe_screen *screen,
604
uint64_t modifier, enum pipe_format format,
605
bool *external_only)
606
{
607
uint64_t unused;
608
unsigned int uint_extern_only = 0;
609
int count;
610
611
panfrost_walk_dmabuf_modifiers(screen, format, 1, &unused,
612
&uint_extern_only, &count, modifier);
613
614
if (external_only)
615
*external_only = uint_extern_only ? true : false;
616
617
return count > 0;
618
}
619
620
static int
621
panfrost_get_compute_param(struct pipe_screen *pscreen, enum pipe_shader_ir ir_type,
622
enum pipe_compute_cap param, void *ret)
623
{
624
struct panfrost_device *dev = pan_device(pscreen);
625
const char * const ir = "panfrost";
626
627
#define RET(x) do { \
628
if (ret) \
629
memcpy(ret, x, sizeof(x)); \
630
return sizeof(x); \
631
} while (0)
632
633
switch (param) {
634
case PIPE_COMPUTE_CAP_ADDRESS_BITS:
635
RET((uint32_t []){ 64 });
636
637
case PIPE_COMPUTE_CAP_IR_TARGET:
638
if (ret)
639
sprintf(ret, "%s", ir);
640
return strlen(ir) * sizeof(char);
641
642
case PIPE_COMPUTE_CAP_GRID_DIMENSION:
643
RET((uint64_t []) { 3 });
644
645
case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
646
RET(((uint64_t []) { 65535, 65535, 65535 }));
647
648
case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
649
/* Unpredictable behaviour at larger sizes. Mali-G52 advertises
650
* 384x384x384. The smaller size is advertised by Mali-T628,
651
* use min until we have a need to key by arch */
652
RET(((uint64_t []) { 256, 256, 256 }));
653
654
case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
655
RET((uint64_t []) { 256 });
656
657
case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
658
RET((uint64_t []) { 1024*1024*512 /* Maybe get memory */ });
659
660
case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
661
RET((uint64_t []) { 32768 });
662
663
case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
664
case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
665
RET((uint64_t []) { 4096 });
666
667
case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:
668
RET((uint64_t []) { 1024*1024*512 /* Maybe get memory */ });
669
670
case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
671
RET((uint32_t []) { 800 /* MHz -- TODO */ });
672
673
case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
674
RET((uint32_t []) { 9999 }); // TODO
675
676
case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
677
RET((uint32_t []) { 1 });
678
679
case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
680
RET((uint32_t []) { dev->arch >= 7 ? 8 : 4 });
681
682
case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
683
RET((uint64_t []) { 1024 }); // TODO
684
}
685
686
return 0;
687
}
688
689
static void
690
panfrost_destroy_screen(struct pipe_screen *pscreen)
691
{
692
struct panfrost_device *dev = pan_device(pscreen);
693
struct panfrost_screen *screen = pan_screen(pscreen);
694
695
pan_indirect_dispatch_cleanup(dev);
696
panfrost_cleanup_indirect_draw_shaders(dev);
697
panfrost_pool_cleanup(&screen->indirect_draw.bin_pool);
698
panfrost_pool_cleanup(&screen->blitter.bin_pool);
699
panfrost_pool_cleanup(&screen->blitter.desc_pool);
700
pan_blend_shaders_cleanup(dev);
701
702
screen->vtbl.screen_destroy(pscreen);
703
704
if (dev->ro)
705
dev->ro->destroy(dev->ro);
706
panfrost_close_device(dev);
707
ralloc_free(pscreen);
708
}
709
710
static uint64_t
711
panfrost_get_timestamp(struct pipe_screen *_screen)
712
{
713
return os_time_get_nano();
714
}
715
716
static void
717
panfrost_fence_reference(struct pipe_screen *pscreen,
718
struct pipe_fence_handle **ptr,
719
struct pipe_fence_handle *fence)
720
{
721
struct panfrost_device *dev = pan_device(pscreen);
722
struct pipe_fence_handle *old = *ptr;
723
724
if (pipe_reference(&old->reference, &fence->reference)) {
725
drmSyncobjDestroy(dev->fd, old->syncobj);
726
free(old);
727
}
728
729
*ptr = fence;
730
}
731
732
static bool
733
panfrost_fence_finish(struct pipe_screen *pscreen,
734
struct pipe_context *ctx,
735
struct pipe_fence_handle *fence,
736
uint64_t timeout)
737
{
738
struct panfrost_device *dev = pan_device(pscreen);
739
int ret;
740
741
if (fence->signaled)
742
return true;
743
744
uint64_t abs_timeout = os_time_get_absolute_timeout(timeout);
745
if (abs_timeout == OS_TIMEOUT_INFINITE)
746
abs_timeout = INT64_MAX;
747
748
ret = drmSyncobjWait(dev->fd, &fence->syncobj,
749
1,
750
abs_timeout, DRM_SYNCOBJ_WAIT_FLAGS_WAIT_ALL,
751
NULL);
752
753
fence->signaled = (ret >= 0);
754
return fence->signaled;
755
}
756
757
struct pipe_fence_handle *
758
panfrost_fence_create(struct panfrost_context *ctx)
759
{
760
struct pipe_fence_handle *f = calloc(1, sizeof(*f));
761
if (!f)
762
return NULL;
763
764
struct panfrost_device *dev = pan_device(ctx->base.screen);
765
int fd = -1, ret;
766
767
/* Snapshot the last rendering out fence. We'd rather have another
768
* syncobj instead of a sync file, but this is all we get.
769
* (HandleToFD/FDToHandle just gives you another syncobj ID for the
770
* same syncobj).
771
*/
772
ret = drmSyncobjExportSyncFile(dev->fd, ctx->syncobj, &fd);
773
if (ret || fd == -1) {
774
fprintf(stderr, "export failed\n");
775
goto err_free_fence;
776
}
777
778
ret = drmSyncobjCreate(dev->fd, 0, &f->syncobj);
779
if (ret) {
780
fprintf(stderr, "create syncobj failed\n");
781
goto err_close_fd;
782
}
783
784
ret = drmSyncobjImportSyncFile(dev->fd, f->syncobj, fd);
785
if (ret) {
786
fprintf(stderr, "create syncobj failed\n");
787
goto err_destroy_syncobj;
788
}
789
790
assert(f->syncobj != ctx->syncobj);
791
close(fd);
792
pipe_reference_init(&f->reference, 1);
793
794
return f;
795
796
err_destroy_syncobj:
797
drmSyncobjDestroy(dev->fd, f->syncobj);
798
err_close_fd:
799
close(fd);
800
err_free_fence:
801
free(f);
802
return NULL;
803
}
804
805
static const void *
806
panfrost_screen_get_compiler_options(struct pipe_screen *pscreen,
807
enum pipe_shader_ir ir,
808
enum pipe_shader_type shader)
809
{
810
return pan_shader_get_compiler_options(pan_device(pscreen));
811
}
812
813
struct pipe_screen *
814
panfrost_create_screen(int fd, struct renderonly *ro)
815
{
816
/* Create the screen */
817
struct panfrost_screen *screen = rzalloc(NULL, struct panfrost_screen);
818
819
if (!screen)
820
return NULL;
821
822
struct panfrost_device *dev = pan_device(&screen->base);
823
824
/* Debug must be set first for pandecode to work correctly */
825
dev->debug = debug_get_flags_option("PAN_MESA_DEBUG", panfrost_debug_options, 0);
826
panfrost_open_device(screen, fd, dev);
827
828
if (dev->debug & PAN_DBG_NO_AFBC)
829
dev->quirks |= MIDGARD_NO_AFBC;
830
831
/* XXX: AFBC is currently broken on Bifrost in a few different ways
832
*
833
* - Preload is broken if the effective tile size is not 16x16
834
* - Some systems lack AFBC but we need kernel changes to know that
835
*/
836
if (dev->arch == 7)
837
dev->quirks |= MIDGARD_NO_AFBC;
838
839
/* XXX: Indirect draws on Midgard need debugging, emulate for now */
840
if (dev->arch < 6)
841
dev->debug |= PAN_DBG_NOINDIRECT;
842
843
dev->ro = ro;
844
845
/* Check if we're loading against a supported GPU model. */
846
847
switch (dev->gpu_id) {
848
case 0x720: /* T720 */
849
case 0x750: /* T760 */
850
case 0x820: /* T820 */
851
case 0x860: /* T860 */
852
case 0x6221: /* G72 */
853
case 0x7093: /* G31 */
854
case 0x7212: /* G52 */
855
case 0x7402: /* G52r1 */
856
break;
857
default:
858
/* Fail to load against untested models */
859
debug_printf("panfrost: Unsupported model %X", dev->gpu_id);
860
panfrost_destroy_screen(&(screen->base));
861
return NULL;
862
}
863
864
screen->base.destroy = panfrost_destroy_screen;
865
866
screen->base.get_name = panfrost_get_name;
867
screen->base.get_vendor = panfrost_get_vendor;
868
screen->base.get_device_vendor = panfrost_get_device_vendor;
869
screen->base.get_param = panfrost_get_param;
870
screen->base.get_shader_param = panfrost_get_shader_param;
871
screen->base.get_compute_param = panfrost_get_compute_param;
872
screen->base.get_paramf = panfrost_get_paramf;
873
screen->base.get_timestamp = panfrost_get_timestamp;
874
screen->base.is_format_supported = panfrost_is_format_supported;
875
screen->base.query_dmabuf_modifiers = panfrost_query_dmabuf_modifiers;
876
screen->base.is_dmabuf_modifier_supported =
877
panfrost_is_dmabuf_modifier_supported;
878
screen->base.context_create = panfrost_create_context;
879
screen->base.get_compiler_options = panfrost_screen_get_compiler_options;
880
screen->base.fence_reference = panfrost_fence_reference;
881
screen->base.fence_finish = panfrost_fence_finish;
882
screen->base.set_damage_region = panfrost_resource_set_damage_region;
883
884
panfrost_resource_screen_init(&screen->base);
885
pan_blend_shaders_init(dev);
886
panfrost_pool_init(&screen->indirect_draw.bin_pool, NULL, dev,
887
PAN_BO_EXECUTE, 65536, "Indirect draw shaders",
888
false, true);
889
panfrost_init_indirect_draw_shaders(dev, &screen->indirect_draw.bin_pool.base);
890
pan_indirect_dispatch_init(dev);
891
panfrost_pool_init(&screen->blitter.bin_pool, NULL, dev, PAN_BO_EXECUTE,
892
4096, "Blitter shaders", false, true);
893
panfrost_pool_init(&screen->blitter.desc_pool, NULL, dev, 0, 65536,
894
"Blitter RSDs", false, true);
895
panfrost_cmdstream_screen_init(screen);
896
897
return &screen->base;
898
}
899
900