Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
PojavLauncherTeam
GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/gallium/drivers/v3d/v3d_screen.c
4570 views
1
/*
2
* Copyright © 2014-2017 Broadcom
3
* Copyright (C) 2012 Rob Clark <[email protected]>
4
*
5
* Permission is hereby granted, free of charge, to any person obtaining a
6
* copy of this software and associated documentation files (the "Software"),
7
* to deal in the Software without restriction, including without limitation
8
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
9
* and/or sell copies of the Software, and to permit persons to whom the
10
* Software is furnished to do so, subject to the following conditions:
11
*
12
* The above copyright notice and this permission notice (including the next
13
* paragraph) shall be included in all copies or substantial portions of the
14
* Software.
15
*
16
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
17
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
18
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
19
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
20
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
21
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
22
* IN THE SOFTWARE.
23
*/
24
25
#include <sys/sysinfo.h>
26
27
#include "common/v3d_device_info.h"
28
#include "common/v3d_limits.h"
29
#include "util/os_misc.h"
30
#include "pipe/p_defines.h"
31
#include "pipe/p_screen.h"
32
#include "pipe/p_state.h"
33
34
#include "util/u_debug.h"
35
#include "util/u_memory.h"
36
#include "util/format/u_format.h"
37
#include "util/u_hash_table.h"
38
#include "util/u_screen.h"
39
#include "util/u_transfer_helper.h"
40
#include "util/ralloc.h"
41
#include "util/xmlconfig.h"
42
43
#include <xf86drm.h>
44
#include "v3d_screen.h"
45
#include "v3d_context.h"
46
#include "v3d_resource.h"
47
#include "compiler/v3d_compiler.h"
48
#include "drm-uapi/drm_fourcc.h"
49
50
static const char *
51
v3d_screen_get_name(struct pipe_screen *pscreen)
52
{
53
struct v3d_screen *screen = v3d_screen(pscreen);
54
55
if (!screen->name) {
56
screen->name = ralloc_asprintf(screen,
57
"V3D %d.%d",
58
screen->devinfo.ver / 10,
59
screen->devinfo.ver % 10);
60
}
61
62
return screen->name;
63
}
64
65
/**
 * pipe_screen::get_vendor / get_device_vendor hook: always reports
 * "Broadcom", independently of the screen passed in.
 */
static const char *
v3d_screen_get_vendor(struct pipe_screen *pscreen)
{
        static const char vendor_name[] = "Broadcom";

        return vendor_name;
}
70
71
static void
72
v3d_screen_destroy(struct pipe_screen *pscreen)
73
{
74
struct v3d_screen *screen = v3d_screen(pscreen);
75
76
_mesa_hash_table_destroy(screen->bo_handles, NULL);
77
v3d_bufmgr_destroy(pscreen);
78
slab_destroy_parent(&screen->transfer_pool);
79
if (screen->ro)
80
screen->ro->destroy(screen->ro);
81
82
if (using_v3d_simulator)
83
v3d_simulator_destroy(screen->sim_file);
84
85
v3d_compiler_free(screen->compiler);
86
u_transfer_helper_destroy(pscreen->transfer_helper);
87
88
close(screen->fd);
89
ralloc_free(pscreen);
90
}
91
92
static bool
93
v3d_has_feature(struct v3d_screen *screen, enum drm_v3d_param feature)
94
{
95
struct drm_v3d_get_param p = {
96
.param = feature,
97
};
98
int ret = v3d_ioctl(screen->fd, DRM_IOCTL_V3D_GET_PARAM, &p);
99
100
if (ret != 0)
101
return false;
102
103
return p.value;
104
}
105
106
static int
107
v3d_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
108
{
109
struct v3d_screen *screen = v3d_screen(pscreen);
110
111
switch (param) {
112
/* Supported features (boolean caps). */
113
case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
114
case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
115
case PIPE_CAP_NPOT_TEXTURES:
116
case PIPE_CAP_BLEND_EQUATION_SEPARATE:
117
case PIPE_CAP_TEXTURE_MULTISAMPLE:
118
case PIPE_CAP_TEXTURE_SWIZZLE:
119
case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
120
case PIPE_CAP_START_INSTANCE:
121
case PIPE_CAP_TGSI_INSTANCEID:
122
case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
123
case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
124
case PIPE_CAP_VERTEX_SHADER_SATURATE:
125
case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
126
case PIPE_CAP_OCCLUSION_QUERY:
127
case PIPE_CAP_POINT_SPRITE:
128
case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
129
case PIPE_CAP_DRAW_INDIRECT:
130
case PIPE_CAP_MULTI_DRAW_INDIRECT:
131
case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
132
case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
133
case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:
134
case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
135
case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
136
case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
137
case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
138
case PIPE_CAP_TGSI_TEXCOORD:
139
return 1;
140
141
case PIPE_CAP_TEXTURE_QUERY_LOD:
142
return screen->devinfo.ver >= 42;
143
break;
144
145
case PIPE_CAP_PACKED_UNIFORMS:
146
/* We can't enable this flag, because it results in load_ubo
147
* intrinsics across a 16b boundary, but v3d's TMU general
148
* memory accesses wrap on 16b boundaries.
149
*/
150
return 0;
151
152
case PIPE_CAP_NIR_IMAGES_AS_DEREF:
153
return 0;
154
155
case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
156
/* XXX perf: we don't want to emit these extra blits for
157
* glReadPixels(), since we still have to do an uncached read
158
* from the GPU of the result after waiting for the TFU blit
159
* to happen. However, disabling this introduces instability
160
* in
161
* dEQP-GLES31.functional.image_load_store.early_fragment_tests.*
162
* and corruption in chromium's rendering.
163
*/
164
return 1;
165
166
case PIPE_CAP_COMPUTE:
167
return screen->has_csd && screen->devinfo.ver >= 41;
168
169
case PIPE_CAP_GENERATE_MIPMAP:
170
return v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_TFU);
171
172
case PIPE_CAP_INDEP_BLEND_ENABLE:
173
return screen->devinfo.ver >= 40;
174
175
case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
176
return 256;
177
178
case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
179
if (screen->devinfo.ver < 40)
180
return 0;
181
return 4;
182
183
case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
184
if (screen->has_cache_flush)
185
return 4;
186
else
187
return 0; /* Disables shader storage */
188
189
case PIPE_CAP_GLSL_FEATURE_LEVEL:
190
return 330;
191
192
case PIPE_CAP_ESSL_FEATURE_LEVEL:
193
return 310;
194
195
case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
196
return 140;
197
198
case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
199
return 1;
200
case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:
201
return 0;
202
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
203
if (screen->devinfo.ver >= 40)
204
return 0;
205
else
206
return 1;
207
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:
208
if (screen->devinfo.ver >= 40)
209
return 1;
210
else
211
return 0;
212
213
case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
214
case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
215
case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:
216
return 1;
217
218
case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
219
return 4;
220
221
case PIPE_CAP_MAX_VARYINGS:
222
return V3D_MAX_FS_INPUTS / 4;
223
224
/* Texturing. */
225
case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
226
if (screen->devinfo.ver < 40)
227
return 2048;
228
else if (screen->nonmsaa_texture_size_limit)
229
return 7680;
230
else
231
return 4096;
232
case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
233
case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
234
if (screen->devinfo.ver < 40)
235
return 12;
236
else
237
return V3D_MAX_MIP_LEVELS;
238
case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
239
return 2048;
240
241
/* Render targets. */
242
case PIPE_CAP_MAX_RENDER_TARGETS:
243
return 4;
244
245
case PIPE_CAP_VENDOR_ID:
246
return 0x14E4;
247
case PIPE_CAP_ACCELERATED:
248
return 1;
249
case PIPE_CAP_VIDEO_MEMORY: {
250
uint64_t system_memory;
251
252
if (!os_get_total_physical_memory(&system_memory))
253
return 0;
254
255
return (int)(system_memory >> 20);
256
}
257
case PIPE_CAP_UMA:
258
return 1;
259
260
case PIPE_CAP_ALPHA_TEST:
261
case PIPE_CAP_FLATSHADE:
262
case PIPE_CAP_TWO_SIDED_COLOR:
263
case PIPE_CAP_VERTEX_COLOR_CLAMPED:
264
case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:
265
case PIPE_CAP_GL_CLAMP:
266
return 0;
267
268
/* Geometry shaders */
269
case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
270
/* Minimum required by GLES 3.2 */
271
return 1024;
272
case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
273
/* MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS / 4 */
274
return 256;
275
case PIPE_CAP_MAX_GS_INVOCATIONS:
276
return 32;
277
278
default:
279
return u_pipe_screen_get_param_defaults(pscreen, param);
280
}
281
}
282
283
static float
284
v3d_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
285
{
286
switch (param) {
287
case PIPE_CAPF_MAX_LINE_WIDTH:
288
case PIPE_CAPF_MAX_LINE_WIDTH_AA:
289
return V3D_MAX_LINE_WIDTH;
290
291
case PIPE_CAPF_MAX_POINT_WIDTH:
292
case PIPE_CAPF_MAX_POINT_WIDTH_AA:
293
return V3D_MAX_POINT_SIZE;
294
295
case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
296
return 0.0f;
297
case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
298
return 16.0f;
299
300
case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
301
case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
302
case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
303
return 0.0f;
304
default:
305
fprintf(stderr, "unknown paramf %d\n", param);
306
return 0;
307
}
308
}
309
310
static int
311
v3d_screen_get_shader_param(struct pipe_screen *pscreen, unsigned shader,
312
enum pipe_shader_cap param)
313
{
314
struct v3d_screen *screen = v3d_screen(pscreen);
315
316
switch (shader) {
317
case PIPE_SHADER_VERTEX:
318
case PIPE_SHADER_FRAGMENT:
319
break;
320
case PIPE_SHADER_COMPUTE:
321
if (!screen->has_csd)
322
return 0;
323
break;
324
case PIPE_SHADER_GEOMETRY:
325
if (screen->devinfo.ver < 41)
326
return 0;
327
break;
328
default:
329
return 0;
330
}
331
332
/* this is probably not totally correct.. but it's a start: */
333
switch (param) {
334
case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
335
case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
336
case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
337
case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
338
return 16384;
339
340
case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
341
return UINT_MAX;
342
343
case PIPE_SHADER_CAP_MAX_INPUTS:
344
switch (shader) {
345
case PIPE_SHADER_VERTEX:
346
return V3D_MAX_VS_INPUTS / 4;
347
case PIPE_SHADER_GEOMETRY:
348
return V3D_MAX_GS_INPUTS / 4;
349
case PIPE_SHADER_FRAGMENT:
350
return V3D_MAX_FS_INPUTS / 4;
351
default:
352
return 0;
353
};
354
case PIPE_SHADER_CAP_MAX_OUTPUTS:
355
if (shader == PIPE_SHADER_FRAGMENT)
356
return 4;
357
else
358
return V3D_MAX_FS_INPUTS / 4;
359
case PIPE_SHADER_CAP_MAX_TEMPS:
360
return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
361
case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
362
/* Note: Limited by the offset size in
363
* v3d_unit_data_create().
364
*/
365
return 16 * 1024 * sizeof(float);
366
case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
367
return 16;
368
case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
369
return 0;
370
case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
371
/* We don't currently support this in the backend, but that is
372
* okay because our NIR compiler sets the option
373
* lower_all_io_to_temps, which will eliminate indirect
374
* indexing on all input/output variables by translating it to
375
* indirect indexing on temporary variables instead, which we
376
* will then lower to scratch. We prefer this over setting this
377
* to 0, which would cause if-ladder injection to eliminate
378
* indirect indexing on inputs.
379
*/
380
return 1;
381
case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
382
return 1;
383
case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
384
return 1;
385
case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
386
return 1;
387
case PIPE_SHADER_CAP_SUBROUTINES:
388
return 0;
389
case PIPE_SHADER_CAP_INTEGERS:
390
return 1;
391
case PIPE_SHADER_CAP_FP16:
392
case PIPE_SHADER_CAP_FP16_DERIVATIVES:
393
case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
394
case PIPE_SHADER_CAP_INT16:
395
case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
396
case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
397
case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
398
case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
399
case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
400
case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
401
case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
402
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
403
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
404
return 0;
405
case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
406
case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
407
return V3D_OPENGL_MAX_TEXTURE_SAMPLERS;
408
409
case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
410
if (screen->has_cache_flush) {
411
if (shader == PIPE_SHADER_VERTEX ||
412
shader == PIPE_SHADER_GEOMETRY) {
413
return 0;
414
}
415
return PIPE_MAX_SHADER_BUFFERS;
416
} else {
417
return 0;
418
}
419
420
case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
421
if (screen->has_cache_flush) {
422
if (screen->devinfo.ver < 41)
423
return 0;
424
else
425
return PIPE_MAX_SHADER_IMAGES;
426
} else {
427
return 0;
428
}
429
430
case PIPE_SHADER_CAP_PREFERRED_IR:
431
return PIPE_SHADER_IR_NIR;
432
case PIPE_SHADER_CAP_SUPPORTED_IRS:
433
return 1 << PIPE_SHADER_IR_NIR;
434
case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
435
/* We use NIR's loop unrolling */
436
return 0;
437
case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
438
case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
439
return 0;
440
default:
441
fprintf(stderr, "unknown shader param %d\n", param);
442
return 0;
443
}
444
return 0;
445
}
446
447
static int
448
v3d_get_compute_param(struct pipe_screen *pscreen, enum pipe_shader_ir ir_type,
449
enum pipe_compute_cap param, void *ret)
450
{
451
struct v3d_screen *screen = v3d_screen(pscreen);
452
453
if (!screen->has_csd)
454
return 0;
455
456
#define RET(x) do { \
457
if (ret) \
458
memcpy(ret, x, sizeof(x)); \
459
return sizeof(x); \
460
} while (0)
461
462
switch (param) {
463
case PIPE_COMPUTE_CAP_ADDRESS_BITS:
464
RET((uint32_t []) { 32 });
465
break;
466
467
case PIPE_COMPUTE_CAP_IR_TARGET:
468
sprintf(ret, "v3d");
469
return strlen(ret);
470
471
case PIPE_COMPUTE_CAP_GRID_DIMENSION:
472
RET((uint64_t []) { 3 });
473
474
case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
475
/* GL_MAX_COMPUTE_SHADER_WORK_GROUP_COUNT: The CSD has a
476
* 16-bit field for the number of workgroups in each
477
* dimension.
478
*/
479
RET(((uint64_t []) { 65535, 65535, 65535 }));
480
481
case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
482
/* GL_MAX_COMPUTE_WORK_GROUP_SIZE */
483
RET(((uint64_t []) { 256, 256, 256 }));
484
485
case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
486
case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
487
/* GL_MAX_COMPUTE_WORK_GROUP_INVOCATIONS: This is
488
* limited by WG_SIZE in the CSD.
489
*/
490
RET((uint64_t []) { 256 });
491
492
case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
493
RET((uint64_t []) { 1024 * 1024 * 1024 });
494
495
case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
496
/* GL_MAX_COMPUTE_SHARED_MEMORY_SIZE */
497
RET((uint64_t []) { 32768 });
498
499
case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
500
case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
501
RET((uint64_t []) { 4096 });
502
503
case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE: {
504
struct sysinfo si;
505
sysinfo(&si);
506
RET((uint64_t []) { si.totalram });
507
}
508
509
case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
510
/* OpenCL only */
511
RET((uint32_t []) { 0 });
512
513
case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
514
RET((uint32_t []) { 1 });
515
516
case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
517
RET((uint32_t []) { 1 });
518
519
case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
520
RET((uint32_t []) { 16 });
521
522
}
523
524
return 0;
525
}
526
527
static bool
528
v3d_screen_is_format_supported(struct pipe_screen *pscreen,
529
enum pipe_format format,
530
enum pipe_texture_target target,
531
unsigned sample_count,
532
unsigned storage_sample_count,
533
unsigned usage)
534
{
535
struct v3d_screen *screen = v3d_screen(pscreen);
536
537
if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))
538
return false;
539
540
if (sample_count > 1 && sample_count != V3D_MAX_SAMPLES)
541
return false;
542
543
if (target >= PIPE_MAX_TEXTURE_TYPES) {
544
return false;
545
}
546
547
if (usage & PIPE_BIND_VERTEX_BUFFER) {
548
switch (format) {
549
case PIPE_FORMAT_R32G32B32A32_FLOAT:
550
case PIPE_FORMAT_R32G32B32_FLOAT:
551
case PIPE_FORMAT_R32G32_FLOAT:
552
case PIPE_FORMAT_R32_FLOAT:
553
case PIPE_FORMAT_R32G32B32A32_SNORM:
554
case PIPE_FORMAT_R32G32B32_SNORM:
555
case PIPE_FORMAT_R32G32_SNORM:
556
case PIPE_FORMAT_R32_SNORM:
557
case PIPE_FORMAT_R32G32B32A32_SSCALED:
558
case PIPE_FORMAT_R32G32B32_SSCALED:
559
case PIPE_FORMAT_R32G32_SSCALED:
560
case PIPE_FORMAT_R32_SSCALED:
561
case PIPE_FORMAT_R16G16B16A16_UNORM:
562
case PIPE_FORMAT_R16G16B16_UNORM:
563
case PIPE_FORMAT_R16G16_UNORM:
564
case PIPE_FORMAT_R16_UNORM:
565
case PIPE_FORMAT_R16G16B16A16_SNORM:
566
case PIPE_FORMAT_R16G16B16_SNORM:
567
case PIPE_FORMAT_R16G16_SNORM:
568
case PIPE_FORMAT_R16_SNORM:
569
case PIPE_FORMAT_R16G16B16A16_USCALED:
570
case PIPE_FORMAT_R16G16B16_USCALED:
571
case PIPE_FORMAT_R16G16_USCALED:
572
case PIPE_FORMAT_R16_USCALED:
573
case PIPE_FORMAT_R16G16B16A16_SSCALED:
574
case PIPE_FORMAT_R16G16B16_SSCALED:
575
case PIPE_FORMAT_R16G16_SSCALED:
576
case PIPE_FORMAT_R16_SSCALED:
577
case PIPE_FORMAT_B8G8R8A8_UNORM:
578
case PIPE_FORMAT_R8G8B8A8_UNORM:
579
case PIPE_FORMAT_R8G8B8_UNORM:
580
case PIPE_FORMAT_R8G8_UNORM:
581
case PIPE_FORMAT_R8_UNORM:
582
case PIPE_FORMAT_R8G8B8A8_SNORM:
583
case PIPE_FORMAT_R8G8B8_SNORM:
584
case PIPE_FORMAT_R8G8_SNORM:
585
case PIPE_FORMAT_R8_SNORM:
586
case PIPE_FORMAT_R8G8B8A8_USCALED:
587
case PIPE_FORMAT_R8G8B8_USCALED:
588
case PIPE_FORMAT_R8G8_USCALED:
589
case PIPE_FORMAT_R8_USCALED:
590
case PIPE_FORMAT_R8G8B8A8_SSCALED:
591
case PIPE_FORMAT_R8G8B8_SSCALED:
592
case PIPE_FORMAT_R8G8_SSCALED:
593
case PIPE_FORMAT_R8_SSCALED:
594
case PIPE_FORMAT_R10G10B10A2_UNORM:
595
case PIPE_FORMAT_B10G10R10A2_UNORM:
596
case PIPE_FORMAT_R10G10B10A2_SNORM:
597
case PIPE_FORMAT_B10G10R10A2_SNORM:
598
case PIPE_FORMAT_R10G10B10A2_USCALED:
599
case PIPE_FORMAT_B10G10R10A2_USCALED:
600
case PIPE_FORMAT_R10G10B10A2_SSCALED:
601
case PIPE_FORMAT_B10G10R10A2_SSCALED:
602
break;
603
default:
604
return false;
605
}
606
}
607
608
/* FORMAT_NONE gets allowed for ARB_framebuffer_no_attachments's probe
609
* of FRAMEBUFFER_MAX_SAMPLES
610
*/
611
if ((usage & PIPE_BIND_RENDER_TARGET) &&
612
format != PIPE_FORMAT_NONE &&
613
!v3d_rt_format_supported(&screen->devinfo, format)) {
614
return false;
615
}
616
617
if ((usage & PIPE_BIND_SAMPLER_VIEW) &&
618
!v3d_tex_format_supported(&screen->devinfo, format)) {
619
return false;
620
}
621
622
if ((usage & PIPE_BIND_DEPTH_STENCIL) &&
623
!(format == PIPE_FORMAT_S8_UINT_Z24_UNORM ||
624
format == PIPE_FORMAT_X8Z24_UNORM ||
625
format == PIPE_FORMAT_Z16_UNORM ||
626
format == PIPE_FORMAT_Z32_FLOAT ||
627
format == PIPE_FORMAT_Z32_FLOAT_S8X24_UINT)) {
628
return false;
629
}
630
631
if ((usage & PIPE_BIND_INDEX_BUFFER) &&
632
!(format == PIPE_FORMAT_R8_UINT ||
633
format == PIPE_FORMAT_R16_UINT ||
634
format == PIPE_FORMAT_R32_UINT)) {
635
return false;
636
}
637
638
return true;
639
}
640
641
static const nir_shader_compiler_options v3d_nir_options = {
642
.lower_add_sat = true,
643
.lower_all_io_to_temps = true,
644
.lower_extract_byte = true,
645
.lower_extract_word = true,
646
.lower_insert_byte = true,
647
.lower_insert_word = true,
648
.lower_bitfield_insert_to_shifts = true,
649
.lower_bitfield_extract_to_shifts = true,
650
.lower_bitfield_reverse = true,
651
.lower_bit_count = true,
652
.lower_cs_local_id_from_index = true,
653
.lower_ffract = true,
654
.lower_fmod = true,
655
.lower_pack_unorm_2x16 = true,
656
.lower_pack_snorm_2x16 = true,
657
.lower_pack_unorm_4x8 = true,
658
.lower_pack_snorm_4x8 = true,
659
.lower_unpack_unorm_4x8 = true,
660
.lower_unpack_snorm_4x8 = true,
661
.lower_pack_half_2x16 = true,
662
.lower_unpack_half_2x16 = true,
663
.lower_fdiv = true,
664
.lower_find_lsb = true,
665
.lower_ffma16 = true,
666
.lower_ffma32 = true,
667
.lower_ffma64 = true,
668
.lower_flrp32 = true,
669
.lower_fpow = true,
670
.lower_fsat = true,
671
.lower_fsqrt = true,
672
.lower_ifind_msb = true,
673
.lower_isign = true,
674
.lower_ldexp = true,
675
.lower_mul_high = true,
676
.lower_wpos_pntc = true,
677
.lower_rotate = true,
678
.lower_to_scalar = true,
679
.has_fsub = true,
680
.has_isub = true,
681
.divergence_analysis_options =
682
nir_divergence_multiple_workgroup_per_compute_subgroup,
683
/* This will enable loop unrolling in the state tracker so we won't
684
* be able to selectively disable it in backend if it leads to
685
* lower thread counts or TMU spills. Choose a conservative maximum to
686
* limit register pressure impact.
687
*/
688
.max_unroll_iterations = 16,
689
};
690
691
static const void *
692
v3d_screen_get_compiler_options(struct pipe_screen *pscreen,
693
enum pipe_shader_ir ir, unsigned shader)
694
{
695
return &v3d_nir_options;
696
}
697
698
static const uint64_t v3d_available_modifiers[] = {
699
DRM_FORMAT_MOD_BROADCOM_UIF,
700
DRM_FORMAT_MOD_LINEAR,
701
DRM_FORMAT_MOD_BROADCOM_SAND128,
702
};
703
704
static void
705
v3d_screen_query_dmabuf_modifiers(struct pipe_screen *pscreen,
706
enum pipe_format format, int max,
707
uint64_t *modifiers,
708
unsigned int *external_only,
709
int *count)
710
{
711
int i;
712
int num_modifiers = ARRAY_SIZE(v3d_available_modifiers);
713
714
/* Expose DRM_FORMAT_MOD_BROADCOM_SAND128 only for PIPE_FORMAT_NV12 */
715
if (format != PIPE_FORMAT_NV12)
716
num_modifiers--;
717
718
if (!modifiers) {
719
*count = num_modifiers;
720
return;
721
}
722
723
*count = MIN2(max, num_modifiers);
724
for (i = 0; i < *count; i++) {
725
modifiers[i] = v3d_available_modifiers[i];
726
if (external_only)
727
external_only[i] = util_format_is_yuv(format);
728
}
729
}
730
731
static bool
732
v3d_screen_is_dmabuf_modifier_supported(struct pipe_screen *pscreen,
733
uint64_t modifier,
734
enum pipe_format format,
735
bool *external_only)
736
{
737
int i;
738
bool is_sand_col128 = (format == PIPE_FORMAT_NV12) &&
739
(fourcc_mod_broadcom_mod(modifier) == DRM_FORMAT_MOD_BROADCOM_SAND128);
740
741
if (is_sand_col128) {
742
if (external_only)
743
*external_only = true;
744
return true;
745
}
746
747
/* We don't want to generally allow DRM_FORMAT_MOD_BROADCOM_SAND128
748
* modifier, that is the last v3d_available_modifiers. We only accept
749
* it in the case of having a PIPE_FORMAT_NV12.
750
*/
751
assert(v3d_available_modifiers[ARRAY_SIZE(v3d_available_modifiers) - 1] ==
752
DRM_FORMAT_MOD_BROADCOM_SAND128);
753
for (i = 0; i < ARRAY_SIZE(v3d_available_modifiers) - 1; i++) {
754
if (v3d_available_modifiers[i] == modifier) {
755
if (external_only)
756
*external_only = util_format_is_yuv(format);
757
758
return true;
759
}
760
}
761
762
return false;
763
}
764
765
struct pipe_screen *
766
v3d_screen_create(int fd, const struct pipe_screen_config *config,
767
struct renderonly *ro)
768
{
769
struct v3d_screen *screen = rzalloc(NULL, struct v3d_screen);
770
struct pipe_screen *pscreen;
771
772
pscreen = &screen->base;
773
774
pscreen->destroy = v3d_screen_destroy;
775
pscreen->get_param = v3d_screen_get_param;
776
pscreen->get_paramf = v3d_screen_get_paramf;
777
pscreen->get_shader_param = v3d_screen_get_shader_param;
778
pscreen->get_compute_param = v3d_get_compute_param;
779
pscreen->context_create = v3d_context_create;
780
pscreen->is_format_supported = v3d_screen_is_format_supported;
781
782
screen->fd = fd;
783
screen->ro = ro;
784
785
list_inithead(&screen->bo_cache.time_list);
786
(void)mtx_init(&screen->bo_handles_mutex, mtx_plain);
787
screen->bo_handles = util_hash_table_create_ptr_keys();
788
789
#if defined(USE_V3D_SIMULATOR)
790
screen->sim_file = v3d_simulator_init(screen->fd);
791
#endif
792
793
if (!v3d_get_device_info(screen->fd, &screen->devinfo, &v3d_ioctl))
794
goto fail;
795
796
/* We have to driCheckOption for the simulator mode to not assertion
797
* fail on not having our XML config.
798
*/
799
const char *nonmsaa_name = "v3d_nonmsaa_texture_size_limit";
800
screen->nonmsaa_texture_size_limit =
801
driCheckOption(config->options, nonmsaa_name, DRI_BOOL) &&
802
driQueryOptionb(config->options, nonmsaa_name);
803
804
slab_create_parent(&screen->transfer_pool, sizeof(struct v3d_transfer), 16);
805
806
screen->has_csd = v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CSD);
807
screen->has_cache_flush =
808
v3d_has_feature(screen, DRM_V3D_PARAM_SUPPORTS_CACHE_FLUSH);
809
810
v3d_fence_init(screen);
811
812
v3d_process_debug_variable();
813
814
v3d_resource_screen_init(pscreen);
815
816
screen->compiler = v3d_compiler_init(&screen->devinfo);
817
818
pscreen->get_name = v3d_screen_get_name;
819
pscreen->get_vendor = v3d_screen_get_vendor;
820
pscreen->get_device_vendor = v3d_screen_get_vendor;
821
pscreen->get_compiler_options = v3d_screen_get_compiler_options;
822
pscreen->query_dmabuf_modifiers = v3d_screen_query_dmabuf_modifiers;
823
pscreen->is_dmabuf_modifier_supported =
824
v3d_screen_is_dmabuf_modifier_supported;
825
826
return pscreen;
827
828
fail:
829
close(fd);
830
ralloc_free(pscreen);
831
return NULL;
832
}
833
834