Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
PojavLauncherTeam
GitHub Repository: PojavLauncherTeam/mesa
Path: blob/21.2-virgl/src/gallium/drivers/crocus/crocus_screen.c
4570 views
1
/*
2
* Copyright © 2017 Intel Corporation
3
*
4
* Permission is hereby granted, free of charge, to any person obtaining a
5
* copy of this software and associated documentation files (the "Software"),
6
* to deal in the Software without restriction, including without limitation
7
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
8
* and/or sell copies of the Software, and to permit persons to whom the
9
* Software is furnished to do so, subject to the following conditions:
10
*
11
* The above copyright notice and this permission notice shall be included
12
* in all copies or substantial portions of the Software.
13
*
14
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
15
* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
18
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
19
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
20
* DEALINGS IN THE SOFTWARE.
21
*/
22
23
/**
24
* @file crocus_screen.c
25
*
26
* Screen related driver hooks and capability lists.
27
*
28
* A program may use multiple rendering contexts (crocus_context), but
29
* they all share a common screen (crocus_screen). Global driver state
30
* can be stored in the screen; it may be accessed by multiple threads.
31
*/
32
33
#include <stdio.h>
34
#include <errno.h>
35
#include <sys/ioctl.h>
36
#include "pipe/p_defines.h"
37
#include "pipe/p_state.h"
38
#include "pipe/p_context.h"
39
#include "pipe/p_screen.h"
40
#include "util/debug.h"
41
#include "util/u_inlines.h"
42
#include "util/format/u_format.h"
43
#include "util/u_transfer_helper.h"
44
#include "util/u_upload_mgr.h"
45
#include "util/ralloc.h"
46
#include "util/xmlconfig.h"
47
#include "drm-uapi/i915_drm.h"
48
#include "crocus_context.h"
49
#include "crocus_defines.h"
50
#include "crocus_fence.h"
51
#include "crocus_pipe.h"
52
#include "crocus_resource.h"
53
#include "crocus_screen.h"
54
#include "intel/compiler/brw_compiler.h"
55
#include "intel/common/intel_gem.h"
56
#include "intel/common/intel_l3_config.h"
57
#include "intel/common/intel_uuid.h"
58
#include "crocus_monitor.h"
59
60
#define genX_call(devinfo, func, ...) \
61
switch ((devinfo)->verx10) { \
62
case 80: \
63
gfx8_##func(__VA_ARGS__); \
64
break; \
65
case 75: \
66
gfx75_##func(__VA_ARGS__); \
67
break; \
68
case 70: \
69
gfx7_##func(__VA_ARGS__); \
70
break; \
71
case 60: \
72
gfx6_##func(__VA_ARGS__); \
73
break; \
74
case 50: \
75
gfx5_##func(__VA_ARGS__); \
76
break; \
77
case 45: \
78
gfx45_##func(__VA_ARGS__); \
79
break; \
80
case 40: \
81
gfx4_##func(__VA_ARGS__); \
82
break; \
83
default: \
84
unreachable("Unknown hardware generation"); \
85
}
86
87
static void
88
crocus_flush_frontbuffer(struct pipe_screen *_screen,
89
struct pipe_context *_pipe,
90
struct pipe_resource *resource,
91
unsigned level, unsigned layer,
92
void *context_private, struct pipe_box *box)
93
{
94
}
95
96
static const char *
97
crocus_get_vendor(struct pipe_screen *pscreen)
98
{
99
return "Intel";
100
}
101
102
static const char *
103
crocus_get_device_vendor(struct pipe_screen *pscreen)
104
{
105
return "Intel";
106
}
107
108
static void
109
crocus_get_device_uuid(struct pipe_screen *pscreen, char *uuid)
110
{
111
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
112
const struct isl_device *isldev = &screen->isl_dev;
113
114
intel_uuid_compute_device_id((uint8_t *)uuid, isldev, PIPE_UUID_SIZE);
115
}
116
117
static void
118
crocus_get_driver_uuid(struct pipe_screen *pscreen, char *uuid)
119
{
120
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
121
const struct intel_device_info *devinfo = &screen->devinfo;
122
123
intel_uuid_compute_driver_id((uint8_t *)uuid, devinfo, PIPE_UUID_SIZE);
124
}
125
126
static const char *
127
crocus_get_name(struct pipe_screen *pscreen)
128
{
129
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
130
static char buf[128];
131
132
const char *name = intel_get_device_name(screen->pci_id);
133
134
if (!name)
135
name = "Intel Unknown";
136
137
snprintf(buf, sizeof(buf), "Mesa %s", name);
138
return buf;
139
}
140
141
static uint64_t
142
get_aperture_size(int fd)
143
{
144
struct drm_i915_gem_get_aperture aperture = {};
145
intel_ioctl(fd, DRM_IOCTL_I915_GEM_GET_APERTURE, &aperture);
146
return aperture.aper_size;
147
}
148
149
static int
150
crocus_get_param(struct pipe_screen *pscreen, enum pipe_cap param)
151
{
152
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
153
const struct intel_device_info *devinfo = &screen->devinfo;
154
155
switch (param) {
156
case PIPE_CAP_NPOT_TEXTURES:
157
case PIPE_CAP_ANISOTROPIC_FILTER:
158
case PIPE_CAP_POINT_SPRITE:
159
case PIPE_CAP_OCCLUSION_QUERY:
160
case PIPE_CAP_TEXTURE_SWIZZLE:
161
case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:
162
case PIPE_CAP_BLEND_EQUATION_SEPARATE:
163
case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:
164
case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:
165
case PIPE_CAP_VERTEX_SHADER_SATURATE:
166
case PIPE_CAP_PRIMITIVE_RESTART:
167
case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:
168
case PIPE_CAP_INDEP_BLEND_ENABLE:
169
case PIPE_CAP_RGB_OVERRIDE_DST_ALPHA_BLEND:
170
case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:
171
case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:
172
case PIPE_CAP_DEPTH_CLIP_DISABLE:
173
case PIPE_CAP_TGSI_INSTANCEID:
174
case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:
175
case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:
176
case PIPE_CAP_SEAMLESS_CUBE_MAP:
177
case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:
178
case PIPE_CAP_CONDITIONAL_RENDER:
179
case PIPE_CAP_TEXTURE_BARRIER:
180
case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:
181
case PIPE_CAP_START_INSTANCE:
182
case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:
183
case PIPE_CAP_FORCE_PERSAMPLE_INTERP:
184
case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:
185
case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:
186
case PIPE_CAP_TGSI_TES_LAYER_VIEWPORT:
187
case PIPE_CAP_ACCELERATED:
188
case PIPE_CAP_UMA:
189
case PIPE_CAP_CLIP_HALFZ:
190
case PIPE_CAP_TGSI_TEXCOORD:
191
case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:
192
case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:
193
case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:
194
case PIPE_CAP_TEXTURE_FLOAT_LINEAR:
195
case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:
196
case PIPE_CAP_POLYGON_OFFSET_CLAMP:
197
case PIPE_CAP_TGSI_TEX_TXF_LZ:
198
case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:
199
case PIPE_CAP_CLEAR_TEXTURE:
200
case PIPE_CAP_TGSI_VOTE:
201
case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:
202
case PIPE_CAP_TEXTURE_GATHER_SM5:
203
case PIPE_CAP_TGSI_ARRAY_COMPONENTS:
204
case PIPE_CAP_GLSL_TESS_LEVELS_AS_INPUTS:
205
case PIPE_CAP_NIR_COMPACT_ARRAYS:
206
case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:
207
case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:
208
case PIPE_CAP_INVALIDATE_BUFFER:
209
case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS:
210
case PIPE_CAP_CS_DERIVED_SYSTEM_VALUES_SUPPORTED:
211
case PIPE_CAP_FENCE_SIGNAL:
212
case PIPE_CAP_DEMOTE_TO_HELPER_INVOCATION:
213
case PIPE_CAP_GL_CLAMP:
214
return true;
215
case PIPE_CAP_INT64:
216
case PIPE_CAP_INT64_DIVMOD:
217
case PIPE_CAP_TGSI_BALLOT:
218
case PIPE_CAP_PACKED_UNIFORMS:
219
return devinfo->ver == 8;
220
case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:
221
return devinfo->ver <= 5;
222
case PIPE_CAP_TEXTURE_QUERY_LOD:
223
case PIPE_CAP_QUERY_TIME_ELAPSED:
224
return devinfo->ver >= 5;
225
case PIPE_CAP_DRAW_INDIRECT:
226
case PIPE_CAP_MULTI_DRAW_INDIRECT:
227
case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:
228
case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:
229
case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:
230
case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:
231
case PIPE_CAP_TGSI_CLOCK:
232
case PIPE_CAP_TGSI_TXQS:
233
case PIPE_CAP_COMPUTE:
234
case PIPE_CAP_SAMPLER_VIEW_TARGET:
235
case PIPE_CAP_SHADER_SAMPLES_IDENTICAL:
236
case PIPE_CAP_TGSI_PACK_HALF_FLOAT:
237
case PIPE_CAP_GL_SPIRV:
238
case PIPE_CAP_GL_SPIRV_VARIABLE_POINTERS:
239
case PIPE_CAP_COMPUTE_SHADER_DERIVATIVES:
240
case PIPE_CAP_DOUBLES:
241
case PIPE_CAP_MEMOBJ:
242
return devinfo->ver >= 7;
243
case PIPE_CAP_QUERY_BUFFER_OBJECT:
244
case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:
245
return devinfo->verx10 >= 75;
246
case PIPE_CAP_CULL_DISTANCE:
247
case PIPE_CAP_QUERY_PIPELINE_STATISTICS_SINGLE:
248
case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:
249
case PIPE_CAP_SAMPLE_SHADING:
250
case PIPE_CAP_CUBE_MAP_ARRAY:
251
case PIPE_CAP_QUERY_SO_OVERFLOW:
252
case PIPE_CAP_TEXTURE_MULTISAMPLE:
253
case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:
254
case PIPE_CAP_QUERY_TIMESTAMP:
255
case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:
256
case PIPE_CAP_INDEP_BLEND_FUNC:
257
case PIPE_CAP_TEXTURE_SHADOW_LOD:
258
case PIPE_CAP_LOAD_CONSTBUF:
259
case PIPE_CAP_DRAW_PARAMETERS:
260
case PIPE_CAP_CLEAR_SCISSORED:
261
return devinfo->ver >= 6;
262
case PIPE_CAP_FBFETCH:
263
return devinfo->verx10 >= 45 ? BRW_MAX_DRAW_BUFFERS : 0;
264
case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:
265
/* in theory CL (965gm) can do this */
266
return devinfo->verx10 >= 45 ? 1 : 0;
267
case PIPE_CAP_MAX_RENDER_TARGETS:
268
return BRW_MAX_DRAW_BUFFERS;
269
case PIPE_CAP_MAX_TEXTURE_2D_SIZE:
270
if (devinfo->ver >= 7)
271
return 16384;
272
else
273
return 8192;
274
case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:
275
if (devinfo->ver >= 7)
276
return CROCUS_MAX_MIPLEVELS; /* 16384x16384 */
277
else
278
return CROCUS_MAX_MIPLEVELS - 1; /* 8192x8192 */
279
case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:
280
return 12; /* 2048x2048 */
281
case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:
282
return (devinfo->ver >= 6) ? 4 : 0;
283
case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:
284
return devinfo->ver >= 7 ? 2048 : 512;
285
case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:
286
return BRW_MAX_SOL_BINDINGS / CROCUS_MAX_SOL_BUFFERS;
287
case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:
288
return BRW_MAX_SOL_BINDINGS;
289
case PIPE_CAP_GLSL_FEATURE_LEVEL: {
290
if (devinfo->verx10 >= 75)
291
return 460;
292
else if (devinfo->ver >= 7)
293
return 420;
294
else if (devinfo->ver >= 6)
295
return 330;
296
return 140;
297
}
298
case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:
299
return 140;
300
301
case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:
302
/* 3DSTATE_CONSTANT_XS requires the start of UBOs to be 32B aligned */
303
return 32;
304
case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:
305
return CROCUS_MAP_BUFFER_ALIGNMENT;
306
case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:
307
return devinfo->ver >= 7 ? 4 : 0;
308
case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:
309
return devinfo->ver >= 7 ? (1 << 27) : 0;
310
case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:
311
return 16; // XXX: u_screen says 256 is the minimum value...
312
case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:
313
return true;
314
case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:
315
return CROCUS_MAX_TEXTURE_BUFFER_SIZE;
316
case PIPE_CAP_MAX_VIEWPORTS:
317
return devinfo->ver >= 6 ? 16 : 1;
318
case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:
319
return devinfo->ver >= 6 ? 256 : 0;
320
case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:
321
return devinfo->ver >= 6 ? 1024 : 0;
322
case PIPE_CAP_MAX_GS_INVOCATIONS:
323
return devinfo->ver >= 7 ? 32 : 1;
324
case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:
325
if (devinfo->ver >= 7)
326
return 4;
327
else if (devinfo->ver == 6)
328
return 1;
329
else
330
return 0;
331
case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:
332
if (devinfo->ver >= 7)
333
return -32;
334
else if (devinfo->ver == 6)
335
return -8;
336
else
337
return 0;
338
case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:
339
if (devinfo->ver >= 7)
340
return 31;
341
else if (devinfo->ver == 6)
342
return 7;
343
else
344
return 0;
345
case PIPE_CAP_MAX_VERTEX_STREAMS:
346
return devinfo->ver >= 7 ? 4 : 1;
347
case PIPE_CAP_VENDOR_ID:
348
return 0x8086;
349
case PIPE_CAP_DEVICE_ID:
350
return screen->pci_id;
351
case PIPE_CAP_VIDEO_MEMORY: {
352
/* Once a batch uses more than 75% of the maximum mappable size, we
353
* assume that there's some fragmentation, and we start doing extra
354
* flushing, etc. That's the big cliff apps will care about.
355
*/
356
const unsigned gpu_mappable_megabytes =
357
(screen->aperture_bytes * 3 / 4) / (1024 * 1024);
358
359
const long system_memory_pages = sysconf(_SC_PHYS_PAGES);
360
const long system_page_size = sysconf(_SC_PAGE_SIZE);
361
362
if (system_memory_pages <= 0 || system_page_size <= 0)
363
return -1;
364
365
const uint64_t system_memory_bytes =
366
(uint64_t) system_memory_pages * (uint64_t) system_page_size;
367
368
const unsigned system_memory_megabytes =
369
(unsigned) (system_memory_bytes / (1024 * 1024));
370
371
return MIN2(system_memory_megabytes, gpu_mappable_megabytes);
372
}
373
case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:
374
case PIPE_CAP_MAX_VARYINGS:
375
return (screen->devinfo.ver >= 6) ? 32 : 16;
376
case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:
377
/* AMD_pinned_memory assumes the flexibility of using client memory
378
* for any buffer (incl. vertex buffers) which rules out the prospect
379
* of using snooped buffers, as using snooped buffers without
380
* cogniscience is likely to be detrimental to performance and require
381
* extensive checking in the driver for correctness, e.g. to prevent
382
* illegal snoop <-> snoop transfers.
383
*/
384
return devinfo->has_llc;
385
case PIPE_CAP_THROTTLE:
386
return screen->driconf.disable_throttling ? 0 : 1;
387
388
case PIPE_CAP_CONTEXT_PRIORITY_MASK:
389
return PIPE_CONTEXT_PRIORITY_LOW |
390
PIPE_CONTEXT_PRIORITY_MEDIUM |
391
PIPE_CONTEXT_PRIORITY_HIGH;
392
393
case PIPE_CAP_FRONTEND_NOOP:
394
return true;
395
// XXX: don't hardcode 00:00:02.0 PCI here
396
case PIPE_CAP_PCI_GROUP:
397
return 0;
398
case PIPE_CAP_PCI_BUS:
399
return 0;
400
case PIPE_CAP_PCI_DEVICE:
401
return 2;
402
case PIPE_CAP_PCI_FUNCTION:
403
return 0;
404
405
default:
406
return u_pipe_screen_get_param_defaults(pscreen, param);
407
}
408
return 0;
409
}
410
411
static float
412
crocus_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)
413
{
414
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
415
const struct intel_device_info *devinfo = &screen->devinfo;
416
417
switch (param) {
418
case PIPE_CAPF_MAX_LINE_WIDTH:
419
case PIPE_CAPF_MAX_LINE_WIDTH_AA:
420
if (devinfo->ver >= 6)
421
return 7.375f;
422
else
423
return 7.0f;
424
425
case PIPE_CAPF_MAX_POINT_WIDTH:
426
case PIPE_CAPF_MAX_POINT_WIDTH_AA:
427
return 255.0f;
428
429
case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:
430
return 16.0f;
431
case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:
432
return 15.0f;
433
case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:
434
case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:
435
case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:
436
return 0.0f;
437
default:
438
unreachable("unknown param");
439
}
440
}
441
442
static int
443
crocus_get_shader_param(struct pipe_screen *pscreen,
444
enum pipe_shader_type p_stage,
445
enum pipe_shader_cap param)
446
{
447
gl_shader_stage stage = stage_from_pipe(p_stage);
448
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
449
const struct intel_device_info *devinfo = &screen->devinfo;
450
451
if (devinfo->ver < 6 &&
452
p_stage != PIPE_SHADER_VERTEX &&
453
p_stage != PIPE_SHADER_FRAGMENT)
454
return 0;
455
456
if (devinfo->ver == 6 &&
457
p_stage != PIPE_SHADER_VERTEX &&
458
p_stage != PIPE_SHADER_FRAGMENT &&
459
p_stage != PIPE_SHADER_GEOMETRY)
460
return 0;
461
462
/* this is probably not totally correct.. but it's a start: */
463
switch (param) {
464
case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:
465
return stage == MESA_SHADER_FRAGMENT ? 1024 : 16384;
466
case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:
467
case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:
468
case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:
469
return stage == MESA_SHADER_FRAGMENT ? 1024 : 0;
470
471
case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:
472
return UINT_MAX;
473
474
case PIPE_SHADER_CAP_MAX_INPUTS:
475
if (stage == MESA_SHADER_VERTEX ||
476
stage == MESA_SHADER_GEOMETRY)
477
return 16; /* Gen7 vec4 geom backend */
478
return 32;
479
case PIPE_SHADER_CAP_MAX_OUTPUTS:
480
return 32;
481
case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:
482
return 16 * 1024 * sizeof(float);
483
case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:
484
return devinfo->ver >= 6 ? 16 : 1;
485
case PIPE_SHADER_CAP_MAX_TEMPS:
486
return 256; /* GL_MAX_PROGRAM_TEMPORARIES_ARB */
487
case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:
488
return 0;
489
case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:
490
case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:
491
case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:
492
case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:
493
/* Lie about these to avoid st/mesa's GLSL IR lowering of indirects,
494
* which we don't want. Our compiler backend will check brw_compiler's
495
* options and call nir_lower_indirect_derefs appropriately anyway.
496
*/
497
return true;
498
case PIPE_SHADER_CAP_SUBROUTINES:
499
return 0;
500
case PIPE_SHADER_CAP_INTEGERS:
501
return 1;
502
case PIPE_SHADER_CAP_INT64_ATOMICS:
503
case PIPE_SHADER_CAP_FP16:
504
return 0;
505
case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:
506
case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:
507
return (devinfo->verx10 >= 75) ? CROCUS_MAX_TEXTURE_SAMPLERS : 16;
508
case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:
509
if (devinfo->ver >= 7 &&
510
(p_stage == PIPE_SHADER_FRAGMENT ||
511
p_stage == PIPE_SHADER_COMPUTE))
512
return CROCUS_MAX_TEXTURE_SAMPLERS;
513
return 0;
514
case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:
515
return devinfo->ver >= 7 ? (CROCUS_MAX_ABOS + CROCUS_MAX_SSBOS) : 0;
516
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:
517
case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:
518
return 0;
519
case PIPE_SHADER_CAP_PREFERRED_IR:
520
return PIPE_SHADER_IR_NIR;
521
case PIPE_SHADER_CAP_SUPPORTED_IRS:
522
return 1 << PIPE_SHADER_IR_NIR;
523
case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:
524
case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:
525
return 1;
526
case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:
527
case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:
528
case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:
529
case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:
530
case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:
531
case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:
532
case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:
533
case PIPE_SHADER_CAP_FP16_DERIVATIVES:
534
case PIPE_SHADER_CAP_INT16:
535
case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:
536
case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:
537
return 0;
538
default:
539
unreachable("unknown shader param");
540
}
541
}
542
543
static int
544
crocus_get_compute_param(struct pipe_screen *pscreen,
545
enum pipe_shader_ir ir_type,
546
enum pipe_compute_cap param,
547
void *ret)
548
{
549
struct crocus_screen *screen = (struct crocus_screen *)pscreen;
550
const struct intel_device_info *devinfo = &screen->devinfo;
551
552
const unsigned max_threads = MIN2(64, devinfo->max_cs_threads);
553
const uint32_t max_invocations = 32 * max_threads;
554
555
if (devinfo->ver < 7)
556
return 0;
557
#define RET(x) do { \
558
if (ret) \
559
memcpy(ret, x, sizeof(x)); \
560
return sizeof(x); \
561
} while (0)
562
563
switch (param) {
564
case PIPE_COMPUTE_CAP_ADDRESS_BITS:
565
RET((uint32_t []){ 32 });
566
567
case PIPE_COMPUTE_CAP_IR_TARGET:
568
if (ret)
569
strcpy(ret, "gen");
570
return 4;
571
572
case PIPE_COMPUTE_CAP_GRID_DIMENSION:
573
RET((uint64_t []) { 3 });
574
575
case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:
576
RET(((uint64_t []) { 65535, 65535, 65535 }));
577
578
case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:
579
/* MaxComputeWorkGroupSize[0..2] */
580
RET(((uint64_t []) {max_invocations, max_invocations, max_invocations}));
581
582
case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:
583
/* MaxComputeWorkGroupInvocations */
584
RET((uint64_t []) { max_invocations });
585
586
case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:
587
/* MaxComputeSharedMemorySize */
588
RET((uint64_t []) { 64 * 1024 });
589
590
case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:
591
RET((uint32_t []) { 1 });
592
593
case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:
594
RET((uint32_t []) { BRW_SUBGROUP_SIZE });
595
596
case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:
597
RET((uint64_t []) { max_invocations });
598
599
case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:
600
case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:
601
case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:
602
case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:
603
case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:
604
case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:
605
606
// XXX: I think these are for Clover...
607
return 0;
608
609
default:
610
unreachable("unknown compute param");
611
}
612
}
613
614
static uint64_t
615
crocus_get_timestamp(struct pipe_screen *pscreen)
616
{
617
struct crocus_screen *screen = (struct crocus_screen *) pscreen;
618
const unsigned TIMESTAMP = 0x2358;
619
uint64_t result;
620
621
crocus_reg_read(screen->bufmgr, TIMESTAMP | 1, &result);
622
623
result = intel_device_info_timebase_scale(&screen->devinfo, result);
624
result &= (1ull << TIMESTAMP_BITS) - 1;
625
626
return result;
627
}
628
629
void
630
crocus_screen_destroy(struct crocus_screen *screen)
631
{
632
u_transfer_helper_destroy(screen->base.transfer_helper);
633
crocus_bufmgr_unref(screen->bufmgr);
634
disk_cache_destroy(screen->disk_cache);
635
close(screen->winsys_fd);
636
ralloc_free(screen);
637
}
638
639
static void
640
crocus_screen_unref(struct pipe_screen *pscreen)
641
{
642
crocus_pscreen_unref(pscreen);
643
}
644
645
static void
646
crocus_query_memory_info(struct pipe_screen *pscreen,
647
struct pipe_memory_info *info)
648
{
649
}
650
651
static const void *
652
crocus_get_compiler_options(struct pipe_screen *pscreen,
653
enum pipe_shader_ir ir,
654
enum pipe_shader_type pstage)
655
{
656
struct crocus_screen *screen = (struct crocus_screen *) pscreen;
657
gl_shader_stage stage = stage_from_pipe(pstage);
658
assert(ir == PIPE_SHADER_IR_NIR);
659
660
return screen->compiler->glsl_compiler_options[stage].NirOptions;
661
}
662
663
static struct disk_cache *
664
crocus_get_disk_shader_cache(struct pipe_screen *pscreen)
665
{
666
struct crocus_screen *screen = (struct crocus_screen *) pscreen;
667
return screen->disk_cache;
668
}
669
670
static const struct intel_l3_config *
671
crocus_get_default_l3_config(const struct intel_device_info *devinfo,
672
bool compute)
673
{
674
bool wants_dc_cache = true;
675
bool has_slm = compute;
676
const struct intel_l3_weights w =
677
intel_get_default_l3_weights(devinfo, wants_dc_cache, has_slm);
678
return intel_get_l3_config(devinfo, w);
679
}
680
681
static void
682
crocus_shader_debug_log(void *data, const char *fmt, ...)
683
{
684
struct pipe_debug_callback *dbg = data;
685
unsigned id = 0;
686
va_list args;
687
688
if (!dbg->debug_message)
689
return;
690
691
va_start(args, fmt);
692
dbg->debug_message(dbg->data, &id, PIPE_DEBUG_TYPE_SHADER_INFO, fmt, args);
693
va_end(args);
694
}
695
696
static void
697
crocus_shader_perf_log(void *data, const char *fmt, ...)
698
{
699
struct pipe_debug_callback *dbg = data;
700
unsigned id = 0;
701
va_list args;
702
va_start(args, fmt);
703
704
if (unlikely(INTEL_DEBUG & DEBUG_PERF)) {
705
va_list args_copy;
706
va_copy(args_copy, args);
707
vfprintf(stderr, fmt, args_copy);
708
va_end(args_copy);
709
}
710
711
if (dbg->debug_message) {
712
dbg->debug_message(dbg->data, &id, PIPE_DEBUG_TYPE_PERF_INFO, fmt, args);
713
}
714
715
va_end(args);
716
}
717
718
static bool
719
crocus_detect_swizzling(struct crocus_screen *screen)
720
{
721
/* Broadwell PRM says:
722
*
723
* "Before Gen8, there was a historical configuration control field to
724
* swizzle address bit[6] for in X/Y tiling modes. This was set in three
725
* different places: TILECTL[1:0], ARB_MODE[5:4], and
726
* DISP_ARB_CTL[14:13].
727
*
728
* For Gen8 and subsequent generations, the swizzle fields are all
729
* reserved, and the CPU's memory controller performs all address
730
* swizzling modifications."
731
*/
732
uint32_t tiling = I915_TILING_X;
733
uint32_t swizzle_mode = 0;
734
struct crocus_bo *buffer =
735
crocus_bo_alloc_tiled(screen->bufmgr, "swizzle test", 32768,
736
0, tiling, 512, 0);
737
if (buffer == NULL)
738
return false;
739
740
crocus_bo_get_tiling(buffer, &tiling, &swizzle_mode);
741
crocus_bo_unreference(buffer);
742
743
return swizzle_mode != I915_BIT_6_SWIZZLE_NONE;
744
}
745
746
struct pipe_screen *
747
crocus_screen_create(int fd, const struct pipe_screen_config *config)
748
{
749
struct crocus_screen *screen = rzalloc(NULL, struct crocus_screen);
750
if (!screen)
751
return NULL;
752
753
if (!intel_get_device_info_from_fd(fd, &screen->devinfo))
754
return NULL;
755
screen->pci_id = screen->devinfo.chipset_id;
756
screen->no_hw = screen->devinfo.no_hw;
757
758
if (screen->devinfo.ver > 8)
759
return NULL;
760
761
if (screen->devinfo.ver == 8) {
762
/* bind to cherryview or bdw if forced */
763
if (!screen->devinfo.is_cherryview &&
764
!getenv("CROCUS_GEN8"))
765
return NULL;
766
}
767
768
p_atomic_set(&screen->refcount, 1);
769
770
screen->aperture_bytes = get_aperture_size(fd);
771
772
if (getenv("INTEL_NO_HW") != NULL)
773
screen->no_hw = true;
774
775
bool bo_reuse = false;
776
int bo_reuse_mode = driQueryOptioni(config->options, "bo_reuse");
777
switch (bo_reuse_mode) {
778
case DRI_CONF_BO_REUSE_DISABLED:
779
break;
780
case DRI_CONF_BO_REUSE_ALL:
781
bo_reuse = true;
782
break;
783
}
784
785
screen->bufmgr = crocus_bufmgr_get_for_fd(&screen->devinfo, fd, bo_reuse);
786
if (!screen->bufmgr)
787
return NULL;
788
screen->fd = crocus_bufmgr_get_fd(screen->bufmgr);
789
screen->winsys_fd = fd;
790
791
screen->has_swizzling = crocus_detect_swizzling(screen);
792
brw_process_intel_debug_variable();
793
794
screen->driconf.dual_color_blend_by_location =
795
driQueryOptionb(config->options, "dual_color_blend_by_location");
796
screen->driconf.disable_throttling =
797
driQueryOptionb(config->options, "disable_throttling");
798
screen->driconf.always_flush_cache =
799
driQueryOptionb(config->options, "always_flush_cache");
800
801
screen->precompile = env_var_as_boolean("shader_precompile", true);
802
803
isl_device_init(&screen->isl_dev, &screen->devinfo,
804
screen->has_swizzling);
805
806
screen->compiler = brw_compiler_create(screen, &screen->devinfo);
807
screen->compiler->shader_debug_log = crocus_shader_debug_log;
808
screen->compiler->shader_perf_log = crocus_shader_perf_log;
809
screen->compiler->supports_pull_constants = false;
810
screen->compiler->supports_shader_constants = false;
811
screen->compiler->compact_params = false;
812
screen->compiler->constant_buffer_0_is_relative = true;
813
814
if (screen->devinfo.ver >= 7) {
815
screen->l3_config_3d = crocus_get_default_l3_config(&screen->devinfo, false);
816
screen->l3_config_cs = crocus_get_default_l3_config(&screen->devinfo, true);
817
}
818
819
crocus_disk_cache_init(screen);
820
821
slab_create_parent(&screen->transfer_pool,
822
sizeof(struct crocus_transfer), 64);
823
824
screen->subslice_total = intel_device_info_subslice_total(&screen->devinfo);
825
assert(screen->subslice_total >= 1);
826
827
struct pipe_screen *pscreen = &screen->base;
828
829
crocus_init_screen_fence_functions(pscreen);
830
crocus_init_screen_resource_functions(pscreen);
831
832
pscreen->destroy = crocus_screen_unref;
833
pscreen->get_name = crocus_get_name;
834
pscreen->get_vendor = crocus_get_vendor;
835
pscreen->get_device_vendor = crocus_get_device_vendor;
836
pscreen->get_param = crocus_get_param;
837
pscreen->get_shader_param = crocus_get_shader_param;
838
pscreen->get_compute_param = crocus_get_compute_param;
839
pscreen->get_paramf = crocus_get_paramf;
840
pscreen->get_compiler_options = crocus_get_compiler_options;
841
pscreen->get_device_uuid = crocus_get_device_uuid;
842
pscreen->get_driver_uuid = crocus_get_driver_uuid;
843
pscreen->get_disk_shader_cache = crocus_get_disk_shader_cache;
844
pscreen->is_format_supported = crocus_is_format_supported;
845
pscreen->context_create = crocus_create_context;
846
pscreen->flush_frontbuffer = crocus_flush_frontbuffer;
847
pscreen->get_timestamp = crocus_get_timestamp;
848
pscreen->query_memory_info = crocus_query_memory_info;
849
pscreen->get_driver_query_group_info = crocus_get_monitor_group_info;
850
pscreen->get_driver_query_info = crocus_get_monitor_info;
851
852
genX_call(&screen->devinfo, crocus_init_screen_state, screen);
853
genX_call(&screen->devinfo, crocus_init_screen_query, screen);
854
return pscreen;
855
}
856
857