/* Path: blob/21.2-virgl/src/gallium/drivers/llvmpipe/lp_screen.c (4570 views) */
/**************************************************************************1*2* Copyright 2008 VMware, Inc.3* All Rights Reserved.4*5* Permission is hereby granted, free of charge, to any person obtaining a6* copy of this software and associated documentation files (the7* "Software"), to deal in the Software without restriction, including8* without limitation the rights to use, copy, modify, merge, publish,9* distribute, sub license, and/or sell copies of the Software, and to10* permit persons to whom the Software is furnished to do so, subject to11* the following conditions:12*13* The above copyright notice and this permission notice (including the14* next paragraph) shall be included in all copies or substantial portions15* of the Software.16*17* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS18* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF19* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.20* IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR21* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,22* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE23* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.24*25**************************************************************************/262728#include "util/u_memory.h"29#include "util/u_math.h"30#include "util/u_cpu_detect.h"31#include "util/format/u_format.h"32#include "util/u_screen.h"33#include "util/u_string.h"34#include "util/format/u_format_s3tc.h"35#include "pipe/p_defines.h"36#include "pipe/p_screen.h"37#include "draw/draw_context.h"38#include "gallivm/lp_bld_type.h"39#include "gallivm/lp_bld_nir.h"40#include "util/disk_cache.h"41#include "util/os_misc.h"42#include "util/os_time.h"43#include "lp_texture.h"44#include "lp_fence.h"45#include "lp_jit.h"46#include "lp_screen.h"47#include "lp_context.h"48#include "lp_debug.h"49#include "lp_public.h"50#include "lp_limits.h"51#include "lp_rast.h"52#include 
"lp_cs_tpool.h"5354#include "frontend/sw_winsys.h"5556#include "nir.h"5758#ifdef DEBUG59int LP_DEBUG = 0;6061static const struct debug_named_value lp_debug_flags[] = {62{ "pipe", DEBUG_PIPE, NULL },63{ "tgsi", DEBUG_TGSI, NULL },64{ "tex", DEBUG_TEX, NULL },65{ "setup", DEBUG_SETUP, NULL },66{ "rast", DEBUG_RAST, NULL },67{ "query", DEBUG_QUERY, NULL },68{ "screen", DEBUG_SCREEN, NULL },69{ "counters", DEBUG_COUNTERS, NULL },70{ "scene", DEBUG_SCENE, NULL },71{ "fence", DEBUG_FENCE, NULL },72{ "mem", DEBUG_MEM, NULL },73{ "fs", DEBUG_FS, NULL },74{ "cs", DEBUG_CS, NULL },75{ "tgsi_ir", DEBUG_TGSI_IR, NULL },76{ "cache_stats", DEBUG_CACHE_STATS, NULL },77DEBUG_NAMED_VALUE_END78};79#endif8081int LP_PERF = 0;82static const struct debug_named_value lp_perf_flags[] = {83{ "texmem", PERF_TEX_MEM, NULL },84{ "no_mipmap", PERF_NO_MIPMAPS, NULL },85{ "no_linear", PERF_NO_LINEAR, NULL },86{ "no_mip_linear", PERF_NO_MIP_LINEAR, NULL },87{ "no_tex", PERF_NO_TEX, NULL },88{ "no_blend", PERF_NO_BLEND, NULL },89{ "no_depth", PERF_NO_DEPTH, NULL },90{ "no_alphatest", PERF_NO_ALPHATEST, NULL },91DEBUG_NAMED_VALUE_END92};939495static const char *96llvmpipe_get_vendor(struct pipe_screen *screen)97{98return "Mesa/X.org";99}100101102static const char *103llvmpipe_get_name(struct pipe_screen *screen)104{105static char buf[100];106snprintf(buf, sizeof(buf), "llvmpipe (LLVM " MESA_LLVM_VERSION_STRING ", %u bits)",107lp_native_vector_width );108return buf;109}110111112static int113llvmpipe_get_param(struct pipe_screen *screen, enum pipe_cap param)114{115switch (param) {116case PIPE_CAP_NPOT_TEXTURES:117case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:118case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:119return 1;120case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:121case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:122case PIPE_CAP_VERTEX_SHADER_SATURATE:123return 1;124case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:125return 1;126case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:127return PIPE_MAX_SO_BUFFERS;128case 
PIPE_CAP_POINT_SPRITE:129return 1;130case PIPE_CAP_MAX_RENDER_TARGETS:131return PIPE_MAX_COLOR_BUFS;132case PIPE_CAP_OCCLUSION_QUERY:133case PIPE_CAP_QUERY_TIMESTAMP:134case PIPE_CAP_QUERY_TIME_ELAPSED:135return 1;136case PIPE_CAP_QUERY_PIPELINE_STATISTICS:137return 1;138case PIPE_CAP_TEXTURE_MIRROR_CLAMP:139case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:140return 1;141case PIPE_CAP_TEXTURE_SWIZZLE:142case PIPE_CAP_TEXTURE_SHADOW_LOD:143return 1;144case PIPE_CAP_MAX_TEXTURE_2D_SIZE:145return 1 << (LP_MAX_TEXTURE_2D_LEVELS - 1);146case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:147return LP_MAX_TEXTURE_3D_LEVELS;148case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:149return LP_MAX_TEXTURE_CUBE_LEVELS;150case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:151return LP_MAX_TEXTURE_ARRAY_LAYERS;152case PIPE_CAP_BLEND_EQUATION_SEPARATE:153return 1;154case PIPE_CAP_INDEP_BLEND_ENABLE:155return 1;156case PIPE_CAP_INDEP_BLEND_FUNC:157return 1;158case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:159case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:160case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:161return 1;162case PIPE_CAP_PRIMITIVE_RESTART:163case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:164return 1;165case PIPE_CAP_DEPTH_CLIP_DISABLE:166return 1;167case PIPE_CAP_SHADER_STENCIL_EXPORT:168return 1;169case PIPE_CAP_TGSI_INSTANCEID:170case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:171case PIPE_CAP_START_INSTANCE:172case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:173return 1;174case PIPE_CAP_SEAMLESS_CUBE_MAP:175case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:176return 1;177/* this is a lie could support arbitrary large offsets */178case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:179case PIPE_CAP_MIN_TEXEL_OFFSET:180return -32;181case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:182case PIPE_CAP_MAX_TEXEL_OFFSET:183return 31;184case PIPE_CAP_CONDITIONAL_RENDER:185case PIPE_CAP_TEXTURE_BARRIER:186return 1;187case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:188case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:189return 16*4;190case 
PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:191case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:192return 1024;193case PIPE_CAP_MAX_VERTEX_STREAMS: {194struct llvmpipe_screen *lscreen = llvmpipe_screen(screen);195return lscreen->use_tgsi ? 1 : 4;196}197case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:198return 2048;199case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:200case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:201case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:202case PIPE_CAP_VERTEX_COLOR_CLAMPED:203return 1;204case PIPE_CAP_GLSL_FEATURE_LEVEL: {205struct llvmpipe_screen *lscreen = llvmpipe_screen(screen);206return lscreen->use_tgsi ? 330 : 450;207}208case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:209return 140;210case PIPE_CAP_COMPUTE:211return GALLIVM_HAVE_CORO;212case PIPE_CAP_USER_VERTEX_BUFFERS:213return 1;214case PIPE_CAP_TGSI_TEXCOORD:215case PIPE_CAP_DRAW_INDIRECT:216return 1;217218case PIPE_CAP_CUBE_MAP_ARRAY:219return 1;220case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:221return 16;222case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:223return 64;224case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:225return 1;226/* Adressing that many 64bpp texels fits in an i32 so this is a reasonable value */227case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:228return 134217728;229case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:230return 16;231case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:232return 0;233case PIPE_CAP_MAX_VIEWPORTS:234return PIPE_MAX_VIEWPORTS;235case PIPE_CAP_ENDIANNESS:236return PIPE_ENDIAN_NATIVE;237case PIPE_CAP_TGSI_TES_LAYER_VIEWPORT:238case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:239return 1;240case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:241return 1;242case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:243return 4;244case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:245return 1;246case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:247return 1;248case PIPE_CAP_TGSI_TEX_TXF_LZ:249case PIPE_CAP_SAMPLER_VIEW_TARGET:250return 1;251case PIPE_CAP_FAKE_SW_MSAA: {252struct llvmpipe_screen *lscreen = llvmpipe_screen(screen);253return 
lscreen->use_tgsi ? 1 : 0;254}255case PIPE_CAP_TEXTURE_QUERY_LOD:256case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:257case PIPE_CAP_TGSI_ARRAY_COMPONENTS:258case PIPE_CAP_DOUBLES:259case PIPE_CAP_INT64:260case PIPE_CAP_INT64_DIVMOD:261case PIPE_CAP_QUERY_SO_OVERFLOW:262case PIPE_CAP_TGSI_DIV:263return 1;264265case PIPE_CAP_VENDOR_ID:266return 0xFFFFFFFF;267case PIPE_CAP_DEVICE_ID:268return 0xFFFFFFFF;269case PIPE_CAP_ACCELERATED:270return 0;271case PIPE_CAP_VIDEO_MEMORY: {272/* XXX: Do we want to return the full amount fo system memory ? */273uint64_t system_memory;274275if (!os_get_total_physical_memory(&system_memory))276return 0;277278if (sizeof(void *) == 4)279/* Cap to 2 GB on 32 bits system. We do this because llvmpipe does280* eat application memory, which is quite limited on 32 bits. App281* shouldn't expect too much available memory. */282system_memory = MIN2(system_memory, 2048 << 20);283284return (int)(system_memory >> 20);285}286case PIPE_CAP_UMA:287return 0;288case PIPE_CAP_CLIP_HALFZ:289return 1;290case PIPE_CAP_POLYGON_OFFSET_CLAMP:291case PIPE_CAP_TEXTURE_FLOAT_LINEAR:292case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:293return 1;294case PIPE_CAP_CULL_DISTANCE:295return 1;296case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:297return 1;298case PIPE_CAP_CLEAR_TEXTURE:299return 1;300case PIPE_CAP_MAX_VARYINGS:301return 32;302case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:303return 16;304case PIPE_CAP_QUERY_BUFFER_OBJECT:305return 1;306case PIPE_CAP_DRAW_PARAMETERS:307return 1;308case PIPE_CAP_FBFETCH:309return 8;310case PIPE_CAP_FBFETCH_COHERENT:311return 0;312case PIPE_CAP_MULTI_DRAW_INDIRECT:313case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:314return 1;315case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:316case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:317return 1;318case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:319return 32;320case PIPE_CAP_RASTERIZER_SUBPIXEL_BITS:321return 8;322case PIPE_CAP_PCI_GROUP:323case PIPE_CAP_PCI_BUS:324case PIPE_CAP_PCI_DEVICE:325case 
PIPE_CAP_PCI_FUNCTION:326case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:327case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:328return 0;329330case PIPE_CAP_SHAREABLE_SHADERS:331/* Can't expose shareable shaders because the draw shaders reference the332* draw module's state, which is per-context.333*/334return 0;335336case PIPE_CAP_MAX_GS_INVOCATIONS:337return 32;338case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:339return LP_MAX_TGSI_SHADER_BUFFER_SIZE;340case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:341case PIPE_CAP_TGSI_TG4_COMPONENT_IN_SWIZZLE:342case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:343return 1;344case PIPE_CAP_SAMPLER_REDUCTION_MINMAX:345case PIPE_CAP_TGSI_TXQS:346case PIPE_CAP_TGSI_VOTE:347case PIPE_CAP_LOAD_CONSTBUF:348case PIPE_CAP_TEXTURE_MULTISAMPLE:349case PIPE_CAP_SAMPLE_SHADING:350case PIPE_CAP_GL_SPIRV:351case PIPE_CAP_POST_DEPTH_COVERAGE:352case PIPE_CAP_PACKED_UNIFORMS: {353struct llvmpipe_screen *lscreen = llvmpipe_screen(screen);354return !lscreen->use_tgsi;355}356default:357return u_pipe_screen_get_param_defaults(screen, param);358}359}360361static int362llvmpipe_get_shader_param(struct pipe_screen *screen,363enum pipe_shader_type shader,364enum pipe_shader_cap param)365{366struct llvmpipe_screen *lscreen = llvmpipe_screen(screen);367switch(shader)368{369case PIPE_SHADER_COMPUTE:370if ((lscreen->allow_cl) && param == PIPE_SHADER_CAP_SUPPORTED_IRS)371return (1 << PIPE_SHADER_IR_TGSI) | (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_NIR_SERIALIZED);372FALLTHROUGH;373case PIPE_SHADER_FRAGMENT:374if (param == PIPE_SHADER_CAP_PREFERRED_IR) {375if (lscreen->use_tgsi)376return PIPE_SHADER_IR_TGSI;377else378return PIPE_SHADER_IR_NIR;379}380381return gallivm_get_shader_param(param);382case PIPE_SHADER_TESS_CTRL:383case PIPE_SHADER_TESS_EVAL:384/* Tessellation shader needs llvm coroutines support */385if (!GALLIVM_HAVE_CORO || lscreen->use_tgsi)386return 0;387FALLTHROUGH;388case PIPE_SHADER_VERTEX:389case PIPE_SHADER_GEOMETRY:390if (param == 
PIPE_SHADER_CAP_PREFERRED_IR) {391if (lscreen->use_tgsi)392return PIPE_SHADER_IR_TGSI;393else394return PIPE_SHADER_IR_NIR;395}396397switch (param) {398case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:399/* At this time, the draw module and llvmpipe driver only400* support vertex shader texture lookups when LLVM is enabled in401* the draw module.402*/403if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))404return PIPE_MAX_SAMPLERS;405else406return 0;407case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:408if (debug_get_bool_option("DRAW_USE_LLVM", TRUE))409return PIPE_MAX_SHADER_SAMPLER_VIEWS;410else411return 0;412default:413return draw_get_shader_param(shader, param);414}415default:416return 0;417}418}419420static float421llvmpipe_get_paramf(struct pipe_screen *screen, enum pipe_capf param)422{423switch (param) {424case PIPE_CAPF_MAX_LINE_WIDTH:425FALLTHROUGH;426case PIPE_CAPF_MAX_LINE_WIDTH_AA:427return 255.0; /* arbitrary */428case PIPE_CAPF_MAX_POINT_WIDTH:429FALLTHROUGH;430case PIPE_CAPF_MAX_POINT_WIDTH_AA:431return LP_MAX_POINT_WIDTH; /* arbitrary */432case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:433return 16.0; /* not actually signficant at this time */434case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:435return 16.0; /* arbitrary */436case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:437return 0.0;438case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:439return 0.0;440case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:441return 0.0;442}443/* should only get here on unhandled cases */444debug_printf("Unexpected PIPE_CAP %d query\n", param);445return 0.0;446}447448static int449llvmpipe_get_compute_param(struct pipe_screen *_screen,450enum pipe_shader_ir ir_type,451enum pipe_compute_cap param,452void *ret)453{454switch (param) {455case PIPE_COMPUTE_CAP_IR_TARGET:456return 0;457case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:458if (ret) {459uint64_t *grid_size = ret;460grid_size[0] = 65535;461grid_size[1] = 65535;462grid_size[2] = 65535;463}464return 3 * sizeof(uint64_t) ;465case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:466if 
(ret) {467uint64_t *block_size = ret;468block_size[0] = 1024;469block_size[1] = 1024;470block_size[2] = 1024;471}472return 3 * sizeof(uint64_t);473case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:474if (ret) {475uint64_t *max_threads_per_block = ret;476*max_threads_per_block = 1024;477}478return sizeof(uint64_t);479case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE:480if (ret) {481uint64_t *max_local_size = ret;482*max_local_size = 32768;483}484return sizeof(uint64_t);485case PIPE_COMPUTE_CAP_GRID_DIMENSION:486if (ret) {487uint32_t *grid_dim = ret;488*grid_dim = 3;489}490return sizeof(uint32_t);491case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE:492if (ret) {493uint64_t *max_global_size = ret;494*max_global_size = (1ULL << 31);495}496return sizeof(uint64_t);497case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:498if (ret) {499uint64_t *max_mem_alloc_size = ret;500*max_mem_alloc_size = (1ULL << 31);501}502return sizeof(uint64_t);503case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE:504if (ret) {505uint64_t *max_private = ret;506*max_private = (1UL << 31);507}508return sizeof(uint64_t);509case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE:510if (ret) {511uint64_t *max_input = ret;512*max_input = 4096;513}514return sizeof(uint64_t);515case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:516if (ret) {517uint32_t *images = ret;518*images = LP_MAX_TGSI_SHADER_IMAGES;519}520return sizeof(uint32_t);521case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:522return 0;523case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:524if (ret) {525uint32_t *subgroup_size = ret;526*subgroup_size = 32;527}528return sizeof(uint32_t);529case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:530if (ret) {531uint32_t *max_compute_units = ret;532*max_compute_units = 8;533}534return sizeof(uint32_t);535case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:536if (ret) {537uint32_t *max_clock_freq = ret;538*max_clock_freq = 300;539}540return sizeof(uint32_t);541case PIPE_COMPUTE_CAP_ADDRESS_BITS:542if (ret) {543uint32_t *address_bits = ret;544*address_bits = 64;545}546return sizeof(uint32_t);547}548return 
0;549}550551static const struct nir_shader_compiler_options gallivm_nir_options = {552.lower_scmp = true,553.lower_flrp32 = true,554.lower_flrp64 = true,555.lower_fsat = true,556.lower_bitfield_insert_to_shifts = true,557.lower_bitfield_extract_to_shifts = true,558.lower_fdot = true,559.lower_fdph = true,560.lower_ffma16 = true,561.lower_ffma32 = true,562.lower_ffma64 = true,563.lower_fmod = true,564.lower_hadd = true,565.lower_add_sat = true,566.lower_ldexp = true,567.lower_pack_snorm_2x16 = true,568.lower_pack_snorm_4x8 = true,569.lower_pack_unorm_2x16 = true,570.lower_pack_unorm_4x8 = true,571.lower_pack_half_2x16 = true,572.lower_pack_split = true,573.lower_unpack_snorm_2x16 = true,574.lower_unpack_snorm_4x8 = true,575.lower_unpack_unorm_2x16 = true,576.lower_unpack_unorm_4x8 = true,577.lower_unpack_half_2x16 = true,578.lower_extract_byte = true,579.lower_extract_word = true,580.lower_insert_byte = true,581.lower_insert_word = true,582.lower_rotate = true,583.lower_uadd_carry = true,584.lower_usub_borrow = true,585.lower_mul_2x32_64 = true,586.lower_ifind_msb = true,587.max_unroll_iterations = 32,588.use_interpolated_input_intrinsics = true,589.lower_to_scalar = true,590.lower_cs_local_index_from_id = true,591.lower_uniforms_to_ubo = true,592.lower_vector_cmp = true,593.lower_device_index_to_zero = true,594.support_16bit_alu = true,595};596597static void598llvmpipe_finalize_nir(struct pipe_screen *screen,599void *nirptr,600bool optimize)601{602struct nir_shader *nir = (struct nir_shader *)nirptr;603lp_build_opt_nir(nir);604}605606static inline const void *607llvmpipe_get_compiler_options(struct pipe_screen *screen,608enum pipe_shader_ir ir,609enum pipe_shader_type shader)610{611assert(ir == PIPE_SHADER_IR_NIR);612return &gallivm_nir_options;613}614615/**616* Query format support for creating a texture, drawing surface, etc.617* \param format the format to test618* \param type one of PIPE_TEXTURE, PIPE_SURFACE619*/620static bool621llvmpipe_is_format_supported( 
struct pipe_screen *_screen,622enum pipe_format format,623enum pipe_texture_target target,624unsigned sample_count,625unsigned storage_sample_count,626unsigned bind)627{628struct llvmpipe_screen *screen = llvmpipe_screen(_screen);629struct sw_winsys *winsys = screen->winsys;630const struct util_format_description *format_desc;631632format_desc = util_format_description(format);633if (!format_desc)634return false;635636assert(target == PIPE_BUFFER ||637target == PIPE_TEXTURE_1D ||638target == PIPE_TEXTURE_1D_ARRAY ||639target == PIPE_TEXTURE_2D ||640target == PIPE_TEXTURE_2D_ARRAY ||641target == PIPE_TEXTURE_RECT ||642target == PIPE_TEXTURE_3D ||643target == PIPE_TEXTURE_CUBE ||644target == PIPE_TEXTURE_CUBE_ARRAY);645646if (sample_count != 0 && sample_count != 1 && sample_count != 4)647return false;648649if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))650return false;651652if (bind & (PIPE_BIND_RENDER_TARGET | PIPE_BIND_SHADER_IMAGE)) {653if (format_desc->colorspace == UTIL_FORMAT_COLORSPACE_SRGB) {654/* this is a lie actually other formats COULD exist where we would fail */655if (format_desc->nr_channels < 3)656return false;657}658else if (format_desc->colorspace != UTIL_FORMAT_COLORSPACE_RGB)659return false;660661if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN &&662format != PIPE_FORMAT_R11G11B10_FLOAT)663return false;664665assert(format_desc->block.width == 1);666assert(format_desc->block.height == 1);667668if (format_desc->is_mixed)669return false;670671if (!format_desc->is_array && !format_desc->is_bitmask &&672format != PIPE_FORMAT_R11G11B10_FLOAT)673return false;674}675676if (bind & PIPE_BIND_SHADER_IMAGE) {677switch (format) {678case PIPE_FORMAT_R32G32B32A32_FLOAT:679case PIPE_FORMAT_R16G16B16A16_FLOAT:680case PIPE_FORMAT_R32G32_FLOAT:681case PIPE_FORMAT_R16G16_FLOAT:682case PIPE_FORMAT_R11G11B10_FLOAT:683case PIPE_FORMAT_R32_FLOAT:684case PIPE_FORMAT_R16_FLOAT:685case PIPE_FORMAT_R32G32B32A32_UINT:686case 
PIPE_FORMAT_R16G16B16A16_UINT:687case PIPE_FORMAT_R10G10B10A2_UINT:688case PIPE_FORMAT_R8G8B8A8_UINT:689case PIPE_FORMAT_R32G32_UINT:690case PIPE_FORMAT_R16G16_UINT:691case PIPE_FORMAT_R8G8_UINT:692case PIPE_FORMAT_R32_UINT:693case PIPE_FORMAT_R16_UINT:694case PIPE_FORMAT_R8_UINT:695case PIPE_FORMAT_R32G32B32A32_SINT:696case PIPE_FORMAT_R16G16B16A16_SINT:697case PIPE_FORMAT_R8G8B8A8_SINT:698case PIPE_FORMAT_R32G32_SINT:699case PIPE_FORMAT_R16G16_SINT:700case PIPE_FORMAT_R8G8_SINT:701case PIPE_FORMAT_R32_SINT:702case PIPE_FORMAT_R16_SINT:703case PIPE_FORMAT_R8_SINT:704case PIPE_FORMAT_R16G16B16A16_UNORM:705case PIPE_FORMAT_R10G10B10A2_UNORM:706case PIPE_FORMAT_R8G8B8A8_UNORM:707case PIPE_FORMAT_R16G16_UNORM:708case PIPE_FORMAT_R8G8_UNORM:709case PIPE_FORMAT_R16_UNORM:710case PIPE_FORMAT_R8_UNORM:711case PIPE_FORMAT_R16G16B16A16_SNORM:712case PIPE_FORMAT_R8G8B8A8_SNORM:713case PIPE_FORMAT_R16G16_SNORM:714case PIPE_FORMAT_R8G8_SNORM:715case PIPE_FORMAT_R16_SNORM:716case PIPE_FORMAT_R8_SNORM:717break;718719default:720return false;721}722}723724if ((bind & (PIPE_BIND_RENDER_TARGET | PIPE_BIND_SAMPLER_VIEW)) &&725((bind & PIPE_BIND_DISPLAY_TARGET) == 0)) {726/* Disable all 3-channel formats, where channel size != 32 bits.727* In some cases we run into crashes (in generate_unswizzled_blend()),728* for 3-channel RGB16 variants, there was an apparent LLVM bug.729* In any case, disabling the shallower 3-channel formats avoids a730* number of issues with GL_ARB_copy_image support.731*/732if (format_desc->is_array &&733format_desc->nr_channels == 3 &&734format_desc->block.bits != 96) {735return false;736}737}738739if (!(bind & PIPE_BIND_VERTEX_BUFFER) &&740util_format_is_scaled(format))741return false;742743if (bind & PIPE_BIND_DISPLAY_TARGET) {744if(!winsys->is_displaytarget_format_supported(winsys, bind, format))745return false;746}747748if (bind & PIPE_BIND_DEPTH_STENCIL) {749if (format_desc->layout != UTIL_FORMAT_LAYOUT_PLAIN)750return false;751752if 
(format_desc->colorspace != UTIL_FORMAT_COLORSPACE_ZS)753return false;754}755756if (format_desc->layout == UTIL_FORMAT_LAYOUT_ASTC ||757format_desc->layout == UTIL_FORMAT_LAYOUT_ATC) {758/* Software decoding is not hooked up. */759return false;760}761762if (format_desc->layout == UTIL_FORMAT_LAYOUT_ETC &&763format != PIPE_FORMAT_ETC1_RGB8)764return false;765766/*767* Everything can be supported by u_format768* (those without fetch_rgba_float might be not but shouldn't hit that)769*/770771return true;772}773774775776777static void778llvmpipe_flush_frontbuffer(struct pipe_screen *_screen,779struct pipe_context *_pipe,780struct pipe_resource *resource,781unsigned level, unsigned layer,782void *context_private,783struct pipe_box *sub_box)784{785struct llvmpipe_screen *screen = llvmpipe_screen(_screen);786struct sw_winsys *winsys = screen->winsys;787struct llvmpipe_resource *texture = llvmpipe_resource(resource);788789assert(texture->dt);790if (texture->dt)791winsys->displaytarget_display(winsys, texture->dt, context_private, sub_box);792}793794static void795llvmpipe_destroy_screen( struct pipe_screen *_screen )796{797struct llvmpipe_screen *screen = llvmpipe_screen(_screen);798struct sw_winsys *winsys = screen->winsys;799800if (screen->cs_tpool)801lp_cs_tpool_destroy(screen->cs_tpool);802803if (screen->rast)804lp_rast_destroy(screen->rast);805806lp_jit_screen_cleanup(screen);807808if (LP_DEBUG & DEBUG_CACHE_STATS)809printf("disk shader cache: hits = %u, misses = %u\n", screen->num_disk_shader_cache_hits,810screen->num_disk_shader_cache_misses);811disk_cache_destroy(screen->disk_shader_cache);812if(winsys->destroy)813winsys->destroy(winsys);814815glsl_type_singleton_decref();816817mtx_destroy(&screen->rast_mutex);818mtx_destroy(&screen->cs_mutex);819FREE(screen);820}821822823824825/**826* Fence reference counting.827*/828static void829llvmpipe_fence_reference(struct pipe_screen *screen,830struct pipe_fence_handle **ptr,831struct pipe_fence_handle *fence)832{833struct 
lp_fence **old = (struct lp_fence **) ptr;834struct lp_fence *f = (struct lp_fence *) fence;835836lp_fence_reference(old, f);837}838839840/**841* Wait for the fence to finish.842*/843static bool844llvmpipe_fence_finish(struct pipe_screen *screen,845struct pipe_context *ctx,846struct pipe_fence_handle *fence_handle,847uint64_t timeout)848{849struct lp_fence *f = (struct lp_fence *) fence_handle;850851if (!timeout)852return lp_fence_signalled(f);853854if (!lp_fence_signalled(f)) {855if (timeout != PIPE_TIMEOUT_INFINITE)856return lp_fence_timedwait(f, timeout);857858lp_fence_wait(f);859}860return true;861}862863static uint64_t864llvmpipe_get_timestamp(struct pipe_screen *_screen)865{866return os_time_get_nano();867}868869static void update_cache_sha1_cpu(struct mesa_sha1 *ctx)870{871const struct util_cpu_caps_t *cpu_caps = util_get_cpu_caps();872/*873* Don't need the cpu cache affinity stuff. The rest874* is contained in first 5 dwords.875*/876STATIC_ASSERT(offsetof(struct util_cpu_caps_t, num_L3_caches) == 5 * sizeof(uint32_t));877_mesa_sha1_update(ctx, cpu_caps, 5 * sizeof(uint32_t));878}879880static void lp_disk_cache_create(struct llvmpipe_screen *screen)881{882struct mesa_sha1 ctx;883unsigned gallivm_perf = gallivm_get_perf_flags();884unsigned char sha1[20];885char cache_id[20 * 2 + 1];886_mesa_sha1_init(&ctx);887888if (!disk_cache_get_function_identifier(lp_disk_cache_create, &ctx) ||889!disk_cache_get_function_identifier(LLVMLinkInMCJIT, &ctx))890return;891892_mesa_sha1_update(&ctx, &gallivm_perf, sizeof(gallivm_perf));893update_cache_sha1_cpu(&ctx);894_mesa_sha1_final(&ctx, sha1);895disk_cache_format_hex_id(cache_id, sha1, 20 * 2);896897screen->disk_shader_cache = disk_cache_create("llvmpipe", cache_id, 0);898}899900static struct disk_cache *lp_get_disk_shader_cache(struct pipe_screen *_screen)901{902struct llvmpipe_screen *screen = llvmpipe_screen(_screen);903904return screen->disk_shader_cache;905}906907void lp_disk_cache_find_shader(struct llvmpipe_screen 
*screen,908struct lp_cached_code *cache,909unsigned char ir_sha1_cache_key[20])910{911unsigned char sha1[CACHE_KEY_SIZE];912913if (!screen->disk_shader_cache)914return;915disk_cache_compute_key(screen->disk_shader_cache, ir_sha1_cache_key, 20, sha1);916917size_t binary_size;918uint8_t *buffer = disk_cache_get(screen->disk_shader_cache, sha1, &binary_size);919if (!buffer) {920cache->data_size = 0;921p_atomic_inc(&screen->num_disk_shader_cache_misses);922return;923}924cache->data_size = binary_size;925cache->data = buffer;926p_atomic_inc(&screen->num_disk_shader_cache_hits);927}928929void lp_disk_cache_insert_shader(struct llvmpipe_screen *screen,930struct lp_cached_code *cache,931unsigned char ir_sha1_cache_key[20])932{933unsigned char sha1[CACHE_KEY_SIZE];934935if (!screen->disk_shader_cache || !cache->data_size || cache->dont_cache)936return;937disk_cache_compute_key(screen->disk_shader_cache, ir_sha1_cache_key, 20, sha1);938disk_cache_put(screen->disk_shader_cache, sha1, cache->data, cache->data_size, NULL);939}940941bool942llvmpipe_screen_late_init(struct llvmpipe_screen *screen)943{944bool ret = true;945mtx_lock(&screen->late_mutex);946947if (screen->late_init_done)948goto out;949950screen->rast = lp_rast_create(screen->num_threads);951if (!screen->rast) {952ret = false;953goto out;954}955956screen->cs_tpool = lp_cs_tpool_create(screen->num_threads);957if (!screen->cs_tpool) {958lp_rast_destroy(screen->rast);959ret = false;960goto out;961}962963lp_disk_cache_create(screen);964screen->late_init_done = true;965out:966mtx_unlock(&screen->late_mutex);967return ret;968}969970/**971* Create a new pipe_screen object972* Note: we're not presently subclassing pipe_screen (no llvmpipe_screen).973*/974struct pipe_screen *975llvmpipe_create_screen(struct sw_winsys *winsys)976{977struct llvmpipe_screen *screen;978979util_cpu_detect();980981glsl_type_singleton_init_or_ref();982983#ifdef DEBUG984LP_DEBUG = debug_get_flags_option("LP_DEBUG", lp_debug_flags, 0 
);985#endif986987LP_PERF = debug_get_flags_option("LP_PERF", lp_perf_flags, 0 );988989screen = CALLOC_STRUCT(llvmpipe_screen);990if (!screen)991return NULL;992993if (!lp_jit_screen_init(screen)) {994FREE(screen);995return NULL;996}997998screen->winsys = winsys;9991000screen->base.destroy = llvmpipe_destroy_screen;10011002screen->base.get_name = llvmpipe_get_name;1003screen->base.get_vendor = llvmpipe_get_vendor;1004screen->base.get_device_vendor = llvmpipe_get_vendor; // TODO should be the CPU vendor1005screen->base.get_param = llvmpipe_get_param;1006screen->base.get_shader_param = llvmpipe_get_shader_param;1007screen->base.get_compute_param = llvmpipe_get_compute_param;1008screen->base.get_paramf = llvmpipe_get_paramf;1009screen->base.get_compiler_options = llvmpipe_get_compiler_options;1010screen->base.is_format_supported = llvmpipe_is_format_supported;10111012screen->base.context_create = llvmpipe_create_context;1013screen->base.flush_frontbuffer = llvmpipe_flush_frontbuffer;1014screen->base.fence_reference = llvmpipe_fence_reference;1015screen->base.fence_finish = llvmpipe_fence_finish;10161017screen->base.get_timestamp = llvmpipe_get_timestamp;10181019screen->base.finalize_nir = llvmpipe_finalize_nir;10201021screen->base.get_disk_shader_cache = lp_get_disk_shader_cache;1022llvmpipe_init_screen_resource_funcs(&screen->base);10231024screen->allow_cl = !!getenv("LP_CL");1025screen->use_tgsi = (LP_DEBUG & DEBUG_TGSI_IR);1026screen->num_threads = util_get_cpu_caps()->nr_cpus > 1 ? util_get_cpu_caps()->nr_cpus : 0;1027#ifdef EMBEDDED_DEVICE1028screen->num_threads = 0;1029#endif1030screen->num_threads = debug_get_num_option("LP_NUM_THREADS", screen->num_threads);1031screen->num_threads = MIN2(screen->num_threads, LP_MAX_THREADS);10321033(void) mtx_init(&screen->cs_mutex, mtx_plain);1034(void) mtx_init(&screen->rast_mutex, mtx_plain);10351036(void) mtx_init(&screen->late_mutex, mtx_plain);10371038return &screen->base;1039}104010411042