Path: blob/21.2-virgl/src/gallium/drivers/i915/i915_screen.c
4570 views
/**************************************************************************1*2* Copyright 2008 VMware, Inc.3* All Rights Reserved.4*5* Permission is hereby granted, free of charge, to any person obtaining a6* copy of this software and associated documentation files (the7* "Software"), to deal in the Software without restriction, including8* without limitation the rights to use, copy, modify, merge, publish,9* distribute, sub license, and/or sell copies of the Software, and to10* permit persons to whom the Software is furnished to do so, subject to11* the following conditions:12*13* The above copyright notice and this permission notice (including the14* next paragraph) shall be included in all copies or substantial portions15* of the Software.16*17* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS18* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF19* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.20* IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR21* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,22* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE23* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.24*25**************************************************************************/2627#include "compiler/nir/nir.h"28#include "draw/draw_context.h"29#include "util/format/u_format.h"30#include "util/format/u_format_s3tc.h"31#include "util/os_misc.h"32#include "util/u_inlines.h"33#include "util/u_memory.h"34#include "util/u_screen.h"35#include "util/u_string.h"3637#include "i915_context.h"38#include "i915_debug.h"39#include "i915_public.h"40#include "i915_reg.h"41#include "i915_resource.h"42#include "i915_screen.h"43#include "i915_winsys.h"4445/*46* Probe functions47*/4849static const char *50i915_get_vendor(struct pipe_screen *screen)51{52return "Mesa Project";53}5455static const char *56i915_get_device_vendor(struct pipe_screen *screen)57{58return "Intel";59}6061static const char *62i915_get_name(struct pipe_screen *screen)63{64static char buffer[128];65const char *chipset;6667switch (i915_screen(screen)->iws->pci_id) {68case PCI_CHIP_I915_G:69chipset = "915G";70break;71case PCI_CHIP_I915_GM:72chipset = "915GM";73break;74case PCI_CHIP_I945_G:75chipset = "945G";76break;77case PCI_CHIP_I945_GM:78chipset = "945GM";79break;80case PCI_CHIP_I945_GME:81chipset = "945GME";82break;83case PCI_CHIP_G33_G:84chipset = "G33";85break;86case PCI_CHIP_Q35_G:87chipset = "Q35";88break;89case PCI_CHIP_Q33_G:90chipset = "Q33";91break;92case PCI_CHIP_PINEVIEW_G:93chipset = "Pineview G";94break;95case PCI_CHIP_PINEVIEW_M:96chipset = "Pineview M";97break;98default:99chipset = "unknown";100break;101}102103snprintf(buffer, sizeof(buffer), "i915 (chipset: %s)", chipset);104return buffer;105}106107static const nir_shader_compiler_options i915_compiler_options = {108.fuse_ffma32 = true,109.lower_bitops = true, /* required for !CAP_INTEGERS nir_to_tgsi */110.lower_extract_byte = true,111.lower_extract_word = true,112.lower_fdiv = true,113.lower_fdph = true,114.lower_flrp32 = true,115.lower_fmod = true,116.lower_rotate = true,117.lower_uniforms_to_ubo = true,118.lower_vector_cmp = true,119.use_interpolated_input_intrinsics = true,120};121122static const struct nir_shader_compiler_options gallivm_nir_options = {123.lower_bitops = true, /* required for !CAP_INTEGERS nir_to_tgsi */124.lower_scmp = true,125.lower_flrp32 = true,126.lower_flrp64 = true,127.lower_fsat = true,128.lower_bitfield_insert_to_shifts = true,129.lower_bitfield_extract_to_shifts = true,130.lower_fdph = true,131.lower_ffma16 = true,132.lower_ffma32 = true,133.lower_ffma64 = true,134.lower_fmod = true,135.lower_hadd = true,136.lower_add_sat = true,137.lower_ldexp = true,138.lower_pack_snorm_2x16 = true,139.lower_pack_snorm_4x8 = true,140.lower_pack_unorm_2x16 = true,141.lower_pack_unorm_4x8 = true,142.lower_pack_half_2x16 = true,143.lower_pack_split = true,144.lower_unpack_snorm_2x16 = true,145.lower_unpack_snorm_4x8 = true,146.lower_unpack_unorm_2x16 = true,147.lower_unpack_unorm_4x8 = true,148.lower_unpack_half_2x16 = true,149.lower_extract_byte = true,150.lower_extract_word = true,151.lower_rotate = true,152.lower_uadd_carry = true,153.lower_usub_borrow = true,154.lower_mul_2x32_64 = true,155.lower_ifind_msb = true,156.max_unroll_iterations = 32,157.use_interpolated_input_intrinsics = true,158.lower_cs_local_index_from_id = true,159.lower_uniforms_to_ubo = true,160.lower_vector_cmp = true,161.lower_device_index_to_zero = true,162/* .support_16bit_alu = true, */163};164165static const void *166i915_get_compiler_options(struct pipe_screen *pscreen, enum pipe_shader_ir ir,167enum pipe_shader_type shader)168{169assert(ir == PIPE_SHADER_IR_NIR);170if (shader == PIPE_SHADER_FRAGMENT)171return &i915_compiler_options;172else173return &gallivm_nir_options;174}175176static int177i915_get_shader_param(struct pipe_screen *screen, enum pipe_shader_type shader,178enum pipe_shader_cap cap)179{180switch (cap) {181case PIPE_SHADER_CAP_PREFERRED_IR:182return PIPE_SHADER_IR_NIR;183case PIPE_SHADER_CAP_SUPPORTED_IRS:184return (1 << PIPE_SHADER_IR_NIR) | (1 << PIPE_SHADER_IR_TGSI);185186case PIPE_SHADER_CAP_INTEGERS:187/* mesa/st requires that this cap is the same across stages, and the FS188* can't do ints.189*/190return 0;191192case PIPE_SHADER_CAP_INT16:193return 0;194195case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:196/* While draw could normally handle this for the VS, the NIR lowering197* to regs can't handle our non-native-integers, so we have to lower to198* if ladders.199*/200return 0;201202default:203break;204}205206switch (shader) {207case PIPE_SHADER_VERTEX:208switch (cap) {209case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:210case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:211return 0;212case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:213case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:214return 0;215default:216return draw_get_shader_param(shader, cap);217}218case PIPE_SHADER_FRAGMENT:219/* XXX: some of these are just shader model 2.0 values, fix this! */220switch (cap) {221case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:222return I915_MAX_ALU_INSN + I915_MAX_TEX_INSN;223case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:224return I915_MAX_ALU_INSN;225case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:226return I915_MAX_TEX_INSN;227case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:228return 8;229case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:230return 0;231case PIPE_SHADER_CAP_MAX_INPUTS:232return 10;233case PIPE_SHADER_CAP_MAX_OUTPUTS:234return 1;235case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:236return 32 * sizeof(float[4]);237case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:238return 1;239case PIPE_SHADER_CAP_MAX_TEMPS:240return 12; /* XXX: 12 -> 32 ? */241case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:242case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:243return 0;244case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:245case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:246case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:247case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:248case PIPE_SHADER_CAP_SUBROUTINES:249return 0;250case PIPE_SHADER_CAP_INT64_ATOMICS:251case PIPE_SHADER_CAP_FP16:252case PIPE_SHADER_CAP_FP16_DERIVATIVES:253case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:254case PIPE_SHADER_CAP_INT16:255case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:256return 0;257case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:258case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:259return I915_TEX_UNITS;260case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:261case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:262case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:263case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:264case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:265case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:266case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:267case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:268case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:269case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:270case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:271return 0;272273case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:274return 32;275default:276debug_printf("%s: Unknown cap %u.\n", __FUNCTION__, cap);277return 0;278}279break;280default:281return 0;282}283}284285static int286i915_get_param(struct pipe_screen *screen, enum pipe_cap cap)287{288struct i915_screen *is = i915_screen(screen);289290switch (cap) {291/* Supported features (boolean caps). */292case PIPE_CAP_ANISOTROPIC_FILTER:293case PIPE_CAP_NPOT_TEXTURES:294case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:295case PIPE_CAP_POINT_SPRITE:296case PIPE_CAP_PRIMITIVE_RESTART: /* draw module */297case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:298case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:299case PIPE_CAP_BLEND_EQUATION_SEPARATE:300case PIPE_CAP_TGSI_INSTANCEID:301case PIPE_CAP_VERTEX_COLOR_CLAMPED:302case PIPE_CAP_USER_VERTEX_BUFFERS:303case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:304return 1;305306case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:307case PIPE_CAP_PCI_GROUP:308case PIPE_CAP_PCI_BUS:309case PIPE_CAP_PCI_DEVICE:310case PIPE_CAP_PCI_FUNCTION:311return 0;312313case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:314case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:315return 0;316317case PIPE_CAP_SHAREABLE_SHADERS:318/* Can't expose shareable shaders because the draw shaders reference the319* draw module's state, which is per-context.320*/321return 0;322323case PIPE_CAP_MAX_GS_INVOCATIONS:324return 32;325326case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:327return 1 << 27;328329case PIPE_CAP_MAX_VIEWPORTS:330return 1;331332case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:333return 64;334335case PIPE_CAP_GLSL_FEATURE_LEVEL:336case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:337return 120;338339case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:340return 16;341342/* Features we can lie about (boolean caps). */343case PIPE_CAP_OCCLUSION_QUERY:344return is->debug.lie ? 1 : 0;345346/* Texturing. */347case PIPE_CAP_MAX_TEXTURE_2D_SIZE:348return 1 << (I915_MAX_TEXTURE_2D_LEVELS - 1);349case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:350return I915_MAX_TEXTURE_3D_LEVELS;351case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:352return 1 << (I915_MAX_TEXTURE_2D_LEVELS - 1);353354/* Render targets. */355case PIPE_CAP_MAX_RENDER_TARGETS:356return 1;357358case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:359return 2048;360361/* Fragment coordinate conventions. */362case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:363case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:364return 1;365case PIPE_CAP_ENDIANNESS:366return PIPE_ENDIAN_LITTLE;367case PIPE_CAP_MAX_VARYINGS:368return 10;369370case PIPE_CAP_NIR_IMAGES_AS_DEREF:371return 0;372373case PIPE_CAP_VENDOR_ID:374return 0x8086;375case PIPE_CAP_DEVICE_ID:376return is->iws->pci_id;377case PIPE_CAP_ACCELERATED:378return 1;379case PIPE_CAP_VIDEO_MEMORY: {380/* Once a batch uses more than 75% of the maximum mappable size, we381* assume that there's some fragmentation, and we start doing extra382* flushing, etc. That's the big cliff apps will care about.383*/384const int gpu_mappable_megabytes =385is->iws->aperture_size(is->iws) * 3 / 4;386uint64_t system_memory;387388if (!os_get_total_physical_memory(&system_memory))389return 0;390391return MIN2(gpu_mappable_megabytes, (int)(system_memory >> 20));392}393case PIPE_CAP_UMA:394return 1;395396default:397return u_pipe_screen_get_param_defaults(screen, cap);398}399}400401static float402i915_get_paramf(struct pipe_screen *screen, enum pipe_capf cap)403{404switch (cap) {405case PIPE_CAPF_MAX_LINE_WIDTH:406FALLTHROUGH;407case PIPE_CAPF_MAX_LINE_WIDTH_AA:408return 7.5;409410case PIPE_CAPF_MAX_POINT_WIDTH:411FALLTHROUGH;412case PIPE_CAPF_MAX_POINT_WIDTH_AA:413return 255.0;414415case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:416return 4.0;417418case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:419return 16.0;420421case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:422FALLTHROUGH;423case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:424FALLTHROUGH;425case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:426return 0.0f;427428default:429debug_printf("%s: Unknown cap %u.\n", __FUNCTION__, cap);430return 0;431}432}433434bool435i915_is_format_supported(struct pipe_screen *screen, enum pipe_format format,436enum pipe_texture_target target, unsigned sample_count,437unsigned storage_sample_count, unsigned tex_usage)438{439static const enum pipe_format tex_supported[] = {440PIPE_FORMAT_B8G8R8A8_UNORM, PIPE_FORMAT_B8G8R8A8_SRGB,441PIPE_FORMAT_B8G8R8X8_UNORM, PIPE_FORMAT_R8G8B8A8_UNORM,442PIPE_FORMAT_R8G8B8X8_UNORM, PIPE_FORMAT_B4G4R4A4_UNORM,443PIPE_FORMAT_B5G6R5_UNORM, PIPE_FORMAT_B5G5R5A1_UNORM,444PIPE_FORMAT_B10G10R10A2_UNORM, PIPE_FORMAT_L8_UNORM, PIPE_FORMAT_A8_UNORM,445PIPE_FORMAT_I8_UNORM, PIPE_FORMAT_L8A8_UNORM, PIPE_FORMAT_UYVY,446PIPE_FORMAT_YUYV,447/* XXX why not?448PIPE_FORMAT_Z16_UNORM, */449PIPE_FORMAT_DXT1_RGB, PIPE_FORMAT_DXT1_RGBA, PIPE_FORMAT_DXT3_RGBA,450PIPE_FORMAT_DXT5_RGBA, PIPE_FORMAT_Z24X8_UNORM,451PIPE_FORMAT_Z24_UNORM_S8_UINT, PIPE_FORMAT_NONE /* list terminator */452};453static const enum pipe_format render_supported[] = {454PIPE_FORMAT_B8G8R8A8_UNORM, PIPE_FORMAT_B8G8R8X8_UNORM,455PIPE_FORMAT_R8G8B8A8_UNORM, PIPE_FORMAT_R8G8B8X8_UNORM,456PIPE_FORMAT_B5G6R5_UNORM, PIPE_FORMAT_B5G5R5A1_UNORM,457PIPE_FORMAT_B4G4R4A4_UNORM, PIPE_FORMAT_B10G10R10A2_UNORM,458PIPE_FORMAT_L8_UNORM, PIPE_FORMAT_A8_UNORM,459PIPE_FORMAT_I8_UNORM, PIPE_FORMAT_NONE /* list terminator */460};461static const enum pipe_format depth_supported[] = {462/* XXX why not?463PIPE_FORMAT_Z16_UNORM, */464PIPE_FORMAT_Z24X8_UNORM, PIPE_FORMAT_Z24_UNORM_S8_UINT,465PIPE_FORMAT_NONE /* list terminator */466};467const enum pipe_format *list;468uint32_t i;469470if (sample_count > 1)471return false;472473if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))474return false;475476if (tex_usage & PIPE_BIND_DEPTH_STENCIL)477list = depth_supported;478else if (tex_usage & PIPE_BIND_RENDER_TARGET)479list = render_supported;480else if (tex_usage & PIPE_BIND_SAMPLER_VIEW)481list = tex_supported;482else483return true; /* PIPE_BIND_{VERTEX,INDEX}_BUFFER */484485for (i = 0; list[i] != PIPE_FORMAT_NONE; i++) {486if (list[i] == format)487return true;488}489490return false;491}492493/*494* Fence functions495*/496497static void498i915_fence_reference(struct pipe_screen *screen, struct pipe_fence_handle **ptr,499struct pipe_fence_handle *fence)500{501struct i915_screen *is = i915_screen(screen);502503is->iws->fence_reference(is->iws, ptr, fence);504}505506static bool507i915_fence_finish(struct pipe_screen *screen, struct pipe_context *ctx,508struct pipe_fence_handle *fence, uint64_t timeout)509{510struct i915_screen *is = i915_screen(screen);511512if (!timeout)513return is->iws->fence_signalled(is->iws, fence) == 1;514515return is->iws->fence_finish(is->iws, fence) == 1;516}517518/*519* Generic functions520*/521522static void523i915_flush_frontbuffer(struct pipe_screen *screen, struct pipe_context *pipe,524struct pipe_resource *resource, unsigned level,525unsigned layer, void *winsys_drawable_handle,526struct pipe_box *sub_box)527{528/* XXX: Dummy right now. */529(void)screen;530(void)pipe;531(void)resource;532(void)level;533(void)layer;534(void)winsys_drawable_handle;535(void)sub_box;536}537538static void539i915_destroy_screen(struct pipe_screen *screen)540{541struct i915_screen *is = i915_screen(screen);542543if (is->iws)544is->iws->destroy(is->iws);545546FREE(is);547}548549/**550* Create a new i915_screen object551*/552struct pipe_screen *553i915_screen_create(struct i915_winsys *iws)554{555struct i915_screen *is = CALLOC_STRUCT(i915_screen);556557if (!is)558return NULL;559560switch (iws->pci_id) {561case PCI_CHIP_I915_G:562case PCI_CHIP_I915_GM:563is->is_i945 = false;564break;565566case PCI_CHIP_I945_G:567case PCI_CHIP_I945_GM:568case PCI_CHIP_I945_GME:569case PCI_CHIP_G33_G:570case PCI_CHIP_Q33_G:571case PCI_CHIP_Q35_G:572case PCI_CHIP_PINEVIEW_G:573case PCI_CHIP_PINEVIEW_M:574is->is_i945 = true;575break;576577default:578debug_printf("%s: unknown pci id 0x%x, cannot create screen\n",579__FUNCTION__, iws->pci_id);580FREE(is);581return NULL;582}583584is->iws = iws;585586is->base.destroy = i915_destroy_screen;587is->base.flush_frontbuffer = i915_flush_frontbuffer;588589is->base.get_name = i915_get_name;590is->base.get_vendor = i915_get_vendor;591is->base.get_device_vendor = i915_get_device_vendor;592is->base.get_param = i915_get_param;593is->base.get_shader_param = i915_get_shader_param;594is->base.get_paramf = i915_get_paramf;595is->base.get_compiler_options = i915_get_compiler_options;596is->base.is_format_supported = i915_is_format_supported;597598is->base.context_create = i915_create_context;599600is->base.fence_reference = i915_fence_reference;601is->base.fence_finish = i915_fence_finish;602603i915_init_screen_resource_functions(is);604605i915_debug_init(is);606607return &is->base;608}609610611