Path: blob/21.2-virgl/src/gallium/drivers/nouveau/nvc0/nvc0_screen.c
4574 views
/*1* Copyright 2010 Christoph Bumiller2*3* Permission is hereby granted, free of charge, to any person obtaining a4* copy of this software and associated documentation files (the "Software"),5* to deal in the Software without restriction, including without limitation6* the rights to use, copy, modify, merge, publish, distribute, sublicense,7* and/or sell copies of the Software, and to permit persons to whom the8* Software is furnished to do so, subject to the following conditions:9*10* The above copyright notice and this permission notice shall be included in11* all copies or substantial portions of the Software.12*13* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR14* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,15* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL16* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR17* OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,18* ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR19* OTHER DEALINGS IN THE SOFTWARE.20*/2122#include <xf86drm.h>23#include <nouveau_drm.h>24#include <nvif/class.h>25#include "util/format/u_format.h"26#include "util/format/u_format_s3tc.h"27#include "util/u_screen.h"28#include "pipe/p_screen.h"2930#include "nouveau_vp3_video.h"3132#include "codegen/nv50_ir_driver.h"3334#include "nvc0/nvc0_context.h"35#include "nvc0/nvc0_screen.h"3637#include "nvc0/mme/com9097.mme.h"38#include "nvc0/mme/com90c0.mme.h"39#include "nvc0/mme/comc597.mme.h"4041#include "nv50/g80_texture.xml.h"4243static bool44nvc0_screen_is_format_supported(struct pipe_screen *pscreen,45enum pipe_format format,46enum pipe_texture_target target,47unsigned sample_count,48unsigned storage_sample_count,49unsigned bindings)50{51const struct util_format_description *desc = util_format_description(format);5253if (sample_count > 8)54return false;55if (!(0x117 & (1 << sample_count))) /* 0, 1, 2, 4 or 8 */56return false;5758if (MAX2(1, sample_count) != MAX2(1, storage_sample_count))59return false;6061/* Short-circuit the rest of the logic -- this is used by the gallium frontend62* to determine valid MS levels in a no-attachments scenario.63*/64if (format == PIPE_FORMAT_NONE && bindings & PIPE_BIND_RENDER_TARGET)65return true;6667if ((bindings & PIPE_BIND_SAMPLER_VIEW) && (target != PIPE_BUFFER))68if (util_format_get_blocksizebits(format) == 3 * 32)69return false;7071if (bindings & PIPE_BIND_LINEAR)72if (util_format_is_depth_or_stencil(format) ||73(target != PIPE_TEXTURE_1D &&74target != PIPE_TEXTURE_2D &&75target != PIPE_TEXTURE_RECT) ||76sample_count > 1)77return false;7879/* Restrict ETC2 and ASTC formats here. These are only supported on GK20A80* and GM20B.81*/82if ((desc->layout == UTIL_FORMAT_LAYOUT_ETC ||83desc->layout == UTIL_FORMAT_LAYOUT_ASTC) &&84nouveau_screen(pscreen)->device->chipset != 0x12b &&85nouveau_screen(pscreen)->class_3d != NVEA_3D_CLASS)86return false;8788/* shared is always supported */89bindings &= ~(PIPE_BIND_LINEAR |90PIPE_BIND_SHARED);9192if (bindings & PIPE_BIND_SHADER_IMAGE) {93if (format == PIPE_FORMAT_B8G8R8A8_UNORM &&94nouveau_screen(pscreen)->class_3d < NVE4_3D_CLASS) {95/* This should work on Fermi, but for currently unknown reasons it96* does not and results in breaking reads from pbos. */97return false;98}99}100101if (bindings & PIPE_BIND_INDEX_BUFFER) {102if (format != PIPE_FORMAT_R8_UINT &&103format != PIPE_FORMAT_R16_UINT &&104format != PIPE_FORMAT_R32_UINT)105return false;106bindings &= ~PIPE_BIND_INDEX_BUFFER;107}108109return (( nvc0_format_table[format].usage |110nvc0_vertex_format[format].usage) & bindings) == bindings;111}112113static int114nvc0_screen_get_param(struct pipe_screen *pscreen, enum pipe_cap param)115{116const uint16_t class_3d = nouveau_screen(pscreen)->class_3d;117const struct nouveau_screen *screen = nouveau_screen(pscreen);118struct nouveau_device *dev = screen->device;119static bool debug_cap_printed[PIPE_CAP_LAST] = {};120121switch (param) {122/* non-boolean caps */123case PIPE_CAP_MAX_TEXTURE_2D_SIZE:124return 16384;125case PIPE_CAP_MAX_TEXTURE_CUBE_LEVELS:126return 15;127case PIPE_CAP_MAX_TEXTURE_3D_LEVELS:128return 12;129case PIPE_CAP_MAX_TEXTURE_ARRAY_LAYERS:130return 2048;131case PIPE_CAP_MIN_TEXEL_OFFSET:132return -8;133case PIPE_CAP_MAX_TEXEL_OFFSET:134return 7;135case PIPE_CAP_MIN_TEXTURE_GATHER_OFFSET:136return -32;137case PIPE_CAP_MAX_TEXTURE_GATHER_OFFSET:138return 31;139case PIPE_CAP_MAX_TEXTURE_BUFFER_SIZE:140return 128 * 1024 * 1024;141case PIPE_CAP_GLSL_FEATURE_LEVEL:142return 430;143case PIPE_CAP_GLSL_FEATURE_LEVEL_COMPATIBILITY:144return 430;145case PIPE_CAP_MAX_RENDER_TARGETS:146return 8;147case PIPE_CAP_MAX_DUAL_SOURCE_RENDER_TARGETS:148return 1;149case PIPE_CAP_VIEWPORT_SUBPIXEL_BITS:150case PIPE_CAP_RASTERIZER_SUBPIXEL_BITS:151return 8;152case PIPE_CAP_MAX_STREAM_OUTPUT_BUFFERS:153return 4;154case PIPE_CAP_MAX_STREAM_OUTPUT_SEPARATE_COMPONENTS:155case PIPE_CAP_MAX_STREAM_OUTPUT_INTERLEAVED_COMPONENTS:156return 128;157case PIPE_CAP_MAX_GEOMETRY_OUTPUT_VERTICES:158case PIPE_CAP_MAX_GEOMETRY_TOTAL_OUTPUT_COMPONENTS:159return 1024;160case PIPE_CAP_MAX_VERTEX_STREAMS:161return 4;162case PIPE_CAP_MAX_GS_INVOCATIONS:163return 32;164case PIPE_CAP_MAX_SHADER_BUFFER_SIZE:165return 1 << 27;166case PIPE_CAP_MAX_VERTEX_ATTRIB_STRIDE:167return 2048;168case PIPE_CAP_MAX_VERTEX_ELEMENT_SRC_OFFSET:169return 2047;170case PIPE_CAP_CONSTANT_BUFFER_OFFSET_ALIGNMENT:171return 256;172case PIPE_CAP_TEXTURE_BUFFER_OFFSET_ALIGNMENT:173if (class_3d < GM107_3D_CLASS)174return 256; /* IMAGE bindings require alignment to 256 */175return 16;176case PIPE_CAP_SHADER_BUFFER_OFFSET_ALIGNMENT:177return 16;178case PIPE_CAP_MIN_MAP_BUFFER_ALIGNMENT:179return NOUVEAU_MIN_BUFFER_MAP_ALIGN;180case PIPE_CAP_MAX_VIEWPORTS:181return NVC0_MAX_VIEWPORTS;182case PIPE_CAP_MAX_TEXTURE_GATHER_COMPONENTS:183return 4;184case PIPE_CAP_TEXTURE_BORDER_COLOR_QUIRK:185return PIPE_QUIRK_TEXTURE_BORDER_COLOR_SWIZZLE_NV50;186case PIPE_CAP_ENDIANNESS:187return PIPE_ENDIAN_LITTLE;188case PIPE_CAP_MAX_SHADER_PATCH_VARYINGS:189return 30;190case PIPE_CAP_MAX_WINDOW_RECTANGLES:191return NVC0_MAX_WINDOW_RECTANGLES;192case PIPE_CAP_MAX_CONSERVATIVE_RASTER_SUBPIXEL_PRECISION_BIAS:193return class_3d >= GM200_3D_CLASS ? 8 : 0;194case PIPE_CAP_MAX_TEXTURE_UPLOAD_MEMORY_BUDGET:195return 64 * 1024 * 1024;196case PIPE_CAP_MAX_VARYINGS:197/* NOTE: These only count our slots for GENERIC varyings.198* The address space may be larger, but the actual hard limit seems to be199* less than what the address space layout permits, so don't add TEXCOORD,200* COLOR, etc. here.201*/202return 0x1f0 / 16;203case PIPE_CAP_MAX_VERTEX_BUFFERS:204return 16;205case PIPE_CAP_GL_BEGIN_END_BUFFER_SIZE:206return 512 * 1024; /* TODO: Investigate tuning this */207case PIPE_CAP_MAX_TEXTURE_MB:208return 0; /* TODO: use 1/2 of VRAM for this? */209210case PIPE_CAP_SUPPORTED_PRIM_MODES_WITH_RESTART:211case PIPE_CAP_SUPPORTED_PRIM_MODES:212return BITFIELD_MASK(PIPE_PRIM_MAX);213214/* supported caps */215case PIPE_CAP_TEXTURE_MIRROR_CLAMP:216case PIPE_CAP_TEXTURE_MIRROR_CLAMP_TO_EDGE:217case PIPE_CAP_TEXTURE_SWIZZLE:218case PIPE_CAP_TEXTURE_SHADOW_MAP:219case PIPE_CAP_NPOT_TEXTURES:220case PIPE_CAP_MIXED_FRAMEBUFFER_SIZES:221case PIPE_CAP_MIXED_COLOR_DEPTH_BITS:222case PIPE_CAP_ANISOTROPIC_FILTER:223case PIPE_CAP_SEAMLESS_CUBE_MAP:224case PIPE_CAP_CUBE_MAP_ARRAY:225case PIPE_CAP_TEXTURE_BUFFER_OBJECTS:226case PIPE_CAP_TEXTURE_MULTISAMPLE:227case PIPE_CAP_DEPTH_CLIP_DISABLE:228case PIPE_CAP_POINT_SPRITE:229case PIPE_CAP_TGSI_TEXCOORD:230case PIPE_CAP_FRAGMENT_SHADER_TEXTURE_LOD:231case PIPE_CAP_FRAGMENT_SHADER_DERIVATIVES:232case PIPE_CAP_VERTEX_SHADER_SATURATE:233case PIPE_CAP_FRAGMENT_COLOR_CLAMPED:234case PIPE_CAP_VERTEX_COLOR_UNCLAMPED:235case PIPE_CAP_VERTEX_COLOR_CLAMPED:236case PIPE_CAP_QUERY_TIMESTAMP:237case PIPE_CAP_QUERY_TIME_ELAPSED:238case PIPE_CAP_OCCLUSION_QUERY:239case PIPE_CAP_STREAM_OUTPUT_PAUSE_RESUME:240case PIPE_CAP_STREAM_OUTPUT_INTERLEAVE_BUFFERS:241case PIPE_CAP_QUERY_PIPELINE_STATISTICS:242case PIPE_CAP_BLEND_EQUATION_SEPARATE:243case PIPE_CAP_INDEP_BLEND_ENABLE:244case PIPE_CAP_INDEP_BLEND_FUNC:245case PIPE_CAP_TGSI_FS_COORD_ORIGIN_UPPER_LEFT:246case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_HALF_INTEGER:247case PIPE_CAP_PRIMITIVE_RESTART:248case PIPE_CAP_PRIMITIVE_RESTART_FIXED_INDEX:249case PIPE_CAP_TGSI_INSTANCEID:250case PIPE_CAP_VERTEX_ELEMENT_INSTANCE_DIVISOR:251case PIPE_CAP_MIXED_COLORBUFFER_FORMATS:252case PIPE_CAP_CONDITIONAL_RENDER:253case PIPE_CAP_TEXTURE_BARRIER:254case PIPE_CAP_QUADS_FOLLOW_PROVOKING_VERTEX_CONVENTION:255case PIPE_CAP_START_INSTANCE:256case PIPE_CAP_BUFFER_MAP_PERSISTENT_COHERENT:257case PIPE_CAP_DRAW_INDIRECT:258case PIPE_CAP_USER_VERTEX_BUFFERS:259case PIPE_CAP_TEXTURE_QUERY_LOD:260case PIPE_CAP_SAMPLE_SHADING:261case PIPE_CAP_TEXTURE_GATHER_OFFSETS:262case PIPE_CAP_TEXTURE_GATHER_SM5:263case PIPE_CAP_TGSI_FS_FINE_DERIVATIVE:264case PIPE_CAP_CONDITIONAL_RENDER_INVERTED:265case PIPE_CAP_SAMPLER_VIEW_TARGET:266case PIPE_CAP_CLIP_HALFZ:267case PIPE_CAP_POLYGON_OFFSET_CLAMP:268case PIPE_CAP_MULTISAMPLE_Z_RESOLVE:269case PIPE_CAP_TEXTURE_FLOAT_LINEAR:270case PIPE_CAP_TEXTURE_HALF_FLOAT_LINEAR:271case PIPE_CAP_DEPTH_BOUNDS_TEST:272case PIPE_CAP_TGSI_TXQS:273case PIPE_CAP_COPY_BETWEEN_COMPRESSED_AND_PLAIN_FORMATS:274case PIPE_CAP_FORCE_PERSAMPLE_INTERP:275case PIPE_CAP_CLEAR_TEXTURE:276case PIPE_CAP_DRAW_PARAMETERS:277case PIPE_CAP_TGSI_PACK_HALF_FLOAT:278case PIPE_CAP_MULTI_DRAW_INDIRECT:279case PIPE_CAP_MULTI_DRAW_INDIRECT_PARAMS:280case PIPE_CAP_TGSI_FS_FACE_IS_INTEGER_SYSVAL:281case PIPE_CAP_QUERY_BUFFER_OBJECT:282case PIPE_CAP_INVALIDATE_BUFFER:283case PIPE_CAP_STRING_MARKER:284case PIPE_CAP_FRAMEBUFFER_NO_ATTACHMENT:285case PIPE_CAP_CULL_DISTANCE:286case PIPE_CAP_ROBUST_BUFFER_ACCESS_BEHAVIOR:287case PIPE_CAP_TGSI_VOTE:288case PIPE_CAP_POLYGON_OFFSET_UNITS_UNSCALED:289case PIPE_CAP_TGSI_ARRAY_COMPONENTS:290case PIPE_CAP_TGSI_MUL_ZERO_WINS:291case PIPE_CAP_DOUBLES:292case PIPE_CAP_INT64:293case PIPE_CAP_TGSI_TEX_TXF_LZ:294case PIPE_CAP_TGSI_CLOCK:295case PIPE_CAP_COMPUTE:296case PIPE_CAP_CAN_BIND_CONST_BUFFER_AS_VERTEX:297case PIPE_CAP_ALLOW_MAPPED_BUFFERS_DURING_EXECUTION:298case PIPE_CAP_QUERY_SO_OVERFLOW:299case PIPE_CAP_DEST_SURFACE_SRGB_CONTROL:300case PIPE_CAP_TGSI_DIV:301case PIPE_CAP_TGSI_ATOMINC_WRAP:302case PIPE_CAP_DEMOTE_TO_HELPER_INVOCATION:303case PIPE_CAP_DEVICE_RESET_STATUS_QUERY:304case PIPE_CAP_PREFER_IMM_ARRAYS_AS_CONSTBUF:305case PIPE_CAP_FLATSHADE:306case PIPE_CAP_ALPHA_TEST:307case PIPE_CAP_POINT_SIZE_FIXED:308case PIPE_CAP_TWO_SIDED_COLOR:309case PIPE_CAP_CLIP_PLANES:310case PIPE_CAP_TEXTURE_SHADOW_LOD:311case PIPE_CAP_PACKED_STREAM_OUTPUT:312case PIPE_CAP_CLEAR_SCISSORED:313case PIPE_CAP_GL_CLAMP:314return 1;315case PIPE_CAP_PREFER_BLIT_BASED_TEXTURE_TRANSFER:316return nouveau_screen(pscreen)->vram_domain & NOUVEAU_BO_VRAM ? 1 : 0;317case PIPE_CAP_FBFETCH:318return class_3d >= NVE4_3D_CLASS ? 1 : 0; /* needs testing on fermi */319case PIPE_CAP_SEAMLESS_CUBE_MAP_PER_TEXTURE:320case PIPE_CAP_TGSI_BALLOT:321return class_3d >= NVE4_3D_CLASS;322case PIPE_CAP_BINDLESS_TEXTURE:323return class_3d >= NVE4_3D_CLASS;324case PIPE_CAP_TGSI_ATOMFADD:325return class_3d < GM107_3D_CLASS; /* needs additional lowering */326case PIPE_CAP_POLYGON_MODE_FILL_RECTANGLE:327case PIPE_CAP_TGSI_VS_LAYER_VIEWPORT:328case PIPE_CAP_TGSI_TES_LAYER_VIEWPORT:329case PIPE_CAP_POST_DEPTH_COVERAGE:330case PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_TRIANGLES:331case PIPE_CAP_CONSERVATIVE_RASTER_POST_SNAP_POINTS_LINES:332case PIPE_CAP_CONSERVATIVE_RASTER_POST_DEPTH_COVERAGE:333case PIPE_CAP_PROGRAMMABLE_SAMPLE_LOCATIONS:334case PIPE_CAP_VIEWPORT_SWIZZLE:335case PIPE_CAP_VIEWPORT_MASK:336case PIPE_CAP_SAMPLER_REDUCTION_MINMAX:337return class_3d >= GM200_3D_CLASS;338case PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_TRIANGLES:339return class_3d >= GP100_3D_CLASS;340case PIPE_CAP_RESOURCE_FROM_USER_MEMORY_COMPUTE_ONLY:341case PIPE_CAP_SYSTEM_SVM:342return screen->has_svm ? 1 : 0;343344/* caps has to be turned on with nir */345case PIPE_CAP_GL_SPIRV:346case PIPE_CAP_GL_SPIRV_VARIABLE_POINTERS:347case PIPE_CAP_INT64_DIVMOD:348return screen->prefer_nir ? 1 : 0;349350/* nir related caps */351case PIPE_CAP_NIR_IMAGES_AS_DEREF:352return 0;353354/* unsupported caps */355case PIPE_CAP_EMULATE_NONFIXED_PRIMITIVE_RESTART:356case PIPE_CAP_DEPTH_CLIP_DISABLE_SEPARATE:357case PIPE_CAP_TGSI_FS_COORD_ORIGIN_LOWER_LEFT:358case PIPE_CAP_TGSI_FS_COORD_PIXEL_CENTER_INTEGER:359case PIPE_CAP_SHADER_STENCIL_EXPORT:360case PIPE_CAP_TGSI_CAN_COMPACT_CONSTANTS:361case PIPE_CAP_VERTEX_BUFFER_OFFSET_4BYTE_ALIGNED_ONLY:362case PIPE_CAP_VERTEX_BUFFER_STRIDE_4BYTE_ALIGNED_ONLY:363case PIPE_CAP_VERTEX_ELEMENT_SRC_OFFSET_4BYTE_ALIGNED_ONLY:364case PIPE_CAP_FAKE_SW_MSAA:365case PIPE_CAP_TGSI_VS_WINDOW_SPACE_POSITION:366case PIPE_CAP_VERTEXID_NOBASE:367case PIPE_CAP_RESOURCE_FROM_USER_MEMORY:368case PIPE_CAP_TGSI_FS_POSITION_IS_SYSVAL:369case PIPE_CAP_TGSI_FS_POINT_IS_SYSVAL:370case PIPE_CAP_GENERATE_MIPMAP:371case PIPE_CAP_BUFFER_SAMPLER_VIEW_RGBA_ONLY:372case PIPE_CAP_SURFACE_REINTERPRET_BLOCKS:373case PIPE_CAP_QUERY_MEMORY_INFO:374case PIPE_CAP_PCI_GROUP:375case PIPE_CAP_PCI_BUS:376case PIPE_CAP_PCI_DEVICE:377case PIPE_CAP_PCI_FUNCTION:378case PIPE_CAP_TGSI_CAN_READ_OUTPUTS:379case PIPE_CAP_NATIVE_FENCE_FD:380case PIPE_CAP_GLSL_OPTIMIZE_CONSERVATIVELY:381case PIPE_CAP_SPARSE_BUFFER_PAGE_SIZE:382case PIPE_CAP_NIR_SAMPLERS_AS_DEREF:383case PIPE_CAP_MEMOBJ:384case PIPE_CAP_LOAD_CONSTBUF:385case PIPE_CAP_TGSI_ANY_REG_AS_ADDRESS:386case PIPE_CAP_TILE_RASTER_ORDER:387case PIPE_CAP_MAX_COMBINED_SHADER_OUTPUT_RESOURCES:388case PIPE_CAP_FRAMEBUFFER_MSAA_CONSTRAINTS:389case PIPE_CAP_SIGNED_VERTEX_BUFFER_OFFSET:390case PIPE_CAP_CONTEXT_PRIORITY_MASK:391case PIPE_CAP_FENCE_SIGNAL:392case PIPE_CAP_CONSTBUF0_FLAGS:393case PIPE_CAP_PACKED_UNIFORMS:394case PIPE_CAP_CONSERVATIVE_RASTER_PRE_SNAP_POINTS_LINES:395case PIPE_CAP_MAX_COMBINED_SHADER_BUFFERS:396case PIPE_CAP_MAX_COMBINED_HW_ATOMIC_COUNTERS:397case PIPE_CAP_MAX_COMBINED_HW_ATOMIC_COUNTER_BUFFERS:398case PIPE_CAP_SURFACE_SAMPLE_COUNT:399case PIPE_CAP_QUERY_PIPELINE_STATISTICS_SINGLE:400case PIPE_CAP_RGB_OVERRIDE_DST_ALPHA_BLEND:401case PIPE_CAP_GLSL_TESS_LEVELS_AS_INPUTS:402case PIPE_CAP_NIR_COMPACT_ARRAYS:403case PIPE_CAP_IMAGE_LOAD_FORMATTED:404case PIPE_CAP_COMPUTE_SHADER_DERIVATIVES:405case PIPE_CAP_ATOMIC_FLOAT_MINMAX:406case PIPE_CAP_CONSERVATIVE_RASTER_INNER_COVERAGE:407case PIPE_CAP_FRAGMENT_SHADER_INTERLOCK:408case PIPE_CAP_CS_DERIVED_SYSTEM_VALUES_SUPPORTED:409case PIPE_CAP_FBFETCH_COHERENT:410case PIPE_CAP_TGSI_SKIP_SHRINK_IO_ARRAYS:411case PIPE_CAP_TGSI_TG4_COMPONENT_IN_SWIZZLE:412case PIPE_CAP_OPENCL_INTEGER_FUNCTIONS: /* could be done */413case PIPE_CAP_INTEGER_MULTIPLY_32X16: /* could be done */414case PIPE_CAP_FRONTEND_NOOP:415case PIPE_CAP_SHADER_SAMPLES_IDENTICAL:416case PIPE_CAP_VIEWPORT_TRANSFORM_LOWERED:417case PIPE_CAP_PSIZ_CLAMPED:418case PIPE_CAP_TEXTURE_BUFFER_SAMPLER:419case PIPE_CAP_PREFER_REAL_BUFFER_IN_CONSTBUF0:420case PIPE_CAP_MAP_UNSYNCHRONIZED_THREAD_SAFE: /* when we fix MT stuff */421case PIPE_CAP_ALPHA_TO_COVERAGE_DITHER_CONTROL: /* TODO */422case PIPE_CAP_SHADER_ATOMIC_INT64: /* TODO */423case PIPE_CAP_GLSL_ZERO_INIT:424case PIPE_CAP_BLEND_EQUATION_ADVANCED:425case PIPE_CAP_NO_CLIP_ON_COPY_TEX:426case PIPE_CAP_DEVICE_PROTECTED_CONTENT:427case PIPE_CAP_SAMPLER_REDUCTION_MINMAX_ARB:428return 0;429430case PIPE_CAP_VENDOR_ID:431return 0x10de;432case PIPE_CAP_DEVICE_ID: {433uint64_t device_id;434if (nouveau_getparam(dev, NOUVEAU_GETPARAM_PCI_DEVICE, &device_id)) {435NOUVEAU_ERR("NOUVEAU_GETPARAM_PCI_DEVICE failed.\n");436return -1;437}438return device_id;439}440case PIPE_CAP_ACCELERATED:441return 1;442case PIPE_CAP_VIDEO_MEMORY:443return dev->vram_size >> 20;444case PIPE_CAP_UMA:445return 0;446447default:448if (!debug_cap_printed[param]) {449debug_printf("%s: unhandled cap %d\n", __func__, param);450debug_cap_printed[param] = true;451}452FALLTHROUGH;453/* caps where we want the default value */454case PIPE_CAP_DMABUF:455case PIPE_CAP_ESSL_FEATURE_LEVEL:456case PIPE_CAP_THROTTLE:457return u_pipe_screen_get_param_defaults(pscreen, param);458}459}460461static int462nvc0_screen_get_shader_param(struct pipe_screen *pscreen,463enum pipe_shader_type shader,464enum pipe_shader_cap param)465{466const struct nouveau_screen *screen = nouveau_screen(pscreen);467const uint16_t class_3d = screen->class_3d;468469switch (shader) {470case PIPE_SHADER_VERTEX:471case PIPE_SHADER_GEOMETRY:472case PIPE_SHADER_FRAGMENT:473case PIPE_SHADER_COMPUTE:474case PIPE_SHADER_TESS_CTRL:475case PIPE_SHADER_TESS_EVAL:476break;477default:478return 0;479}480481switch (param) {482case PIPE_SHADER_CAP_PREFERRED_IR:483return screen->prefer_nir ? PIPE_SHADER_IR_NIR : PIPE_SHADER_IR_TGSI;484case PIPE_SHADER_CAP_SUPPORTED_IRS: {485uint32_t irs = 1 << PIPE_SHADER_IR_NIR |486((class_3d >= GV100_3D_CLASS) ? 0 : 1 << PIPE_SHADER_IR_TGSI);487if (screen->force_enable_cl)488irs |= 1 << PIPE_SHADER_IR_NIR_SERIALIZED;489return irs;490}491case PIPE_SHADER_CAP_MAX_INSTRUCTIONS:492case PIPE_SHADER_CAP_MAX_ALU_INSTRUCTIONS:493case PIPE_SHADER_CAP_MAX_TEX_INSTRUCTIONS:494case PIPE_SHADER_CAP_MAX_TEX_INDIRECTIONS:495return 16384;496case PIPE_SHADER_CAP_MAX_CONTROL_FLOW_DEPTH:497return 16;498case PIPE_SHADER_CAP_MAX_INPUTS:499return 0x200 / 16;500case PIPE_SHADER_CAP_MAX_OUTPUTS:501return 32;502case PIPE_SHADER_CAP_MAX_CONST_BUFFER_SIZE:503return NVC0_MAX_CONSTBUF_SIZE;504case PIPE_SHADER_CAP_MAX_CONST_BUFFERS:505return NVC0_MAX_PIPE_CONSTBUFS;506case PIPE_SHADER_CAP_INDIRECT_OUTPUT_ADDR:507return shader != PIPE_SHADER_FRAGMENT;508case PIPE_SHADER_CAP_INDIRECT_INPUT_ADDR:509/* HW doesn't support indirect addressing of fragment program inputs510* on Volta. The binary driver generates a function to handle every511* possible indirection, and indirectly calls the function to handle512* this instead.513*/514if (class_3d >= GV100_3D_CLASS)515return shader != PIPE_SHADER_FRAGMENT;516return 1;517case PIPE_SHADER_CAP_INDIRECT_TEMP_ADDR:518case PIPE_SHADER_CAP_INDIRECT_CONST_ADDR:519return 1;520case PIPE_SHADER_CAP_MAX_TEMPS:521return NVC0_CAP_MAX_PROGRAM_TEMPS;522case PIPE_SHADER_CAP_TGSI_CONT_SUPPORTED:523return 1;524case PIPE_SHADER_CAP_TGSI_SQRT_SUPPORTED:525return 1;526case PIPE_SHADER_CAP_SUBROUTINES:527return 1;528case PIPE_SHADER_CAP_INTEGERS:529return 1;530case PIPE_SHADER_CAP_TGSI_DROUND_SUPPORTED:531return 1;532case PIPE_SHADER_CAP_TGSI_FMA_SUPPORTED:533return 1;534case PIPE_SHADER_CAP_TGSI_SKIP_MERGE_REGISTERS:535return 1;536case PIPE_SHADER_CAP_TGSI_DFRACEXP_DLDEXP_SUPPORTED:537case PIPE_SHADER_CAP_TGSI_LDEXP_SUPPORTED:538case PIPE_SHADER_CAP_TGSI_ANY_INOUT_DECL_RANGE:539case PIPE_SHADER_CAP_LOWER_IF_THRESHOLD:540case PIPE_SHADER_CAP_INT64_ATOMICS:541case PIPE_SHADER_CAP_FP16:542case PIPE_SHADER_CAP_FP16_DERIVATIVES:543case PIPE_SHADER_CAP_FP16_CONST_BUFFERS:544case PIPE_SHADER_CAP_INT16:545case PIPE_SHADER_CAP_GLSL_16BIT_CONSTS:546case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTERS:547case PIPE_SHADER_CAP_MAX_HW_ATOMIC_COUNTER_BUFFERS:548return 0;549case PIPE_SHADER_CAP_MAX_SHADER_BUFFERS:550return NVC0_MAX_BUFFERS;551case PIPE_SHADER_CAP_MAX_TEXTURE_SAMPLERS:552return (class_3d >= NVE4_3D_CLASS) ? 32 : 16;553case PIPE_SHADER_CAP_MAX_SAMPLER_VIEWS:554return (class_3d >= NVE4_3D_CLASS) ? 32 : 16;555case PIPE_SHADER_CAP_MAX_UNROLL_ITERATIONS_HINT:556return 32;557case PIPE_SHADER_CAP_MAX_SHADER_IMAGES:558if (class_3d >= NVE4_3D_CLASS)559return NVC0_MAX_IMAGES;560if (shader == PIPE_SHADER_FRAGMENT || shader == PIPE_SHADER_COMPUTE)561return NVC0_MAX_IMAGES;562return 0;563default:564NOUVEAU_ERR("unknown PIPE_SHADER_CAP %d\n", param);565return 0;566}567}568569static float570nvc0_screen_get_paramf(struct pipe_screen *pscreen, enum pipe_capf param)571{572const uint16_t class_3d = nouveau_screen(pscreen)->class_3d;573574switch (param) {575case PIPE_CAPF_MAX_LINE_WIDTH:576case PIPE_CAPF_MAX_LINE_WIDTH_AA:577return 10.0f;578case PIPE_CAPF_MAX_POINT_WIDTH:579return 63.0f;580case PIPE_CAPF_MAX_POINT_WIDTH_AA:581return 63.375f;582case PIPE_CAPF_MAX_TEXTURE_ANISOTROPY:583return 16.0f;584case PIPE_CAPF_MAX_TEXTURE_LOD_BIAS:585return 15.0f;586case PIPE_CAPF_MIN_CONSERVATIVE_RASTER_DILATE:587return 0.0f;588case PIPE_CAPF_MAX_CONSERVATIVE_RASTER_DILATE:589return class_3d >= GM200_3D_CLASS ? 0.75f : 0.0f;590case PIPE_CAPF_CONSERVATIVE_RASTER_DILATE_GRANULARITY:591return class_3d >= GM200_3D_CLASS ? 0.25f : 0.0f;592}593594NOUVEAU_ERR("unknown PIPE_CAPF %d\n", param);595return 0.0f;596}597598static int599nvc0_screen_get_compute_param(struct pipe_screen *pscreen,600enum pipe_shader_ir ir_type,601enum pipe_compute_cap param, void *data)602{603struct nvc0_screen *screen = nvc0_screen(pscreen);604const uint16_t obj_class = screen->compute->oclass;605606#define RET(x) do { \607if (data) \608memcpy(data, x, sizeof(x)); \609return sizeof(x); \610} while (0)611612switch (param) {613case PIPE_COMPUTE_CAP_GRID_DIMENSION:614RET((uint64_t []) { 3 });615case PIPE_COMPUTE_CAP_MAX_GRID_SIZE:616if (obj_class >= NVE4_COMPUTE_CLASS) {617RET(((uint64_t []) { 0x7fffffff, 65535, 65535 }));618} else {619RET(((uint64_t []) { 65535, 65535, 65535 }));620}621case PIPE_COMPUTE_CAP_MAX_BLOCK_SIZE:622RET(((uint64_t []) { 1024, 1024, 64 }));623case PIPE_COMPUTE_CAP_MAX_THREADS_PER_BLOCK:624RET((uint64_t []) { 1024 });625case PIPE_COMPUTE_CAP_MAX_VARIABLE_THREADS_PER_BLOCK:626if (obj_class >= NVE4_COMPUTE_CLASS) {627RET((uint64_t []) { 1024 });628} else {629RET((uint64_t []) { 512 });630}631case PIPE_COMPUTE_CAP_MAX_GLOBAL_SIZE: /* g[] */632RET((uint64_t []) { 1ULL << 40 });633case PIPE_COMPUTE_CAP_MAX_LOCAL_SIZE: /* s[] */634switch (obj_class) {635case GM200_COMPUTE_CLASS:636RET((uint64_t []) { 96 << 10 });637case GM107_COMPUTE_CLASS:638RET((uint64_t []) { 64 << 10 });639default:640RET((uint64_t []) { 48 << 10 });641}642case PIPE_COMPUTE_CAP_MAX_PRIVATE_SIZE: /* l[] */643RET((uint64_t []) { 512 << 10 });644case PIPE_COMPUTE_CAP_MAX_INPUT_SIZE: /* c[], arbitrary limit */645RET((uint64_t []) { 4096 });646case PIPE_COMPUTE_CAP_SUBGROUP_SIZE:647RET((uint32_t []) { 32 });648case PIPE_COMPUTE_CAP_MAX_MEM_ALLOC_SIZE:649RET((uint64_t []) { 1ULL << 40 });650case PIPE_COMPUTE_CAP_IMAGES_SUPPORTED:651RET((uint32_t []) { NVC0_MAX_IMAGES });652case PIPE_COMPUTE_CAP_MAX_COMPUTE_UNITS:653RET((uint32_t []) { screen->mp_count_compute });654case PIPE_COMPUTE_CAP_MAX_CLOCK_FREQUENCY:655RET((uint32_t []) { 512 }); /* FIXME: arbitrary limit */656case PIPE_COMPUTE_CAP_ADDRESS_BITS:657RET((uint32_t []) { 64 });658default:659return 0;660}661662#undef RET663}664665static void666nvc0_screen_get_sample_pixel_grid(struct pipe_screen *pscreen,667unsigned sample_count,668unsigned *width, unsigned *height)669{670switch (sample_count) {671case 0:672case 1:673/* this could be 4x4, but the GL state tracker makes it difficult to674* create a 1x MSAA texture and smaller grids save CB space */675*width = 2;676*height = 4;677break;678case 2:679*width = 2;680*height = 4;681break;682case 4:683*width = 2;684*height = 2;685break;686case 8:687*width = 1;688*height = 2;689break;690default:691assert(0);692}693}694695static void696nvc0_screen_destroy(struct pipe_screen *pscreen)697{698struct nvc0_screen *screen = nvc0_screen(pscreen);699700if (!nouveau_drm_screen_unref(&screen->base))701return;702703nouveau_fence_cleanup(&screen->base);704705if (screen->base.pushbuf)706screen->base.pushbuf->user_priv = NULL;707708if (screen->blitter)709nvc0_blitter_destroy(screen);710if (screen->pm.prog) {711screen->pm.prog->code = NULL; /* hardcoded, don't FREE */712nvc0_program_destroy(NULL, screen->pm.prog);713FREE(screen->pm.prog);714}715716nouveau_bo_ref(NULL, &screen->text);717nouveau_bo_ref(NULL, &screen->uniform_bo);718nouveau_bo_ref(NULL, &screen->tls);719nouveau_bo_ref(NULL, &screen->txc);720nouveau_bo_ref(NULL, &screen->fence.bo);721nouveau_bo_ref(NULL, &screen->poly_cache);722723nouveau_heap_destroy(&screen->lib_code);724nouveau_heap_destroy(&screen->text_heap);725726FREE(screen->tic.entries);727728nouveau_object_del(&screen->eng3d);729nouveau_object_del(&screen->eng2d);730nouveau_object_del(&screen->m2mf);731nouveau_object_del(&screen->compute);732nouveau_object_del(&screen->nvsw);733734nouveau_screen_fini(&screen->base);735736FREE(screen);737}738739static int740nvc0_graph_set_macro(struct nvc0_screen *screen, uint32_t m, unsigned pos,741unsigned size, const uint32_t *data)742{743struct nouveau_pushbuf *push = screen->base.pushbuf;744745size /= 4;746747assert((pos + size) <= 0x800);748749BEGIN_NVC0(push, SUBC_3D(NVC0_GRAPH_MACRO_ID), 2);750PUSH_DATA (push, (m - 0x3800) / 8);751PUSH_DATA (push, pos);752BEGIN_1IC0(push, SUBC_3D(NVC0_GRAPH_MACRO_UPLOAD_POS), size + 1);753PUSH_DATA (push, pos);754PUSH_DATAp(push, data, size);755756return pos + size;757}758759static int760tu102_graph_set_macro(struct nvc0_screen *screen, uint32_t m, unsigned pos,761unsigned size, const uint32_t *data)762{763struct nouveau_pushbuf *push = screen->base.pushbuf;764765size /= 4;766767assert((pos + size) <= 0x800);768769BEGIN_NVC0(push, SUBC_3D(NVC0_GRAPH_MACRO_ID), 2);770PUSH_DATA (push, (m - 0x3800) / 8);771PUSH_DATA (push, pos);772BEGIN_1IC0(push, SUBC_3D(NVC0_GRAPH_MACRO_UPLOAD_POS), size + 1);773PUSH_DATA (push, pos);774PUSH_DATAp(push, data, size);775776return pos + (size / 3);777}778779static void780nvc0_magic_3d_init(struct nouveau_pushbuf *push, uint16_t obj_class)781{782BEGIN_NVC0(push, SUBC_3D(0x10cc), 1);783PUSH_DATA (push, 0xff);784BEGIN_NVC0(push, SUBC_3D(0x10e0), 2);785PUSH_DATA (push, 0xff);786PUSH_DATA (push, 0xff);787BEGIN_NVC0(push, SUBC_3D(0x10ec), 2);788PUSH_DATA (push, 0xff);789PUSH_DATA (push, 0xff);790if (obj_class < GV100_3D_CLASS) {791BEGIN_NVC0(push, SUBC_3D(0x074c), 1);792PUSH_DATA (push, 0x3f);793}794795BEGIN_NVC0(push, SUBC_3D(0x16a8), 1);796PUSH_DATA (push, (3 << 16) | 3);797BEGIN_NVC0(push, SUBC_3D(0x1794), 1);798PUSH_DATA (push, (2 << 16) | 2);799800if (obj_class < GM107_3D_CLASS) {801BEGIN_NVC0(push, SUBC_3D(0x12ac), 1);802PUSH_DATA (push, 0);803}804BEGIN_NVC0(push, SUBC_3D(0x0218), 1);805PUSH_DATA (push, 0x10);806BEGIN_NVC0(push, SUBC_3D(0x10fc), 1);807PUSH_DATA (push, 0x10);808BEGIN_NVC0(push, SUBC_3D(0x1290), 1);809PUSH_DATA (push, 0x10);810BEGIN_NVC0(push, SUBC_3D(0x12d8), 2);811PUSH_DATA (push, 0x10);812PUSH_DATA (push, 0x10);813BEGIN_NVC0(push, SUBC_3D(0x1140), 1);814PUSH_DATA (push, 0x10);815BEGIN_NVC0(push, SUBC_3D(0x1610), 1);816PUSH_DATA (push, 0xe);817818BEGIN_NVC0(push, NVC0_3D(VERTEX_ID_GEN_MODE), 1);819PUSH_DATA (push, NVC0_3D_VERTEX_ID_GEN_MODE_DRAW_ARRAYS_ADD_START);820BEGIN_NVC0(push, SUBC_3D(0x030c), 1);821PUSH_DATA (push, 0);822BEGIN_NVC0(push, SUBC_3D(0x0300), 1);823PUSH_DATA (push, 3);824825if (obj_class < GV100_3D_CLASS) {826BEGIN_NVC0(push, SUBC_3D(0x02d0), 1);827PUSH_DATA (push, 0x3fffff);828}829BEGIN_NVC0(push, SUBC_3D(0x0fdc), 1);830PUSH_DATA (push, 1);831BEGIN_NVC0(push, SUBC_3D(0x19c0), 1);832PUSH_DATA (push, 1);833834if (obj_class < GM107_3D_CLASS) {835BEGIN_NVC0(push, SUBC_3D(0x075c), 1);836PUSH_DATA (push, 3);837838if (obj_class >= NVE4_3D_CLASS) {839BEGIN_NVC0(push, SUBC_3D(0x07fc), 1);840PUSH_DATA (push, 1);841}842}843844/* TODO: find out what software methods 0x1528, 0x1280 and (on nve4) 0x02dc845* are supposed to do */846}847848static void849nvc0_screen_fence_emit(struct pipe_screen *pscreen, u32 *sequence)850{851struct nvc0_screen *screen = nvc0_screen(pscreen);852struct nouveau_pushbuf *push = screen->base.pushbuf;853854/* we need to do it after possible flush in MARK_RING */855*sequence = ++screen->base.fence.sequence;856857assert(PUSH_AVAIL(push) + push->rsvd_kick >= 5);858PUSH_DATA (push, NVC0_FIFO_PKHDR_SQ(NVC0_3D(QUERY_ADDRESS_HIGH), 4));859PUSH_DATAh(push, screen->fence.bo->offset);860PUSH_DATA (push, screen->fence.bo->offset);861PUSH_DATA (push, *sequence);862PUSH_DATA (push, NVC0_3D_QUERY_GET_FENCE | NVC0_3D_QUERY_GET_SHORT |863(0xf << NVC0_3D_QUERY_GET_UNIT__SHIFT));864}865866static u32867nvc0_screen_fence_update(struct pipe_screen *pscreen)868{869struct nvc0_screen *screen = nvc0_screen(pscreen);870return screen->fence.map[0];871}872873static int874nvc0_screen_init_compute(struct nvc0_screen *screen)875{876screen->base.base.get_compute_param = nvc0_screen_get_compute_param;877878switch (screen->base.device->chipset & ~0xf) {879case 0xc0:880case 0xd0:881return nvc0_screen_compute_setup(screen, screen->base.pushbuf);882case 0xe0:883case 0xf0:884case 0x100:885case 0x110:886case 0x120:887case 0x130:888case 0x140:889case 0x160:890return nve4_screen_compute_setup(screen, screen->base.pushbuf);891default:892return -1;893}894}895896static int897nvc0_screen_resize_tls_area(struct nvc0_screen *screen,898uint32_t lpos, uint32_t lneg, uint32_t cstack)899{900struct nouveau_bo *bo = NULL;901int ret;902uint64_t size = (lpos + lneg) * 32 + cstack;903904if (size >= (1 << 20)) {905NOUVEAU_ERR("requested TLS size too large: 0x%"PRIx64"\n", size);906return -1;907}908909size *= (screen->base.device->chipset >= 0xe0) ? 64 : 48; /* max warps */910size = align(size, 0x8000);911size *= screen->mp_count;912913size = align(size, 1 << 17);914915ret = nouveau_bo_new(screen->base.device, NV_VRAM_DOMAIN(&screen->base), 1 << 17, size,916NULL, &bo);917if (ret)918return ret;919920/* Make sure that the pushbuf has acquired a reference to the old tls921* segment, as it may have commands that will reference it.922*/923if (screen->tls)924PUSH_REFN(screen->base.pushbuf, screen->tls,925NV_VRAM_DOMAIN(&screen->base) | NOUVEAU_BO_RDWR);926nouveau_bo_ref(NULL, &screen->tls);927screen->tls = bo;928return 0;929}930931int932nvc0_screen_resize_text_area(struct nvc0_screen *screen, uint64_t size)933{934struct nouveau_pushbuf *push = screen->base.pushbuf;935struct nouveau_bo *bo;936int ret;937938ret = nouveau_bo_new(screen->base.device, NV_VRAM_DOMAIN(&screen->base),9391 << 17, size, NULL, &bo);940if (ret)941return ret;942943/* Make sure that the pushbuf has acquired a reference to the old text944* segment, as it may have commands that will reference it.945*/946if (screen->text)947PUSH_REFN(push, screen->text,948NV_VRAM_DOMAIN(&screen->base) | NOUVEAU_BO_RD);949nouveau_bo_ref(NULL, &screen->text);950screen->text = bo;951952nouveau_heap_destroy(&screen->lib_code);953nouveau_heap_destroy(&screen->text_heap);954955/* XXX: getting a page fault at the end of the code buffer every few956* launches, don't use the last 256 bytes to work around them - prefetch ?957*/958nouveau_heap_init(&screen->text_heap, 0, size - 0x100);959960/* update the code segment setup */961if (screen->eng3d->oclass < GV100_3D_CLASS) {962BEGIN_NVC0(push, NVC0_3D(CODE_ADDRESS_HIGH), 2);963PUSH_DATAh(push, screen->text->offset);964PUSH_DATA (push, screen->text->offset);965if (screen->compute) {966BEGIN_NVC0(push, NVC0_CP(CODE_ADDRESS_HIGH), 2);967PUSH_DATAh(push, screen->text->offset);968PUSH_DATA (push, screen->text->offset);969}970}971972return 0;973}974975void976nvc0_screen_bind_cb_3d(struct nvc0_screen *screen, bool *can_serialize,977int stage, int index, int size, uint64_t addr)978{979assert(stage != 5);980981struct nouveau_pushbuf *push = screen->base.pushbuf;982983if (screen->base.class_3d >= GM107_3D_CLASS) {984struct nvc0_cb_binding *binding = &screen->cb_bindings[stage][index];985986// TODO: Better figure out the conditions in which this is needed987bool serialize = binding->addr == addr && binding->size != size;988if (can_serialize)989serialize = serialize && *can_serialize;990if (serialize) {991IMMED_NVC0(push, NVC0_3D(SERIALIZE), 0);992if (can_serialize)993*can_serialize = false;994}995996binding->addr = addr;997binding->size = size;998}9991000if (size >= 0) {1001BEGIN_NVC0(push, NVC0_3D(CB_SIZE), 3);1002PUSH_DATA (push, size);1003PUSH_DATAh(push, addr);1004PUSH_DATA (push, addr);1005}1006IMMED_NVC0(push, NVC0_3D(CB_BIND(stage)), (index << 4) | (size >= 0));1007}10081009static const void *1010nvc0_screen_get_compiler_options(struct pipe_screen *pscreen,1011enum pipe_shader_ir ir,1012enum pipe_shader_type shader)1013{1014struct nvc0_screen *screen = nvc0_screen(pscreen);1015if (ir == PIPE_SHADER_IR_NIR)1016return nv50_ir_nir_shader_compiler_options(screen->base.device->chipset);1017return NULL;1018}10191020#define FAIL_SCREEN_INIT(str, err) \1021do { \1022NOUVEAU_ERR(str, err); \1023goto fail; \1024} while(0)10251026struct nouveau_screen *1027nvc0_screen_create(struct nouveau_device *dev)1028{1029struct nvc0_screen *screen;1030struct pipe_screen *pscreen;1031struct nouveau_object *chan;1032struct nouveau_pushbuf *push;1033uint64_t value;1034uint32_t obj_class;1035uint32_t flags;1036int ret;1037unsigned i;10381039switch (dev->chipset & ~0xf) {1040case 0xc0:1041case 0xd0:1042case 0xe0:1043case 0xf0:1044case 0x100:1045case 0x110:1046case 0x120:1047case 0x130:1048case 0x140:1049case 0x160:1050break;1051default:1052return NULL;1053}10541055screen = CALLOC_STRUCT(nvc0_screen);1056if (!screen)1057return NULL;1058pscreen = &screen->base.base;1059pscreen->destroy = nvc0_screen_destroy;10601061ret = nouveau_screen_init(&screen->base, dev);1062if (ret)1063FAIL_SCREEN_INIT("Base screen init failed: %d\n", ret);1064chan = screen->base.channel;1065push = screen->base.pushbuf;1066push->user_priv = screen;1067push->rsvd_kick = 5;10681069/* TODO: could this be higher on Kepler+? how does reclocking vs no1070* reclocking affect performance?1071* TODO: could this be higher on Fermi?1072*/1073if (dev->chipset >= 0xe0)1074screen->base.transfer_pushbuf_threshold = 1024;10751076screen->base.vidmem_bindings |= PIPE_BIND_CONSTANT_BUFFER |1077PIPE_BIND_SHADER_BUFFER |1078PIPE_BIND_VERTEX_BUFFER | PIPE_BIND_INDEX_BUFFER |1079PIPE_BIND_COMMAND_ARGS_BUFFER | PIPE_BIND_QUERY_BUFFER;1080screen->base.sysmem_bindings |=1081PIPE_BIND_VERTEX_BUFFER | PIPE_BIND_INDEX_BUFFER;10821083if (screen->base.vram_domain & NOUVEAU_BO_GART) {1084screen->base.sysmem_bindings |= screen->base.vidmem_bindings;1085screen->base.vidmem_bindings = 0;1086}10871088pscreen->context_create = nvc0_create;1089pscreen->is_format_supported = nvc0_screen_is_format_supported;1090pscreen->get_param = nvc0_screen_get_param;1091pscreen->get_shader_param = nvc0_screen_get_shader_param;1092pscreen->get_paramf = nvc0_screen_get_paramf;1093pscreen->get_sample_pixel_grid = nvc0_screen_get_sample_pixel_grid;1094pscreen->get_driver_query_info = nvc0_screen_get_driver_query_info;1095pscreen->get_driver_query_group_info = nvc0_screen_get_driver_query_group_info;1096/* nir stuff */1097pscreen->get_compiler_options = nvc0_screen_get_compiler_options;10981099nvc0_screen_init_resource_functions(pscreen);11001101screen->base.base.get_video_param = nouveau_vp3_screen_get_video_param;1102screen->base.base.is_video_format_supported = nouveau_vp3_screen_video_supported;11031104flags = NOUVEAU_BO_GART | NOUVEAU_BO_MAP;1105if (screen->base.drm->version >= 0x01000202)1106flags |= NOUVEAU_BO_COHERENT;11071108ret = nouveau_bo_new(dev, flags, 0, 4096, NULL, &screen->fence.bo);1109if (ret)1110FAIL_SCREEN_INIT("Error allocating fence BO: %d\n", ret);1111nouveau_bo_map(screen->fence.bo, 0, NULL);1112screen->fence.map = screen->fence.bo->map;1113screen->base.fence.emit = nvc0_screen_fence_emit;1114screen->base.fence.update = nvc0_screen_fence_update;11151116if (dev->chipset < 0x140) {1117ret = nouveau_object_new(chan, (dev->chipset < 0xe0) ? 0x1f906e : 0x906e,1118NVIF_CLASS_SW_GF100, NULL, 0, &screen->nvsw);1119if (ret)1120FAIL_SCREEN_INIT("Error creating SW object: %d\n", ret);11211122BEGIN_NVC0(push, SUBC_SW(NV01_SUBCHAN_OBJECT), 1);1123PUSH_DATA (push, screen->nvsw->handle);1124}11251126switch (dev->chipset & ~0xf) {1127case 0x160:1128case 0x140:1129case 0x130:1130case 0x120:1131case 0x110:1132case 0x100:1133case 0xf0:1134obj_class = NVF0_P2MF_CLASS;1135break;1136case 0xe0:1137obj_class = NVE4_P2MF_CLASS;1138break;1139default:1140obj_class = NVC0_M2MF_CLASS;1141break;1142}1143ret = nouveau_object_new(chan, 0xbeef323f, obj_class, NULL, 0,1144&screen->m2mf);1145if (ret)1146FAIL_SCREEN_INIT("Error allocating PGRAPH context for M2MF: %d\n", ret);11471148BEGIN_NVC0(push, SUBC_M2MF(NV01_SUBCHAN_OBJECT), 1);1149PUSH_DATA (push, screen->m2mf->oclass);1150if (screen->m2mf->oclass == NVE4_P2MF_CLASS) {1151BEGIN_NVC0(push, SUBC_COPY(NV01_SUBCHAN_OBJECT), 1);1152PUSH_DATA (push, NVE4_COPY_CLASS);1153}11541155ret = nouveau_object_new(chan, 0xbeef902d, NVC0_2D_CLASS, NULL, 0,1156&screen->eng2d);1157if (ret)1158FAIL_SCREEN_INIT("Error allocating PGRAPH context for 2D: %d\n", ret);11591160BEGIN_NVC0(push, SUBC_2D(NV01_SUBCHAN_OBJECT), 1);1161PUSH_DATA (push, screen->eng2d->oclass);1162BEGIN_NVC0(push, SUBC_2D(NVC0_2D_SINGLE_GPC), 1);1163PUSH_DATA (push, 0);1164BEGIN_NVC0(push, NVC0_2D(OPERATION), 1);1165PUSH_DATA (push, NV50_2D_OPERATION_SRCCOPY);1166BEGIN_NVC0(push, NVC0_2D(CLIP_ENABLE), 1);1167PUSH_DATA (push, 0);1168BEGIN_NVC0(push, NVC0_2D(COLOR_KEY_ENABLE), 1);1169PUSH_DATA (push, 0);1170BEGIN_NVC0(push, NVC0_2D(SET_PIXELS_FROM_MEMORY_CORRAL_SIZE), 1);1171PUSH_DATA (push, 0x3f);1172BEGIN_NVC0(push, NVC0_2D(SET_PIXELS_FROM_MEMORY_SAFE_OVERLAP), 1);1173PUSH_DATA (push, 1);1174BEGIN_NVC0(push, NVC0_2D(COND_MODE), 1);1175PUSH_DATA (push, NV50_2D_COND_MODE_ALWAYS);11761177BEGIN_NVC0(push, SUBC_2D(NVC0_GRAPH_NOTIFY_ADDRESS_HIGH), 2);1178PUSH_DATAh(push, screen->fence.bo->offset + 16);1179PUSH_DATA (push, screen->fence.bo->offset + 16);11801181switch (dev->chipset & ~0xf) {1182case 0x160:1183obj_class = TU102_3D_CLASS;1184break;1185case 0x140:1186obj_class = GV100_3D_CLASS;1187break;1188case 0x130:1189switch (dev->chipset) {1190case 0x130:1191case 0x13b:1192obj_class = GP100_3D_CLASS;1193break;1194default:1195obj_class = GP102_3D_CLASS;1196break;1197}1198break;1199case 0x120:1200obj_class = GM200_3D_CLASS;1201break;1202case 0x110:1203obj_class = GM107_3D_CLASS;1204break;1205case 0x100:1206case 0xf0:1207obj_class = NVF0_3D_CLASS;1208break;1209case 0xe0:1210switch (dev->chipset) {1211case 0xea:1212obj_class = NVEA_3D_CLASS;1213break;1214default:1215obj_class = NVE4_3D_CLASS;1216break;1217}1218break;1219case 0xd0:1220obj_class = NVC8_3D_CLASS;1221break;1222case 0xc0:1223default:1224switch (dev->chipset) {1225case 0xc8:1226obj_class = NVC8_3D_CLASS;1227break;1228case 0xc1:1229obj_class = NVC1_3D_CLASS;1230break;1231default:1232obj_class = NVC0_3D_CLASS;1233break;1234}1235break;1236}1237ret = nouveau_object_new(chan, 0xbeef003d, obj_class, NULL, 0,1238&screen->eng3d);1239if (ret)1240FAIL_SCREEN_INIT("Error allocating PGRAPH context for 3D: %d\n", ret);1241screen->base.class_3d = obj_class;12421243BEGIN_NVC0(push, SUBC_3D(NV01_SUBCHAN_OBJECT), 1);1244PUSH_DATA (push, screen->eng3d->oclass);12451246BEGIN_NVC0(push, NVC0_3D(COND_MODE), 1);1247PUSH_DATA (push, NVC0_3D_COND_MODE_ALWAYS);12481249if (debug_get_bool_option("NOUVEAU_SHADER_WATCHDOG", true)) {1250/* kill shaders after about 1 second (at 100 MHz) */1251BEGIN_NVC0(push, NVC0_3D(WATCHDOG_TIMER), 1);1252PUSH_DATA (push, 0x17);1253}12541255IMMED_NVC0(push, NVC0_3D(ZETA_COMP_ENABLE),1256screen->base.drm->version >= 0x01000101);1257BEGIN_NVC0(push, NVC0_3D(RT_COMP_ENABLE(0)), 8);1258for (i = 0; i < 8; ++i)1259PUSH_DATA(push, screen->base.drm->version >= 0x01000101);12601261BEGIN_NVC0(push, NVC0_3D(RT_CONTROL), 1);1262PUSH_DATA (push, 1);12631264BEGIN_NVC0(push, NVC0_3D(CSAA_ENABLE), 1);1265PUSH_DATA (push, 0);1266BEGIN_NVC0(push, NVC0_3D(MULTISAMPLE_ENABLE), 1);1267PUSH_DATA (push, 0);1268BEGIN_NVC0(push, NVC0_3D(MULTISAMPLE_MODE), 1);1269PUSH_DATA (push, NVC0_3D_MULTISAMPLE_MODE_MS1);1270BEGIN_NVC0(push, NVC0_3D(MULTISAMPLE_CTRL), 1);1271PUSH_DATA (push, 0);1272BEGIN_NVC0(push, NVC0_3D(LINE_WIDTH_SEPARATE), 1);1273PUSH_DATA (push, 1);1274BEGIN_NVC0(push, NVC0_3D(PRIM_RESTART_WITH_DRAW_ARRAYS), 1);1275PUSH_DATA (push, 1);1276BEGIN_NVC0(push, NVC0_3D(BLEND_SEPARATE_ALPHA), 1);1277PUSH_DATA (push, 1);1278BEGIN_NVC0(push, NVC0_3D(BLEND_ENABLE_COMMON), 1);1279PUSH_DATA (push, 0);1280BEGIN_NVC0(push, NVC0_3D(SHADE_MODEL), 1);1281PUSH_DATA (push, NVC0_3D_SHADE_MODEL_SMOOTH);1282if (screen->eng3d->oclass < NVE4_3D_CLASS) {1283IMMED_NVC0(push, NVC0_3D(TEX_MISC), 0);1284} else {1285BEGIN_NVC0(push, NVE4_3D(TEX_CB_INDEX), 1);1286PUSH_DATA (push, 15);1287}1288BEGIN_NVC0(push, NVC0_3D(CALL_LIMIT_LOG), 1);1289PUSH_DATA (push, 8); /* 128 */1290BEGIN_NVC0(push, NVC0_3D(ZCULL_STATCTRS_ENABLE), 1);1291PUSH_DATA (push, 1);1292if (screen->eng3d->oclass >= NVC1_3D_CLASS) {1293BEGIN_NVC0(push, NVC0_3D(CACHE_SPLIT), 1);1294PUSH_DATA (push, NVC0_3D_CACHE_SPLIT_48K_SHARED_16K_L1);1295}12961297nvc0_magic_3d_init(push, screen->eng3d->oclass);12981299ret = nvc0_screen_resize_text_area(screen, 1 << 19);1300if (ret)1301FAIL_SCREEN_INIT("Error allocating TEXT area: %d\n", ret);13021303/* 6 user uniform areas, 6 driver areas, and 1 for the runout */1304ret = nouveau_bo_new(dev, NV_VRAM_DOMAIN(&screen->base), 1 << 12, 13 << 16, NULL,1305&screen->uniform_bo);1306if (ret)1307FAIL_SCREEN_INIT("Error allocating uniform BO: %d\n", ret);13081309PUSH_REFN (push, screen->uniform_bo, NV_VRAM_DOMAIN(&screen->base) | NOUVEAU_BO_WR);13101311/* return { 0.0, 0.0, 0.0, 0.0 } for out-of-bounds vtxbuf access */1312BEGIN_NVC0(push, NVC0_3D(CB_SIZE), 3);1313PUSH_DATA (push, 256);1314PUSH_DATAh(push, screen->uniform_bo->offset + NVC0_CB_AUX_RUNOUT_INFO);1315PUSH_DATA (push, screen->uniform_bo->offset + NVC0_CB_AUX_RUNOUT_INFO);1316BEGIN_1IC0(push, NVC0_3D(CB_POS), 5);1317PUSH_DATA (push, 0);1318PUSH_DATAf(push, 0.0f);1319PUSH_DATAf(push, 0.0f);1320PUSH_DATAf(push, 0.0f);1321PUSH_DATAf(push, 0.0f);1322BEGIN_NVC0(push, NVC0_3D(VERTEX_RUNOUT_ADDRESS_HIGH), 2);1323PUSH_DATAh(push, screen->uniform_bo->offset + NVC0_CB_AUX_RUNOUT_INFO);1324PUSH_DATA (push, screen->uniform_bo->offset + NVC0_CB_AUX_RUNOUT_INFO);13251326if (screen->base.drm->version >= 0x01000101) {1327ret = nouveau_getparam(dev, NOUVEAU_GETPARAM_GRAPH_UNITS, &value);1328if (ret)1329FAIL_SCREEN_INIT("NOUVEAU_GETPARAM_GRAPH_UNITS failed: %d\n", ret);1330} else {1331if (dev->chipset >= 0xe0 && dev->chipset < 0xf0)1332value = (8 << 8) | 4;1333else1334value = (16 << 8) | 4;1335}1336screen->gpc_count = value & 0x000000ff;1337screen->mp_count = value >> 8;1338screen->mp_count_compute = screen->mp_count;13391340ret = nvc0_screen_resize_tls_area(screen, 128 * 16, 0, 0x200);1341if (ret)1342FAIL_SCREEN_INIT("Error allocating TLS area: %d\n", ret);13431344BEGIN_NVC0(push, NVC0_3D(TEMP_ADDRESS_HIGH), 4);1345PUSH_DATAh(push, screen->tls->offset);1346PUSH_DATA (push, screen->tls->offset);1347PUSH_DATA (push, screen->tls->size >> 32);1348PUSH_DATA (push, screen->tls->size);1349BEGIN_NVC0(push, NVC0_3D(WARP_TEMP_ALLOC), 1);1350PUSH_DATA (push, 0);1351/* Reduce likelihood of collision with real buffers by placing the hole at1352* the top of the 4G area. This will have to be dealt with for real1353* eventually by blocking off that area from the VM.1354*/1355BEGIN_NVC0(push, NVC0_3D(LOCAL_BASE), 1);1356PUSH_DATA (push, 0xff << 24);13571358if (screen->eng3d->oclass < GM107_3D_CLASS) {1359ret = nouveau_bo_new(dev, NV_VRAM_DOMAIN(&screen->base), 1 << 17, 1 << 20, NULL,1360&screen->poly_cache);1361if (ret)1362FAIL_SCREEN_INIT("Error allocating poly cache BO: %d\n", ret);13631364BEGIN_NVC0(push, NVC0_3D(VERTEX_QUARANTINE_ADDRESS_HIGH), 3);1365PUSH_DATAh(push, screen->poly_cache->offset);1366PUSH_DATA (push, screen->poly_cache->offset);1367PUSH_DATA (push, 3);1368}13691370ret = nouveau_bo_new(dev, NV_VRAM_DOMAIN(&screen->base), 1 << 17, 1 << 17, NULL,1371&screen->txc);1372if (ret)1373FAIL_SCREEN_INIT("Error allocating txc BO: %d\n", ret);13741375BEGIN_NVC0(push, NVC0_3D(TIC_ADDRESS_HIGH), 3);1376PUSH_DATAh(push, screen->txc->offset);1377PUSH_DATA (push, screen->txc->offset);1378PUSH_DATA (push, NVC0_TIC_MAX_ENTRIES - 1);1379if (screen->eng3d->oclass >= GM107_3D_CLASS) {1380screen->tic.maxwell = true;1381if (screen->eng3d->oclass == GM107_3D_CLASS) {1382screen->tic.maxwell =1383debug_get_bool_option("NOUVEAU_MAXWELL_TIC", true);1384IMMED_NVC0(push, SUBC_3D(0x0f10), screen->tic.maxwell);1385}1386}13871388BEGIN_NVC0(push, NVC0_3D(TSC_ADDRESS_HIGH), 3);1389PUSH_DATAh(push, screen->txc->offset + 65536);1390PUSH_DATA (push, screen->txc->offset + 65536);1391PUSH_DATA (push, NVC0_TSC_MAX_ENTRIES - 1);13921393BEGIN_NVC0(push, NVC0_3D(SCREEN_Y_CONTROL), 1);1394PUSH_DATA (push, 0);1395BEGIN_NVC0(push, NVC0_3D(WINDOW_OFFSET_X), 2);1396PUSH_DATA (push, 0);1397PUSH_DATA (push, 0);1398BEGIN_NVC0(push, NVC0_3D(ZCULL_REGION), 1); /* deactivate ZCULL */1399PUSH_DATA (push, 0x3f);14001401BEGIN_NVC0(push, NVC0_3D(CLIP_RECTS_MODE), 1);1402PUSH_DATA (push, NVC0_3D_CLIP_RECTS_MODE_INSIDE_ANY);1403BEGIN_NVC0(push, NVC0_3D(CLIP_RECT_HORIZ(0)), 8 * 2);1404for (i = 0; i < 8 * 2; ++i)1405PUSH_DATA(push, 0);1406BEGIN_NVC0(push, NVC0_3D(CLIP_RECTS_EN), 1);1407PUSH_DATA (push, 0);1408BEGIN_NVC0(push, NVC0_3D(CLIPID_ENABLE), 1);1409PUSH_DATA (push, 0);14101411/* neither scissors, viewport nor stencil mask should affect clears */1412BEGIN_NVC0(push, NVC0_3D(CLEAR_FLAGS), 1);1413PUSH_DATA (push, 0);14141415BEGIN_NVC0(push, NVC0_3D(VIEWPORT_TRANSFORM_EN), 1);1416PUSH_DATA (push, 1);1417for (i = 0; i < NVC0_MAX_VIEWPORTS; i++) {1418BEGIN_NVC0(push, NVC0_3D(DEPTH_RANGE_NEAR(i)), 2);1419PUSH_DATAf(push, 0.0f);1420PUSH_DATAf(push, 1.0f);1421}1422BEGIN_NVC0(push, NVC0_3D(VIEW_VOLUME_CLIP_CTRL), 1);1423PUSH_DATA (push, NVC0_3D_VIEW_VOLUME_CLIP_CTRL_UNK1_UNK1);14241425/* We use scissors instead of exact view volume clipping,1426* so they're always enabled.1427*/1428for (i = 0; i < NVC0_MAX_VIEWPORTS; i++) {1429BEGIN_NVC0(push, NVC0_3D(SCISSOR_ENABLE(i)), 3);1430PUSH_DATA (push, 1);1431PUSH_DATA (push, 16384 << 16);1432PUSH_DATA (push, 16384 << 16);1433}14341435if (screen->eng3d->oclass < TU102_3D_CLASS) {1436#define MK_MACRO(m, n) i = nvc0_graph_set_macro(screen, m, i, sizeof(n), n);14371438i = 0;1439MK_MACRO(NVC0_3D_MACRO_VERTEX_ARRAY_PER_INSTANCE, mme9097_per_instance_bf);1440MK_MACRO(NVC0_3D_MACRO_BLEND_ENABLES, mme9097_blend_enables);1441MK_MACRO(NVC0_3D_MACRO_VERTEX_ARRAY_SELECT, mme9097_vertex_array_select);1442MK_MACRO(NVC0_3D_MACRO_TEP_SELECT, mme9097_tep_select);1443MK_MACRO(NVC0_3D_MACRO_GP_SELECT, mme9097_gp_select);1444MK_MACRO(NVC0_3D_MACRO_POLYGON_MODE_FRONT, mme9097_poly_mode_front);1445MK_MACRO(NVC0_3D_MACRO_POLYGON_MODE_BACK, mme9097_poly_mode_back);1446MK_MACRO(NVC0_3D_MACRO_DRAW_ARRAYS_INDIRECT, mme9097_draw_arrays_indirect);1447MK_MACRO(NVC0_3D_MACRO_DRAW_ELEMENTS_INDIRECT, mme9097_draw_elts_indirect);1448MK_MACRO(NVC0_3D_MACRO_DRAW_ARRAYS_INDIRECT_COUNT, mme9097_draw_arrays_indirect_count);1449MK_MACRO(NVC0_3D_MACRO_DRAW_ELEMENTS_INDIRECT_COUNT, mme9097_draw_elts_indirect_count);1450MK_MACRO(NVC0_3D_MACRO_QUERY_BUFFER_WRITE, mme9097_query_buffer_write);1451MK_MACRO(NVC0_3D_MACRO_CONSERVATIVE_RASTER_STATE, mme9097_conservative_raster_state);1452MK_MACRO(NVC0_3D_MACRO_COMPUTE_COUNTER, mme9097_compute_counter);1453MK_MACRO(NVC0_3D_MACRO_COMPUTE_COUNTER_TO_QUERY, mme9097_compute_counter_to_query);1454MK_MACRO(NVC0_CP_MACRO_LAUNCH_GRID_INDIRECT, mme90c0_launch_grid_indirect);1455} else {1456#undef MK_MACRO1457#define MK_MACRO(m, n) i = tu102_graph_set_macro(screen, m, i, sizeof(n), n);14581459i = 0;1460MK_MACRO(NVC0_3D_MACRO_VERTEX_ARRAY_PER_INSTANCE, mmec597_per_instance_bf);1461MK_MACRO(NVC0_3D_MACRO_BLEND_ENABLES, mmec597_blend_enables);1462MK_MACRO(NVC0_3D_MACRO_VERTEX_ARRAY_SELECT, mmec597_vertex_array_select);1463MK_MACRO(NVC0_3D_MACRO_TEP_SELECT, mmec597_tep_select);1464MK_MACRO(NVC0_3D_MACRO_GP_SELECT, mmec597_gp_select);1465MK_MACRO(NVC0_3D_MACRO_POLYGON_MODE_FRONT, mmec597_poly_mode_front);1466MK_MACRO(NVC0_3D_MACRO_POLYGON_MODE_BACK, mmec597_poly_mode_back);1467MK_MACRO(NVC0_3D_MACRO_DRAW_ARRAYS_INDIRECT, mmec597_draw_arrays_indirect);1468MK_MACRO(NVC0_3D_MACRO_DRAW_ELEMENTS_INDIRECT, mmec597_draw_elts_indirect);1469MK_MACRO(NVC0_3D_MACRO_DRAW_ARRAYS_INDIRECT_COUNT, mmec597_draw_arrays_indirect_count);1470MK_MACRO(NVC0_3D_MACRO_DRAW_ELEMENTS_INDIRECT_COUNT, mmec597_draw_elts_indirect_count);1471MK_MACRO(NVC0_3D_MACRO_QUERY_BUFFER_WRITE, mmec597_query_buffer_write);1472MK_MACRO(NVC0_3D_MACRO_CONSERVATIVE_RASTER_STATE, mmec597_conservative_raster_state);1473MK_MACRO(NVC0_3D_MACRO_COMPUTE_COUNTER, mmec597_compute_counter);1474MK_MACRO(NVC0_3D_MACRO_COMPUTE_COUNTER_TO_QUERY, mmec597_compute_counter_to_query);1475}14761477BEGIN_NVC0(push, NVC0_3D(RASTERIZE_ENABLE), 1);1478PUSH_DATA (push, 1);1479BEGIN_NVC0(push, NVC0_3D(RT_SEPARATE_FRAG_DATA), 1);1480PUSH_DATA (push, 1);1481BEGIN_NVC0(push, NVC0_3D(MACRO_GP_SELECT), 1);1482PUSH_DATA (push, 0x40);1483BEGIN_NVC0(push, NVC0_3D(LAYER), 1);1484PUSH_DATA (push, 0);1485BEGIN_NVC0(push, NVC0_3D(MACRO_TEP_SELECT), 1);1486PUSH_DATA (push, 0x30);1487BEGIN_NVC0(push, NVC0_3D(PATCH_VERTICES), 1);1488PUSH_DATA (push, 3);1489BEGIN_NVC0(push, NVC0_3D(SP_SELECT(2)), 1);1490PUSH_DATA (push, 0x20);1491BEGIN_NVC0(push, NVC0_3D(SP_SELECT(0)), 1);1492PUSH_DATA (push, 0x00);1493screen->save_state.patch_vertices = 3;14941495BEGIN_NVC0(push, NVC0_3D(POINT_COORD_REPLACE), 1);1496PUSH_DATA (push, 0);1497BEGIN_NVC0(push, NVC0_3D(POINT_RASTER_RULES), 1);1498PUSH_DATA (push, NVC0_3D_POINT_RASTER_RULES_OGL);14991500IMMED_NVC0(push, NVC0_3D(EDGEFLAG), 1);15011502if (nvc0_screen_init_compute(screen))1503goto fail;15041505/* XXX: Compute and 3D are somehow aliased on Fermi. */1506for (i = 0; i < 5; ++i) {1507unsigned j = 0;1508for (j = 0; j < 16; j++)1509screen->cb_bindings[i][j].size = -1;15101511/* TIC and TSC entries for each unit (nve4+ only) */1512/* auxiliary constants (6 user clip planes, base instance id) */1513nvc0_screen_bind_cb_3d(screen, NULL, i, 15, NVC0_CB_AUX_SIZE,1514screen->uniform_bo->offset + NVC0_CB_AUX_INFO(i));1515if (screen->eng3d->oclass >= NVE4_3D_CLASS) {1516unsigned j;1517BEGIN_1IC0(push, NVC0_3D(CB_POS), 9);1518PUSH_DATA (push, NVC0_CB_AUX_UNK_INFO);1519for (j = 0; j < 8; ++j)1520PUSH_DATA(push, j);1521} else {1522BEGIN_NVC0(push, NVC0_3D(TEX_LIMITS(i)), 1);1523PUSH_DATA (push, 0x54);1524}15251526/* MS sample coordinate offsets: these do not work with _ALT modes ! */1527BEGIN_1IC0(push, NVC0_3D(CB_POS), 1 + 2 * 8);1528PUSH_DATA (push, NVC0_CB_AUX_MS_INFO);1529PUSH_DATA (push, 0); /* 0 */1530PUSH_DATA (push, 0);1531PUSH_DATA (push, 1); /* 1 */1532PUSH_DATA (push, 0);1533PUSH_DATA (push, 0); /* 2 */1534PUSH_DATA (push, 1);1535PUSH_DATA (push, 1); /* 3 */1536PUSH_DATA (push, 1);1537PUSH_DATA (push, 2); /* 4 */1538PUSH_DATA (push, 0);1539PUSH_DATA (push, 3); /* 5 */1540PUSH_DATA (push, 0);1541PUSH_DATA (push, 2); /* 6 */1542PUSH_DATA (push, 1);1543PUSH_DATA (push, 3); /* 7 */1544PUSH_DATA (push, 1);1545}1546BEGIN_NVC0(push, NVC0_3D(LINKED_TSC), 1);1547PUSH_DATA (push, 0);15481549PUSH_KICK (push);15501551screen->tic.entries = CALLOC(1552NVC0_TIC_MAX_ENTRIES + NVC0_TSC_MAX_ENTRIES + NVE4_IMG_MAX_HANDLES,1553sizeof(void *));1554screen->tsc.entries = screen->tic.entries + NVC0_TIC_MAX_ENTRIES;1555screen->img.entries = (void *)(screen->tsc.entries + NVC0_TSC_MAX_ENTRIES);15561557if (!nvc0_blitter_create(screen))1558goto fail;15591560nouveau_fence_new(&screen->base, &screen->base.fence.current);15611562return &screen->base;15631564fail:1565screen->base.base.context_create = NULL;1566return &screen->base;1567}15681569int1570nvc0_screen_tic_alloc(struct nvc0_screen *screen, void *entry)1571{1572int i = screen->tic.next;15731574while (screen->tic.lock[i / 32] & (1 << (i % 32)))1575i = (i + 1) & (NVC0_TIC_MAX_ENTRIES - 1);15761577screen->tic.next = (i + 1) & (NVC0_TIC_MAX_ENTRIES - 1);15781579if (screen->tic.entries[i])1580nv50_tic_entry(screen->tic.entries[i])->id = -1;15811582screen->tic.entries[i] = entry;1583return i;1584}15851586int1587nvc0_screen_tsc_alloc(struct nvc0_screen *screen, void *entry)1588{1589int i = screen->tsc.next;15901591while (screen->tsc.lock[i / 32] & (1 << (i % 32)))1592i = (i + 1) & (NVC0_TSC_MAX_ENTRIES - 1);15931594screen->tsc.next = (i + 1) & (NVC0_TSC_MAX_ENTRIES - 1);15951596if (screen->tsc.entries[i])1597nv50_tsc_entry(screen->tsc.entries[i])->id = -1;15981599screen->tsc.entries[i] = entry;1600return i;1601}160216031604