Path: blob/21.2-virgl/src/gallium/drivers/nouveau/nouveau_screen.c
4570 views
#include "pipe/p_defines.h"1#include "pipe/p_screen.h"2#include "pipe/p_state.h"34#include "util/u_memory.h"5#include "util/u_inlines.h"6#include "util/format/u_format.h"7#include "util/format/u_format_s3tc.h"8#include "util/u_string.h"910#include "os/os_mman.h"11#include "util/os_time.h"1213#include <stdio.h>14#include <errno.h>15#include <stdlib.h>1617#include <nouveau_drm.h>18#include <xf86drm.h>1920#include "nouveau_winsys.h"21#include "nouveau_screen.h"22#include "nouveau_context.h"23#include "nouveau_fence.h"24#include "nouveau_mm.h"25#include "nouveau_buffer.h"2627#include <compiler/glsl_types.h>2829/* XXX this should go away */30#include "frontend/drm_driver.h"3132/* Even though GPUs might allow addresses with more bits, some engines do not.33* Stick with 40 for compatibility.34*/35#define NV_GENERIC_VM_LIMIT_SHIFT 393637int nouveau_mesa_debug = 0;3839static const char *40nouveau_screen_get_name(struct pipe_screen *pscreen)41{42struct nouveau_screen *screen = nouveau_screen(pscreen);43return screen->chipset_name;44}4546static const char *47nouveau_screen_get_vendor(struct pipe_screen *pscreen)48{49return "nouveau";50}5152static const char *53nouveau_screen_get_device_vendor(struct pipe_screen *pscreen)54{55return "NVIDIA";56}5758static uint64_t59nouveau_screen_get_timestamp(struct pipe_screen *pscreen)60{61int64_t cpu_time = os_time_get() * 1000;6263/* getparam of PTIMER_TIME takes about x10 as long (several usecs) */6465return cpu_time + nouveau_screen(pscreen)->cpu_gpu_time_delta;66}6768static struct disk_cache *69nouveau_screen_get_disk_shader_cache(struct pipe_screen *pscreen)70{71return nouveau_screen(pscreen)->disk_shader_cache;72}7374static void75nouveau_screen_fence_ref(struct pipe_screen *pscreen,76struct pipe_fence_handle **ptr,77struct pipe_fence_handle *pfence)78{79nouveau_fence_ref(nouveau_fence(pfence), (struct nouveau_fence **)ptr);80}8182static bool83nouveau_screen_fence_finish(struct pipe_screen *screen,84struct pipe_context *ctx,85struct pipe_fence_handle *pfence,86uint64_t timeout)87{88if (!timeout)89return nouveau_fence_signalled(nouveau_fence(pfence));9091return nouveau_fence_wait(nouveau_fence(pfence), NULL);92}939495struct nouveau_bo *96nouveau_screen_bo_from_handle(struct pipe_screen *pscreen,97struct winsys_handle *whandle,98unsigned *out_stride)99{100struct nouveau_device *dev = nouveau_screen(pscreen)->device;101struct nouveau_bo *bo = 0;102int ret;103104if (whandle->offset != 0) {105debug_printf("%s: attempt to import unsupported winsys offset %d\n",106__FUNCTION__, whandle->offset);107return NULL;108}109110if (whandle->type != WINSYS_HANDLE_TYPE_SHARED &&111whandle->type != WINSYS_HANDLE_TYPE_FD) {112debug_printf("%s: attempt to import unsupported handle type %d\n",113__FUNCTION__, whandle->type);114return NULL;115}116117if (whandle->type == WINSYS_HANDLE_TYPE_SHARED)118ret = nouveau_bo_name_ref(dev, whandle->handle, &bo);119else120ret = nouveau_bo_prime_handle_ref(dev, whandle->handle, &bo);121122if (ret) {123debug_printf("%s: ref name 0x%08x failed with %d\n",124__FUNCTION__, whandle->handle, ret);125return NULL;126}127128*out_stride = whandle->stride;129return bo;130}131132133bool134nouveau_screen_bo_get_handle(struct pipe_screen *pscreen,135struct nouveau_bo *bo,136unsigned stride,137struct winsys_handle *whandle)138{139whandle->stride = stride;140141if (whandle->type == WINSYS_HANDLE_TYPE_SHARED) {142return nouveau_bo_name_get(bo, &whandle->handle) == 0;143} else if (whandle->type == WINSYS_HANDLE_TYPE_KMS) {144whandle->handle = bo->handle;145return true;146} else if (whandle->type == WINSYS_HANDLE_TYPE_FD) {147return nouveau_bo_set_prime(bo, (int *)&whandle->handle) == 0;148} else {149return false;150}151}152153static void154nouveau_disk_cache_create(struct nouveau_screen *screen)155{156struct mesa_sha1 ctx;157unsigned char sha1[20];158char cache_id[20 * 2 + 1];159uint64_t driver_flags = 0;160161_mesa_sha1_init(&ctx);162if (!disk_cache_get_function_identifier(nouveau_disk_cache_create,163&ctx))164return;165166_mesa_sha1_final(&ctx, sha1);167disk_cache_format_hex_id(cache_id, sha1, 20 * 2);168169if (screen->prefer_nir)170driver_flags |= NOUVEAU_SHADER_CACHE_FLAGS_IR_NIR;171else172driver_flags |= NOUVEAU_SHADER_CACHE_FLAGS_IR_TGSI;173174screen->disk_shader_cache =175disk_cache_create(nouveau_screen_get_name(&screen->base),176cache_id, driver_flags);177}178179static void*180reserve_vma(uintptr_t start, uint64_t reserved_size)181{182void *reserved = os_mmap((void*)start, reserved_size, PROT_NONE,183MAP_ANONYMOUS | MAP_PRIVATE, -1, 0);184if (reserved == MAP_FAILED)185return NULL;186return reserved;187}188189int190nouveau_screen_init(struct nouveau_screen *screen, struct nouveau_device *dev)191{192struct pipe_screen *pscreen = &screen->base;193struct nv04_fifo nv04_data = { .vram = 0xbeef0201, .gart = 0xbeef0202 };194struct nvc0_fifo nvc0_data = { };195uint64_t time;196int size, ret;197void *data;198union nouveau_bo_config mm_config;199200char *nv_dbg = getenv("NOUVEAU_MESA_DEBUG");201if (nv_dbg)202nouveau_mesa_debug = atoi(nv_dbg);203204if (dev->chipset < 0x140)205screen->prefer_nir = debug_get_bool_option("NV50_PROG_USE_NIR", false);206else207screen->prefer_nir = true;208209screen->force_enable_cl = debug_get_bool_option("NOUVEAU_ENABLE_CL", false);210if (screen->force_enable_cl)211glsl_type_singleton_init_or_ref();212213/* These must be set before any failure is possible, as the cleanup214* paths assume they're responsible for deleting them.215*/216screen->drm = nouveau_drm(&dev->object);217screen->device = dev;218219/*220* this is initialized to 1 in nouveau_drm_screen_create after screen221* is fully constructed and added to the global screen list.222*/223screen->refcount = -1;224225if (dev->chipset < 0xc0) {226data = &nv04_data;227size = sizeof(nv04_data);228} else {229data = &nvc0_data;230size = sizeof(nvc0_data);231}232233bool enable_svm = debug_get_bool_option("NOUVEAU_SVM", false);234screen->has_svm = false;235/* we only care about HMM with OpenCL enabled */236if (dev->chipset > 0x130 && screen->force_enable_cl && enable_svm) {237/* Before being able to enable SVM we need to carve out some memory for238* driver bo allocations. Let's just base the size on the available VRAM.239*240* 40 bit is the biggest we care about and for 32 bit systems we don't241* want to allocate all of the available memory either.242*243* Also we align the size we want to reserve to the next POT to make use244* of hugepages.245*/246const int vram_shift = util_logbase2_ceil64(dev->vram_size);247const int limit_bit =248MIN2(sizeof(void*) * 8 - 1, NV_GENERIC_VM_LIMIT_SHIFT);249screen->svm_cutout_size =250BITFIELD64_BIT(MIN2(sizeof(void*) == 4 ? 26 : NV_GENERIC_VM_LIMIT_SHIFT, vram_shift));251252size_t start = screen->svm_cutout_size;253do {254screen->svm_cutout = reserve_vma(start, screen->svm_cutout_size);255if (!screen->svm_cutout) {256start += screen->svm_cutout_size;257continue;258}259260struct drm_nouveau_svm_init svm_args = {261.unmanaged_addr = (uintptr_t)screen->svm_cutout,262.unmanaged_size = screen->svm_cutout_size,263};264265ret = drmCommandWrite(screen->drm->fd, DRM_NOUVEAU_SVM_INIT,266&svm_args, sizeof(svm_args));267screen->has_svm = !ret;268if (!screen->has_svm)269os_munmap(screen->svm_cutout, screen->svm_cutout_size);270break;271} while ((start + screen->svm_cutout_size) < BITFIELD64_MASK(limit_bit));272}273274switch (dev->chipset) {275case 0x0ea: /* TK1, GK20A */276case 0x12b: /* TX1, GM20B */277case 0x13b: /* TX2, GP10B */278screen->tegra_sector_layout = true;279break;280default:281/* Xavier's GPU and everything else */282screen->tegra_sector_layout = false;283break;284}285286/*287* Set default VRAM domain if not overridden288*/289if (!screen->vram_domain) {290if (dev->vram_size > 0)291screen->vram_domain = NOUVEAU_BO_VRAM;292else293screen->vram_domain = NOUVEAU_BO_GART;294}295296ret = nouveau_object_new(&dev->object, 0, NOUVEAU_FIFO_CHANNEL_CLASS,297data, size, &screen->channel);298if (ret)299goto err;300301ret = nouveau_client_new(screen->device, &screen->client);302if (ret)303goto err;304ret = nouveau_pushbuf_new(screen->client, screen->channel,3054, 512 * 1024, 1,306&screen->pushbuf);307if (ret)308goto err;309310/* getting CPU time first appears to be more accurate */311screen->cpu_gpu_time_delta = os_time_get();312313ret = nouveau_getparam(dev, NOUVEAU_GETPARAM_PTIMER_TIME, &time);314if (!ret)315screen->cpu_gpu_time_delta = time - screen->cpu_gpu_time_delta * 1000;316317snprintf(screen->chipset_name, sizeof(screen->chipset_name), "NV%02X", dev->chipset);318pscreen->get_name = nouveau_screen_get_name;319pscreen->get_vendor = nouveau_screen_get_vendor;320pscreen->get_device_vendor = nouveau_screen_get_device_vendor;321pscreen->get_disk_shader_cache = nouveau_screen_get_disk_shader_cache;322323pscreen->get_timestamp = nouveau_screen_get_timestamp;324325pscreen->fence_reference = nouveau_screen_fence_ref;326pscreen->fence_finish = nouveau_screen_fence_finish;327328nouveau_disk_cache_create(screen);329330screen->transfer_pushbuf_threshold = 192;331screen->lowmem_bindings = PIPE_BIND_GLOBAL; /* gallium limit */332screen->vidmem_bindings =333PIPE_BIND_RENDER_TARGET | PIPE_BIND_DEPTH_STENCIL |334PIPE_BIND_DISPLAY_TARGET | PIPE_BIND_SCANOUT |335PIPE_BIND_CURSOR |336PIPE_BIND_SAMPLER_VIEW |337PIPE_BIND_SHADER_BUFFER | PIPE_BIND_SHADER_IMAGE |338PIPE_BIND_COMPUTE_RESOURCE |339PIPE_BIND_GLOBAL;340screen->sysmem_bindings =341PIPE_BIND_SAMPLER_VIEW | PIPE_BIND_STREAM_OUTPUT |342PIPE_BIND_COMMAND_ARGS_BUFFER;343344memset(&mm_config, 0, sizeof(mm_config));345346screen->mm_GART = nouveau_mm_create(dev,347NOUVEAU_BO_GART | NOUVEAU_BO_MAP,348&mm_config);349screen->mm_VRAM = nouveau_mm_create(dev, NOUVEAU_BO_VRAM, &mm_config);350return 0;351352err:353if (screen->svm_cutout)354os_munmap(screen->svm_cutout, screen->svm_cutout_size);355return ret;356}357358void359nouveau_screen_fini(struct nouveau_screen *screen)360{361int fd = screen->drm->fd;362363if (screen->force_enable_cl)364glsl_type_singleton_decref();365if (screen->has_svm)366os_munmap(screen->svm_cutout, screen->svm_cutout_size);367368nouveau_mm_destroy(screen->mm_GART);369nouveau_mm_destroy(screen->mm_VRAM);370371nouveau_pushbuf_del(&screen->pushbuf);372373nouveau_client_del(&screen->client);374nouveau_object_del(&screen->channel);375376nouveau_device_del(&screen->device);377nouveau_drm_del(&screen->drm);378close(fd);379380disk_cache_destroy(screen->disk_shader_cache);381}382383static void384nouveau_set_debug_callback(struct pipe_context *pipe,385const struct pipe_debug_callback *cb)386{387struct nouveau_context *context = nouveau_context(pipe);388389if (cb)390context->debug = *cb;391else392memset(&context->debug, 0, sizeof(context->debug));393}394395void396nouveau_context_init(struct nouveau_context *context)397{398context->pipe.set_debug_callback = nouveau_set_debug_callback;399}400401402