Path: blob/21.2-virgl/src/gallium/winsys/virgl/drm/virgl_drm_winsys.c
4566 views
/*1* Copyright 2014, 2015 Red Hat.2*3* Permission is hereby granted, free of charge, to any person obtaining a4* copy of this software and associated documentation files (the "Software"),5* to deal in the Software without restriction, including without limitation6* on the rights to use, copy, modify, merge, publish, distribute, sub7* license, and/or sell copies of the Software, and to permit persons to whom8* the Software is furnished to do so, subject to the following conditions:9*10* The above copyright notice and this permission notice (including the next11* paragraph) shall be included in all copies or substantial portions of the12* Software.13*14* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR15* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,16* FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT. IN NO EVENT SHALL17* THE AUTHOR(S) AND/OR THEIR SUPPLIERS BE LIABLE FOR ANY CLAIM,18* DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR19* OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE20* USE OR OTHER DEALINGS IN THE SOFTWARE.21*/2223#include <errno.h>24#include <fcntl.h>25#include <limits.h>26#include <stdio.h>27#include <sys/ioctl.h>28#include <sys/stat.h>2930#include "os/os_mman.h"31#include "util/os_file.h"32#include "util/os_time.h"33#include "util/u_memory.h"34#include "util/format/u_format.h"35#include "util/u_hash_table.h"36#include "util/u_inlines.h"37#include "util/u_pointer.h"38#include "frontend/drm_driver.h"39#include "virgl/virgl_screen.h"40#include "virgl/virgl_public.h"41#include "virtio-gpu/virgl_protocol.h"4243#include <xf86drm.h>44#include <libsync.h>45#include "drm-uapi/virtgpu_drm.h"4647#include "virgl_drm_winsys.h"48#include "virgl_drm_public.h"495051#define VIRGL_DRM_VERSION(major, minor) ((major) << 16 | (minor))52#define VIRGL_DRM_VERSION_FENCE_FD VIRGL_DRM_VERSION(0, 1)5354/* Gets a pointer to the virgl_hw_res containing the pointed to cache entry. */55#define cache_entry_container_res(ptr) \56(struct virgl_hw_res*)((char*)ptr - offsetof(struct virgl_hw_res, cache_entry))5758static inline boolean can_cache_resource(uint32_t bind)59{60return bind == VIRGL_BIND_CONSTANT_BUFFER ||61bind == VIRGL_BIND_INDEX_BUFFER ||62bind == VIRGL_BIND_VERTEX_BUFFER ||63bind == VIRGL_BIND_CUSTOM ||64bind == VIRGL_BIND_STAGING ||65bind == 0;66}6768static void virgl_hw_res_destroy(struct virgl_drm_winsys *qdws,69struct virgl_hw_res *res)70{71struct drm_gem_close args;7273mtx_lock(&qdws->bo_handles_mutex);7475/* We intentionally avoid taking the lock in76* virgl_drm_resource_reference. Now that the77* lock is taken, we need to check the refcount78* again. */79if (pipe_is_referenced(&res->reference)) {80mtx_unlock(&qdws->bo_handles_mutex);81return;82}8384_mesa_hash_table_remove_key(qdws->bo_handles,85(void *)(uintptr_t)res->bo_handle);86if (res->flink_name)87_mesa_hash_table_remove_key(qdws->bo_names,88(void *)(uintptr_t)res->flink_name);89mtx_unlock(&qdws->bo_handles_mutex);90if (res->ptr)91os_munmap(res->ptr, res->size);9293memset(&args, 0, sizeof(args));94args.handle = res->bo_handle;95drmIoctl(qdws->fd, DRM_IOCTL_GEM_CLOSE, &args);96FREE(res);97}9899static boolean virgl_drm_resource_is_busy(struct virgl_winsys *vws,100struct virgl_hw_res *res)101{102struct virgl_drm_winsys *vdws = virgl_drm_winsys(vws);103struct drm_virtgpu_3d_wait waitcmd;104int ret;105106if (!p_atomic_read(&res->maybe_busy) && !p_atomic_read(&res->external))107return false;108109memset(&waitcmd, 0, sizeof(waitcmd));110waitcmd.handle = res->bo_handle;111waitcmd.flags = VIRTGPU_WAIT_NOWAIT;112113ret = drmIoctl(vdws->fd, DRM_IOCTL_VIRTGPU_WAIT, &waitcmd);114if (ret && errno == EBUSY)115return TRUE;116117p_atomic_set(&res->maybe_busy, false);118119return FALSE;120}121122static void123virgl_drm_winsys_destroy(struct virgl_winsys *qws)124{125struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);126127virgl_resource_cache_flush(&qdws->cache);128129_mesa_hash_table_destroy(qdws->bo_handles, NULL);130_mesa_hash_table_destroy(qdws->bo_names, NULL);131mtx_destroy(&qdws->bo_handles_mutex);132mtx_destroy(&qdws->mutex);133134FREE(qdws);135}136137static void virgl_drm_resource_reference(struct virgl_winsys *qws,138struct virgl_hw_res **dres,139struct virgl_hw_res *sres)140{141struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);142struct virgl_hw_res *old = *dres;143144if (pipe_reference(&(*dres)->reference, &sres->reference)) {145146if (!can_cache_resource(old->bind) ||147p_atomic_read(&old->external)) {148virgl_hw_res_destroy(qdws, old);149} else {150mtx_lock(&qdws->mutex);151virgl_resource_cache_add(&qdws->cache, &old->cache_entry);152mtx_unlock(&qdws->mutex);153}154}155*dres = sres;156}157158static struct virgl_hw_res *159virgl_drm_winsys_resource_create_blob(struct virgl_winsys *qws,160enum pipe_texture_target target,161uint32_t format,162uint32_t bind,163uint32_t width,164uint32_t height,165uint32_t depth,166uint32_t array_size,167uint32_t last_level,168uint32_t nr_samples,169uint32_t flags,170uint32_t size)171{172int ret;173int32_t blob_id;174uint32_t cmd[VIRGL_PIPE_RES_CREATE_SIZE + 1] = { 0 };175struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);176struct drm_virtgpu_resource_create_blob drm_rc_blob = { 0 };177struct virgl_hw_res *res;178179res = CALLOC_STRUCT(virgl_hw_res);180if (!res)181return NULL;182183/* Make sure blob is page aligned. */184if (flags & (VIRGL_RESOURCE_FLAG_MAP_PERSISTENT |185VIRGL_RESOURCE_FLAG_MAP_COHERENT)) {186width = ALIGN(width, getpagesize());187size = ALIGN(size, getpagesize());188}189190blob_id = p_atomic_inc_return(&qdws->blob_id);191cmd[0] = VIRGL_CMD0(VIRGL_CCMD_PIPE_RESOURCE_CREATE, 0, VIRGL_PIPE_RES_CREATE_SIZE);192cmd[VIRGL_PIPE_RES_CREATE_FORMAT] = format;193cmd[VIRGL_PIPE_RES_CREATE_BIND] = bind;194cmd[VIRGL_PIPE_RES_CREATE_TARGET] = target;195cmd[VIRGL_PIPE_RES_CREATE_WIDTH] = width;196cmd[VIRGL_PIPE_RES_CREATE_HEIGHT] = height;197cmd[VIRGL_PIPE_RES_CREATE_DEPTH] = depth;198cmd[VIRGL_PIPE_RES_CREATE_ARRAY_SIZE] = array_size;199cmd[VIRGL_PIPE_RES_CREATE_LAST_LEVEL] = last_level;200cmd[VIRGL_PIPE_RES_CREATE_NR_SAMPLES] = nr_samples;201cmd[VIRGL_PIPE_RES_CREATE_FLAGS] = flags;202cmd[VIRGL_PIPE_RES_CREATE_BLOB_ID] = blob_id;203204drm_rc_blob.cmd = (unsigned long)(void *)&cmd;205drm_rc_blob.cmd_size = 4 * (VIRGL_PIPE_RES_CREATE_SIZE + 1);206drm_rc_blob.size = size;207drm_rc_blob.blob_mem = VIRTGPU_BLOB_MEM_HOST3D;208drm_rc_blob.blob_flags = VIRTGPU_BLOB_FLAG_USE_MAPPABLE;209drm_rc_blob.blob_id = (uint64_t) blob_id;210211ret = drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_RESOURCE_CREATE_BLOB, &drm_rc_blob);212if (ret != 0) {213FREE(res);214return NULL;215}216217res->bind = bind;218res->res_handle = drm_rc_blob.res_handle;219res->bo_handle = drm_rc_blob.bo_handle;220res->size = size;221res->flags = flags;222res->maybe_untyped = false;223pipe_reference_init(&res->reference, 1);224p_atomic_set(&res->external, false);225p_atomic_set(&res->num_cs_references, 0);226virgl_resource_cache_entry_init(&res->cache_entry, size, bind, format,227flags);228return res;229}230231static struct virgl_hw_res *232virgl_drm_winsys_resource_create(struct virgl_winsys *qws,233enum pipe_texture_target target,234uint32_t format,235uint32_t bind,236uint32_t width,237uint32_t height,238uint32_t depth,239uint32_t array_size,240uint32_t last_level,241uint32_t nr_samples,242uint32_t size,243bool for_fencing)244{245struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);246struct drm_virtgpu_resource_create createcmd;247int ret;248struct virgl_hw_res *res;249uint32_t stride = width * util_format_get_blocksize(format);250251res = CALLOC_STRUCT(virgl_hw_res);252if (!res)253return NULL;254255memset(&createcmd, 0, sizeof(createcmd));256createcmd.target = target;257createcmd.format = pipe_to_virgl_format(format);258createcmd.bind = bind;259createcmd.width = width;260createcmd.height = height;261createcmd.depth = depth;262createcmd.array_size = array_size;263createcmd.last_level = last_level;264createcmd.nr_samples = nr_samples;265createcmd.stride = stride;266createcmd.size = size;267268ret = drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_RESOURCE_CREATE, &createcmd);269if (ret != 0) {270FREE(res);271return NULL;272}273274res->bind = bind;275276res->res_handle = createcmd.res_handle;277res->bo_handle = createcmd.bo_handle;278res->size = size;279res->target = target;280res->maybe_untyped = false;281pipe_reference_init(&res->reference, 1);282p_atomic_set(&res->external, false);283p_atomic_set(&res->num_cs_references, 0);284285/* A newly created resource is considered busy by the kernel until the286* command is retired. But for our purposes, we can consider it idle287* unless it is used for fencing.288*/289p_atomic_set(&res->maybe_busy, for_fencing);290291virgl_resource_cache_entry_init(&res->cache_entry, size, bind, format, 0);292293return res;294}295296/*297* Previously, with DRM_IOCTL_VIRTGPU_RESOURCE_CREATE, all host resources had298* a guest memory shadow resource with size = stride * bpp. Virglrenderer299* would guess the stride implicitly when performing transfer operations, if300* the stride wasn't specified. Interestingly, vtest would specify the stride.301*302* Guessing the stride breaks down with YUV images, which may be imported into303* Mesa as 3R8 images. It also doesn't work if an external allocator304* (i.e, minigbm) decides to use a stride not equal to stride * bpp. With blob305* resources, the size = stride * bpp restriction no longer holds, so use306* explicit strides passed into Mesa.307*/308static inline bool use_explicit_stride(struct virgl_hw_res *res, uint32_t level,309uint32_t depth)310{311return (params[param_resource_blob].value &&312res->blob_mem == VIRTGPU_BLOB_MEM_HOST3D_GUEST &&313res->target == PIPE_TEXTURE_2D &&314level == 0 && depth == 1);315}316317static int318virgl_bo_transfer_put(struct virgl_winsys *vws,319struct virgl_hw_res *res,320const struct pipe_box *box,321uint32_t stride, uint32_t layer_stride,322uint32_t buf_offset, uint32_t level)323{324struct virgl_drm_winsys *vdws = virgl_drm_winsys(vws);325struct drm_virtgpu_3d_transfer_to_host tohostcmd;326327p_atomic_set(&res->maybe_busy, true);328329memset(&tohostcmd, 0, sizeof(tohostcmd));330tohostcmd.bo_handle = res->bo_handle;331tohostcmd.box.x = box->x;332tohostcmd.box.y = box->y;333tohostcmd.box.z = box->z;334tohostcmd.box.w = box->width;335tohostcmd.box.h = box->height;336tohostcmd.box.d = box->depth;337tohostcmd.offset = buf_offset;338tohostcmd.level = level;339340if (use_explicit_stride(res, level, box->depth))341tohostcmd.stride = stride;342343return drmIoctl(vdws->fd, DRM_IOCTL_VIRTGPU_TRANSFER_TO_HOST, &tohostcmd);344}345346static int347virgl_bo_transfer_get(struct virgl_winsys *vws,348struct virgl_hw_res *res,349const struct pipe_box *box,350uint32_t stride, uint32_t layer_stride,351uint32_t buf_offset, uint32_t level)352{353struct virgl_drm_winsys *vdws = virgl_drm_winsys(vws);354struct drm_virtgpu_3d_transfer_from_host fromhostcmd;355356p_atomic_set(&res->maybe_busy, true);357358memset(&fromhostcmd, 0, sizeof(fromhostcmd));359fromhostcmd.bo_handle = res->bo_handle;360fromhostcmd.level = level;361fromhostcmd.offset = buf_offset;362fromhostcmd.box.x = box->x;363fromhostcmd.box.y = box->y;364fromhostcmd.box.z = box->z;365fromhostcmd.box.w = box->width;366fromhostcmd.box.h = box->height;367fromhostcmd.box.d = box->depth;368369if (use_explicit_stride(res, level, box->depth))370fromhostcmd.stride = stride;371372return drmIoctl(vdws->fd, DRM_IOCTL_VIRTGPU_TRANSFER_FROM_HOST, &fromhostcmd);373}374375static struct virgl_hw_res *376virgl_drm_winsys_resource_cache_create(struct virgl_winsys *qws,377enum pipe_texture_target target,378uint32_t format,379uint32_t bind,380uint32_t width,381uint32_t height,382uint32_t depth,383uint32_t array_size,384uint32_t last_level,385uint32_t nr_samples,386uint32_t flags,387uint32_t size)388{389struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);390struct virgl_hw_res *res;391struct virgl_resource_cache_entry *entry;392393if (!can_cache_resource(bind))394goto alloc;395396mtx_lock(&qdws->mutex);397398entry = virgl_resource_cache_remove_compatible(&qdws->cache, size,399bind, format, flags);400if (entry) {401res = cache_entry_container_res(entry);402mtx_unlock(&qdws->mutex);403pipe_reference_init(&res->reference, 1);404return res;405}406407mtx_unlock(&qdws->mutex);408409alloc:410if (flags & (VIRGL_RESOURCE_FLAG_MAP_PERSISTENT |411VIRGL_RESOURCE_FLAG_MAP_COHERENT))412res = virgl_drm_winsys_resource_create_blob(qws, target, format, bind,413width, height, depth,414array_size, last_level,415nr_samples, flags, size);416else417res = virgl_drm_winsys_resource_create(qws, target, format, bind, width,418height, depth, array_size,419last_level, nr_samples, size,420false);421return res;422}423424static struct virgl_hw_res *425virgl_drm_winsys_resource_create_handle(struct virgl_winsys *qws,426struct winsys_handle *whandle,427uint32_t *plane,428uint32_t *stride,429uint32_t *plane_offset,430uint64_t *modifier,431uint32_t *blob_mem)432{433struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);434struct drm_gem_open open_arg = {};435struct drm_virtgpu_resource_info info_arg = {};436struct virgl_hw_res *res = NULL;437uint32_t handle = whandle->handle;438439if (whandle->plane >= VIRGL_MAX_PLANE_COUNT) {440return NULL;441}442443if (whandle->offset != 0 && whandle->type == WINSYS_HANDLE_TYPE_SHARED) {444_debug_printf("attempt to import unsupported winsys offset %u\n",445whandle->offset);446return NULL;447} else if (whandle->type == WINSYS_HANDLE_TYPE_FD) {448*plane = whandle->plane;449*stride = whandle->stride;450*plane_offset = whandle->offset;451*modifier = whandle->modifier;452}453454mtx_lock(&qdws->bo_handles_mutex);455456/* We must maintain a list of pairs <handle, bo>, so that we always return457* the same BO for one particular handle. If we didn't do that and created458* more than one BO for the same handle and then relocated them in a CS,459* we would hit a deadlock in the kernel.460*461* The list of pairs is guarded by a mutex, of course. */462if (whandle->type == WINSYS_HANDLE_TYPE_SHARED) {463res = util_hash_table_get(qdws->bo_names, (void*)(uintptr_t)handle);464} else if (whandle->type == WINSYS_HANDLE_TYPE_FD) {465int r;466r = drmPrimeFDToHandle(qdws->fd, whandle->handle, &handle);467if (r)468goto done;469res = util_hash_table_get(qdws->bo_handles, (void*)(uintptr_t)handle);470} else {471/* Unknown handle type */472goto done;473}474475if (res) {476/* qdws->bo_{names,handles} hold weak pointers to virgl_hw_res. Because477* virgl_drm_resource_reference does not take qdws->bo_handles_mutex478* until it enters virgl_hw_res_destroy, there is a small window that479* the refcount can drop to zero. Call p_atomic_inc directly instead of480* virgl_drm_resource_reference to avoid hitting assert failures.481*/482p_atomic_inc(&res->reference.count);483goto done;484}485486res = CALLOC_STRUCT(virgl_hw_res);487if (!res)488goto done;489490if (whandle->type == WINSYS_HANDLE_TYPE_FD) {491res->bo_handle = handle;492} else {493memset(&open_arg, 0, sizeof(open_arg));494open_arg.name = whandle->handle;495if (drmIoctl(qdws->fd, DRM_IOCTL_GEM_OPEN, &open_arg)) {496FREE(res);497res = NULL;498goto done;499}500res->bo_handle = open_arg.handle;501res->flink_name = whandle->handle;502}503504memset(&info_arg, 0, sizeof(info_arg));505info_arg.bo_handle = res->bo_handle;506507if (drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_RESOURCE_INFO, &info_arg)) {508/* close */509FREE(res);510res = NULL;511goto done;512}513514res->res_handle = info_arg.res_handle;515res->blob_mem = info_arg.blob_mem;516*blob_mem = info_arg.blob_mem;517518res->size = info_arg.size;519res->maybe_untyped = info_arg.blob_mem ? true : false;520pipe_reference_init(&res->reference, 1);521p_atomic_set(&res->external, true);522res->num_cs_references = 0;523524if (res->flink_name)525_mesa_hash_table_insert(qdws->bo_names, (void *)(uintptr_t)res->flink_name, res);526_mesa_hash_table_insert(qdws->bo_handles, (void *)(uintptr_t)res->bo_handle, res);527528done:529mtx_unlock(&qdws->bo_handles_mutex);530return res;531}532533static void534virgl_drm_winsys_resource_set_type(struct virgl_winsys *qws,535struct virgl_hw_res *res,536uint32_t format, uint32_t bind,537uint32_t width, uint32_t height,538uint32_t usage, uint64_t modifier,539uint32_t plane_count,540const uint32_t *plane_strides,541const uint32_t *plane_offsets)542{543struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);544uint32_t cmd[VIRGL_PIPE_RES_SET_TYPE_SIZE(VIRGL_MAX_PLANE_COUNT)];545struct drm_virtgpu_execbuffer eb;546int ret;547548mtx_lock(&qdws->bo_handles_mutex);549550if (!res->maybe_untyped) {551mtx_unlock(&qdws->bo_handles_mutex);552return;553}554res->maybe_untyped = false;555556assert(plane_count && plane_count <= VIRGL_MAX_PLANE_COUNT);557558cmd[0] = VIRGL_CMD0(VIRGL_CCMD_PIPE_RESOURCE_SET_TYPE, 0, VIRGL_PIPE_RES_SET_TYPE_SIZE(plane_count));559cmd[VIRGL_PIPE_RES_SET_TYPE_RES_HANDLE] = res->res_handle,560cmd[VIRGL_PIPE_RES_SET_TYPE_FORMAT] = format;561cmd[VIRGL_PIPE_RES_SET_TYPE_BIND] = bind;562cmd[VIRGL_PIPE_RES_SET_TYPE_WIDTH] = width;563cmd[VIRGL_PIPE_RES_SET_TYPE_HEIGHT] = height;564cmd[VIRGL_PIPE_RES_SET_TYPE_USAGE] = usage;565cmd[VIRGL_PIPE_RES_SET_TYPE_MODIFIER_LO] = (uint32_t)modifier;566cmd[VIRGL_PIPE_RES_SET_TYPE_MODIFIER_HI] = (uint32_t)(modifier >> 32);567for (uint32_t i = 0; i < plane_count; i++) {568cmd[VIRGL_PIPE_RES_SET_TYPE_PLANE_STRIDE(i)] = plane_strides[i];569cmd[VIRGL_PIPE_RES_SET_TYPE_PLANE_OFFSET(i)] = plane_offsets[i];570}571572memset(&eb, 0, sizeof(eb));573eb.command = (uintptr_t)cmd;574eb.size = (1 + VIRGL_PIPE_RES_SET_TYPE_SIZE(plane_count)) * 4;575eb.num_bo_handles = 1;576eb.bo_handles = (uintptr_t)&res->bo_handle;577578ret = drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_EXECBUFFER, &eb);579if (ret == -1)580_debug_printf("failed to set resource type: %s", strerror(errno));581582mtx_unlock(&qdws->bo_handles_mutex);583}584585static boolean virgl_drm_winsys_resource_get_handle(struct virgl_winsys *qws,586struct virgl_hw_res *res,587uint32_t stride,588struct winsys_handle *whandle)589{590struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);591struct drm_gem_flink flink;592593if (!res)594return FALSE;595596if (whandle->type == WINSYS_HANDLE_TYPE_SHARED) {597if (!res->flink_name) {598memset(&flink, 0, sizeof(flink));599flink.handle = res->bo_handle;600601if (drmIoctl(qdws->fd, DRM_IOCTL_GEM_FLINK, &flink)) {602return FALSE;603}604res->flink_name = flink.name;605606mtx_lock(&qdws->bo_handles_mutex);607_mesa_hash_table_insert(qdws->bo_names, (void *)(uintptr_t)res->flink_name, res);608mtx_unlock(&qdws->bo_handles_mutex);609}610whandle->handle = res->flink_name;611} else if (whandle->type == WINSYS_HANDLE_TYPE_KMS) {612whandle->handle = res->bo_handle;613} else if (whandle->type == WINSYS_HANDLE_TYPE_FD) {614if (drmPrimeHandleToFD(qdws->fd, res->bo_handle, DRM_CLOEXEC, (int*)&whandle->handle))615return FALSE;616mtx_lock(&qdws->bo_handles_mutex);617_mesa_hash_table_insert(qdws->bo_handles, (void *)(uintptr_t)res->bo_handle, res);618mtx_unlock(&qdws->bo_handles_mutex);619}620621p_atomic_set(&res->external, true);622623whandle->stride = stride;624return TRUE;625}626627static void *virgl_drm_resource_map(struct virgl_winsys *qws,628struct virgl_hw_res *res)629{630struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);631struct drm_virtgpu_map mmap_arg;632void *ptr;633634if (res->ptr)635return res->ptr;636637memset(&mmap_arg, 0, sizeof(mmap_arg));638mmap_arg.handle = res->bo_handle;639if (drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_MAP, &mmap_arg))640return NULL;641642ptr = os_mmap(0, res->size, PROT_READ|PROT_WRITE, MAP_SHARED,643qdws->fd, mmap_arg.offset);644if (ptr == MAP_FAILED)645return NULL;646647res->ptr = ptr;648return ptr;649650}651652static void virgl_drm_resource_wait(struct virgl_winsys *qws,653struct virgl_hw_res *res)654{655struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);656struct drm_virtgpu_3d_wait waitcmd;657int ret;658659if (!p_atomic_read(&res->maybe_busy) && !p_atomic_read(&res->external))660return;661662memset(&waitcmd, 0, sizeof(waitcmd));663waitcmd.handle = res->bo_handle;664665ret = drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_WAIT, &waitcmd);666if (ret)667_debug_printf("waiting got error - %d, slow gpu or hang?\n", errno);668669p_atomic_set(&res->maybe_busy, false);670}671672static bool virgl_drm_alloc_res_list(struct virgl_drm_cmd_buf *cbuf,673int initial_size)674{675cbuf->nres = initial_size;676cbuf->cres = 0;677678cbuf->res_bo = CALLOC(cbuf->nres, sizeof(struct virgl_hw_buf*));679if (!cbuf->res_bo)680return false;681682cbuf->res_hlist = MALLOC(cbuf->nres * sizeof(uint32_t));683if (!cbuf->res_hlist) {684FREE(cbuf->res_bo);685return false;686}687688return true;689}690691static void virgl_drm_free_res_list(struct virgl_drm_cmd_buf *cbuf)692{693int i;694695for (i = 0; i < cbuf->cres; i++) {696p_atomic_dec(&cbuf->res_bo[i]->num_cs_references);697virgl_drm_resource_reference(cbuf->ws, &cbuf->res_bo[i], NULL);698}699FREE(cbuf->res_hlist);700FREE(cbuf->res_bo);701}702703static boolean virgl_drm_lookup_res(struct virgl_drm_cmd_buf *cbuf,704struct virgl_hw_res *res)705{706unsigned hash = res->res_handle & (sizeof(cbuf->is_handle_added)-1);707int i;708709if (cbuf->is_handle_added[hash]) {710i = cbuf->reloc_indices_hashlist[hash];711if (cbuf->res_bo[i] == res)712return true;713714for (i = 0; i < cbuf->cres; i++) {715if (cbuf->res_bo[i] == res) {716cbuf->reloc_indices_hashlist[hash] = i;717return true;718}719}720}721return false;722}723724static void virgl_drm_add_res(struct virgl_drm_winsys *qdws,725struct virgl_drm_cmd_buf *cbuf,726struct virgl_hw_res *res)727{728unsigned hash = res->res_handle & (sizeof(cbuf->is_handle_added)-1);729730if (cbuf->cres >= cbuf->nres) {731unsigned new_nres = cbuf->nres + 256;732void *new_ptr = REALLOC(cbuf->res_bo,733cbuf->nres * sizeof(struct virgl_hw_buf*),734new_nres * sizeof(struct virgl_hw_buf*));735if (!new_ptr) {736_debug_printf("failure to add relocation %d, %d\n", cbuf->cres, new_nres);737return;738}739cbuf->res_bo = new_ptr;740741new_ptr = REALLOC(cbuf->res_hlist,742cbuf->nres * sizeof(uint32_t),743new_nres * sizeof(uint32_t));744if (!new_ptr) {745_debug_printf("failure to add hlist relocation %d, %d\n", cbuf->cres, cbuf->nres);746return;747}748cbuf->res_hlist = new_ptr;749cbuf->nres = new_nres;750}751752cbuf->res_bo[cbuf->cres] = NULL;753virgl_drm_resource_reference(&qdws->base, &cbuf->res_bo[cbuf->cres], res);754cbuf->res_hlist[cbuf->cres] = res->bo_handle;755cbuf->is_handle_added[hash] = TRUE;756757cbuf->reloc_indices_hashlist[hash] = cbuf->cres;758p_atomic_inc(&res->num_cs_references);759cbuf->cres++;760}761762/* This is called after the cbuf is submitted. */763static void virgl_drm_clear_res_list(struct virgl_drm_cmd_buf *cbuf)764{765int i;766767for (i = 0; i < cbuf->cres; i++) {768/* mark all BOs busy after submission */769p_atomic_set(&cbuf->res_bo[i]->maybe_busy, true);770771p_atomic_dec(&cbuf->res_bo[i]->num_cs_references);772virgl_drm_resource_reference(cbuf->ws, &cbuf->res_bo[i], NULL);773}774775cbuf->cres = 0;776777memset(cbuf->is_handle_added, 0, sizeof(cbuf->is_handle_added));778}779780static void virgl_drm_emit_res(struct virgl_winsys *qws,781struct virgl_cmd_buf *_cbuf,782struct virgl_hw_res *res, boolean write_buf)783{784struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);785struct virgl_drm_cmd_buf *cbuf = virgl_drm_cmd_buf(_cbuf);786boolean already_in_list = virgl_drm_lookup_res(cbuf, res);787788if (write_buf)789cbuf->base.buf[cbuf->base.cdw++] = res->res_handle;790791if (!already_in_list)792virgl_drm_add_res(qdws, cbuf, res);793}794795static boolean virgl_drm_res_is_ref(struct virgl_winsys *qws,796struct virgl_cmd_buf *_cbuf,797struct virgl_hw_res *res)798{799if (!p_atomic_read(&res->num_cs_references))800return FALSE;801802return TRUE;803}804805static struct virgl_cmd_buf *virgl_drm_cmd_buf_create(struct virgl_winsys *qws,806uint32_t size)807{808struct virgl_drm_cmd_buf *cbuf;809810cbuf = CALLOC_STRUCT(virgl_drm_cmd_buf);811if (!cbuf)812return NULL;813814cbuf->ws = qws;815816if (!virgl_drm_alloc_res_list(cbuf, 512)) {817FREE(cbuf);818return NULL;819}820821cbuf->buf = CALLOC(size, sizeof(uint32_t));822if (!cbuf->buf) {823FREE(cbuf->res_hlist);824FREE(cbuf->res_bo);825FREE(cbuf);826return NULL;827}828829cbuf->in_fence_fd = -1;830cbuf->base.buf = cbuf->buf;831return &cbuf->base;832}833834static void virgl_drm_cmd_buf_destroy(struct virgl_cmd_buf *_cbuf)835{836struct virgl_drm_cmd_buf *cbuf = virgl_drm_cmd_buf(_cbuf);837838virgl_drm_free_res_list(cbuf);839840FREE(cbuf->buf);841FREE(cbuf);842}843844static struct pipe_fence_handle *845virgl_drm_fence_create(struct virgl_winsys *vws, int fd, bool external)846{847struct virgl_drm_fence *fence;848849assert(vws->supports_fences);850851if (external) {852fd = os_dupfd_cloexec(fd);853if (fd < 0)854return NULL;855}856857fence = CALLOC_STRUCT(virgl_drm_fence);858if (!fence) {859close(fd);860return NULL;861}862863fence->fd = fd;864fence->external = external;865866pipe_reference_init(&fence->reference, 1);867868return (struct pipe_fence_handle *)fence;869}870871static struct pipe_fence_handle *872virgl_drm_fence_create_legacy(struct virgl_winsys *vws)873{874struct virgl_drm_fence *fence;875876assert(!vws->supports_fences);877878fence = CALLOC_STRUCT(virgl_drm_fence);879if (!fence)880return NULL;881fence->fd = -1;882883/* Resources for fences should not be from the cache, since we are basing884* the fence status on the resource creation busy status.885*/886fence->hw_res = virgl_drm_winsys_resource_create(vws, PIPE_BUFFER,887PIPE_FORMAT_R8_UNORM, VIRGL_BIND_CUSTOM, 8, 1, 1, 0, 0, 0, 8, true);888if (!fence->hw_res) {889FREE(fence);890return NULL;891}892893pipe_reference_init(&fence->reference, 1);894895return (struct pipe_fence_handle *)fence;896}897898static int virgl_drm_winsys_submit_cmd(struct virgl_winsys *qws,899struct virgl_cmd_buf *_cbuf,900struct pipe_fence_handle **fence)901{902struct virgl_drm_winsys *qdws = virgl_drm_winsys(qws);903struct virgl_drm_cmd_buf *cbuf = virgl_drm_cmd_buf(_cbuf);904struct drm_virtgpu_execbuffer eb;905int ret;906907if (cbuf->base.cdw == 0)908return 0;909910memset(&eb, 0, sizeof(struct drm_virtgpu_execbuffer));911eb.command = (unsigned long)(void*)cbuf->buf;912eb.size = cbuf->base.cdw * 4;913eb.num_bo_handles = cbuf->cres;914eb.bo_handles = (unsigned long)(void *)cbuf->res_hlist;915916eb.fence_fd = -1;917if (qws->supports_fences) {918if (cbuf->in_fence_fd >= 0) {919eb.flags |= VIRTGPU_EXECBUF_FENCE_FD_IN;920eb.fence_fd = cbuf->in_fence_fd;921}922923if (fence != NULL)924eb.flags |= VIRTGPU_EXECBUF_FENCE_FD_OUT;925} else {926assert(cbuf->in_fence_fd < 0);927}928929ret = drmIoctl(qdws->fd, DRM_IOCTL_VIRTGPU_EXECBUFFER, &eb);930if (ret == -1)931_debug_printf("got error from kernel - expect bad rendering %d\n", errno);932cbuf->base.cdw = 0;933934if (qws->supports_fences) {935if (cbuf->in_fence_fd >= 0) {936close(cbuf->in_fence_fd);937cbuf->in_fence_fd = -1;938}939940if (fence != NULL && ret == 0)941*fence = virgl_drm_fence_create(qws, eb.fence_fd, false);942} else {943if (fence != NULL && ret == 0)944*fence = virgl_drm_fence_create_legacy(qws);945}946947virgl_drm_clear_res_list(cbuf);948949return ret;950}951952static int virgl_drm_get_caps(struct virgl_winsys *vws,953struct virgl_drm_caps *caps)954{955struct virgl_drm_winsys *vdws = virgl_drm_winsys(vws);956struct drm_virtgpu_get_caps args;957int ret;958959virgl_ws_fill_new_caps_defaults(caps);960961memset(&args, 0, sizeof(args));962if (params[param_capset_fix].value) {963/* if we have the query fix - try and get cap set id 2 first */964args.cap_set_id = 2;965args.size = sizeof(union virgl_caps);966} else {967args.cap_set_id = 1;968args.size = sizeof(struct virgl_caps_v1);969}970args.addr = (unsigned long)&caps->caps;971972ret = drmIoctl(vdws->fd, DRM_IOCTL_VIRTGPU_GET_CAPS, &args);973if (ret == -1 && errno == EINVAL) {974/* Fallback to v1 */975args.cap_set_id = 1;976args.size = sizeof(struct virgl_caps_v1);977ret = drmIoctl(vdws->fd, DRM_IOCTL_VIRTGPU_GET_CAPS, &args);978if (ret == -1)979return ret;980}981return ret;982}983984static struct pipe_fence_handle *985virgl_cs_create_fence(struct virgl_winsys *vws, int fd)986{987if (!vws->supports_fences)988return NULL;989990return virgl_drm_fence_create(vws, fd, true);991}992993static bool virgl_fence_wait(struct virgl_winsys *vws,994struct pipe_fence_handle *_fence,995uint64_t timeout)996{997struct virgl_drm_fence *fence = virgl_drm_fence(_fence);998999if (vws->supports_fences) {1000uint64_t timeout_ms;1001int timeout_poll;10021003if (timeout == 0)1004return sync_wait(fence->fd, 0) == 0;10051006timeout_ms = timeout / 1000000;1007/* round up */1008if (timeout_ms * 1000000 < timeout)1009timeout_ms++;10101011timeout_poll = timeout_ms <= INT_MAX ? (int) timeout_ms : -1;10121013return sync_wait(fence->fd, timeout_poll) == 0;1014}10151016if (timeout == 0)1017return !virgl_drm_resource_is_busy(vws, fence->hw_res);10181019if (timeout != PIPE_TIMEOUT_INFINITE) {1020int64_t start_time = os_time_get();1021timeout /= 1000;1022while (virgl_drm_resource_is_busy(vws, fence->hw_res)) {1023if (os_time_get() - start_time >= timeout)1024return FALSE;1025os_time_sleep(10);1026}1027return TRUE;1028}1029virgl_drm_resource_wait(vws, fence->hw_res);10301031return TRUE;1032}10331034static void virgl_fence_reference(struct virgl_winsys *vws,1035struct pipe_fence_handle **dst,1036struct pipe_fence_handle *src)1037{1038struct virgl_drm_fence *dfence = virgl_drm_fence(*dst);1039struct virgl_drm_fence *sfence = virgl_drm_fence(src);10401041if (pipe_reference(&dfence->reference, &sfence->reference)) {1042if (vws->supports_fences) {1043close(dfence->fd);1044} else {1045virgl_drm_resource_reference(vws, &dfence->hw_res, NULL);1046}1047FREE(dfence);1048}10491050*dst = src;1051}10521053static void virgl_fence_server_sync(struct virgl_winsys *vws,1054struct virgl_cmd_buf *_cbuf,1055struct pipe_fence_handle *_fence)1056{1057struct virgl_drm_cmd_buf *cbuf = virgl_drm_cmd_buf(_cbuf);1058struct virgl_drm_fence *fence = virgl_drm_fence(_fence);10591060if (!vws->supports_fences)1061return;10621063/* if not an external fence, then nothing more to do without preemption: */1064if (!fence->external)1065return;10661067sync_accumulate("virgl", &cbuf->in_fence_fd, fence->fd);1068}10691070static int virgl_fence_get_fd(struct virgl_winsys *vws,1071struct pipe_fence_handle *_fence)1072{1073struct virgl_drm_fence *fence = virgl_drm_fence(_fence);10741075if (!vws->supports_fences)1076return -1;10771078return os_dupfd_cloexec(fence->fd);1079}10801081static int virgl_drm_get_version(int fd)1082{1083int ret;1084drmVersionPtr version;10851086version = drmGetVersion(fd);10871088if (!version)1089ret = -EFAULT;1090else if (version->version_major != 0)1091ret = -EINVAL;1092else1093ret = VIRGL_DRM_VERSION(0, version->version_minor);10941095drmFreeVersion(version);10961097return ret;1098}10991100static bool1101virgl_drm_resource_cache_entry_is_busy(struct virgl_resource_cache_entry *entry,1102void *user_data)1103{1104struct virgl_drm_winsys *qdws = user_data;1105struct virgl_hw_res *res = cache_entry_container_res(entry);11061107return virgl_drm_resource_is_busy(&qdws->base, res);1108}11091110static void1111virgl_drm_resource_cache_entry_release(struct virgl_resource_cache_entry *entry,1112void *user_data)1113{1114struct virgl_drm_winsys *qdws = user_data;1115struct virgl_hw_res *res = cache_entry_container_res(entry);11161117virgl_hw_res_destroy(qdws, res);1118}11191120static struct virgl_winsys *1121virgl_drm_winsys_create(int drmFD)1122{1123static const unsigned CACHE_TIMEOUT_USEC = 1000000;1124struct virgl_drm_winsys *qdws;1125int drm_version;1126int ret;11271128for (uint32_t i = 0; i < ARRAY_SIZE(params); i++) {1129struct drm_virtgpu_getparam getparam = { 0 };1130uint64_t value = 0;1131getparam.param = params[i].param;1132getparam.value = (uint64_t)(uintptr_t)&value;1133ret = drmIoctl(drmFD, DRM_IOCTL_VIRTGPU_GETPARAM, &getparam);1134params[i].value = (ret == 0) ? value : 0;1135}11361137if (!params[param_3d_features].value)1138return NULL;11391140drm_version = virgl_drm_get_version(drmFD);1141if (drm_version < 0)1142return NULL;11431144qdws = CALLOC_STRUCT(virgl_drm_winsys);1145if (!qdws)1146return NULL;11471148qdws->fd = drmFD;1149virgl_resource_cache_init(&qdws->cache, CACHE_TIMEOUT_USEC,1150virgl_drm_resource_cache_entry_is_busy,1151virgl_drm_resource_cache_entry_release,1152qdws);1153(void) mtx_init(&qdws->mutex, mtx_plain);1154(void) mtx_init(&qdws->bo_handles_mutex, mtx_plain);1155p_atomic_set(&qdws->blob_id, 0);11561157qdws->bo_handles = util_hash_table_create_ptr_keys();1158qdws->bo_names = util_hash_table_create_ptr_keys();1159qdws->base.destroy = virgl_drm_winsys_destroy;11601161qdws->base.transfer_put = virgl_bo_transfer_put;1162qdws->base.transfer_get = virgl_bo_transfer_get;1163qdws->base.resource_create = virgl_drm_winsys_resource_cache_create;1164qdws->base.resource_reference = virgl_drm_resource_reference;1165qdws->base.resource_create_from_handle = virgl_drm_winsys_resource_create_handle;1166qdws->base.resource_set_type = virgl_drm_winsys_resource_set_type;1167qdws->base.resource_get_handle = virgl_drm_winsys_resource_get_handle;1168qdws->base.resource_map = virgl_drm_resource_map;1169qdws->base.resource_wait = virgl_drm_resource_wait;1170qdws->base.resource_is_busy = virgl_drm_resource_is_busy;1171qdws->base.cmd_buf_create = virgl_drm_cmd_buf_create;1172qdws->base.cmd_buf_destroy = virgl_drm_cmd_buf_destroy;1173qdws->base.submit_cmd = virgl_drm_winsys_submit_cmd;1174qdws->base.emit_res = virgl_drm_emit_res;1175qdws->base.res_is_referenced = virgl_drm_res_is_ref;11761177qdws->base.cs_create_fence = virgl_cs_create_fence;1178qdws->base.fence_wait = virgl_fence_wait;1179qdws->base.fence_reference = virgl_fence_reference;1180qdws->base.fence_server_sync = virgl_fence_server_sync;1181qdws->base.fence_get_fd = virgl_fence_get_fd;1182qdws->base.get_caps = virgl_drm_get_caps;1183qdws->base.supports_fences = drm_version >= VIRGL_DRM_VERSION_FENCE_FD;1184qdws->base.supports_encoded_transfers = 1;11851186qdws->base.supports_coherent = params[param_resource_blob].value &&1187params[param_host_visible].value;1188return &qdws->base;11891190}11911192static struct hash_table *fd_tab = NULL;1193static mtx_t virgl_screen_mutex = _MTX_INITIALIZER_NP;11941195static void1196virgl_drm_screen_destroy(struct pipe_screen *pscreen)1197{1198struct virgl_screen *screen = virgl_screen(pscreen);1199boolean destroy;12001201mtx_lock(&virgl_screen_mutex);1202destroy = --screen->refcnt == 0;1203if (destroy) {1204int fd = virgl_drm_winsys(screen->vws)->fd;1205_mesa_hash_table_remove_key(fd_tab, intptr_to_pointer(fd));1206close(fd);1207}1208mtx_unlock(&virgl_screen_mutex);12091210if (destroy) {1211pscreen->destroy = screen->winsys_priv;1212pscreen->destroy(pscreen);1213}1214}12151216struct pipe_screen *1217virgl_drm_screen_create(int fd, const struct pipe_screen_config *config)1218{1219struct pipe_screen *pscreen = NULL;12201221mtx_lock(&virgl_screen_mutex);1222if (!fd_tab) {1223fd_tab = util_hash_table_create_fd_keys();1224if (!fd_tab)1225goto unlock;1226}12271228pscreen = util_hash_table_get(fd_tab, intptr_to_pointer(fd));1229if (pscreen) {1230virgl_screen(pscreen)->refcnt++;1231} else {1232struct virgl_winsys *vws;1233int dup_fd = os_dupfd_cloexec(fd);12341235vws = virgl_drm_winsys_create(dup_fd);1236if (!vws) {1237close(dup_fd);1238goto unlock;1239}12401241pscreen = virgl_create_screen(vws, config);1242if (pscreen) {1243_mesa_hash_table_insert(fd_tab, intptr_to_pointer(dup_fd), pscreen);12441245/* Bit of a hack, to avoid circular linkage dependency,1246* ie. pipe driver having to call in to winsys, we1247* override the pipe drivers screen->destroy():1248*/1249virgl_screen(pscreen)->winsys_priv = pscreen->destroy;1250pscreen->destroy = virgl_drm_screen_destroy;1251}1252}12531254unlock:1255mtx_unlock(&virgl_screen_mutex);1256return pscreen;1257}125812591260