/* Path: blob/21.2-virgl/src/gallium/drivers/svga/svga_pipe_vertex.c (4570 views) */
/**********************************************************1* Copyright 2008-2009 VMware, Inc. All rights reserved.2*3* Permission is hereby granted, free of charge, to any person4* obtaining a copy of this software and associated documentation5* files (the "Software"), to deal in the Software without6* restriction, including without limitation the rights to use, copy,7* modify, merge, publish, distribute, sublicense, and/or sell copies8* of the Software, and to permit persons to whom the Software is9* furnished to do so, subject to the following conditions:10*11* The above copyright notice and this permission notice shall be12* included in all copies or substantial portions of the Software.13*14* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,15* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF16* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND17* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS18* BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN19* ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN20* CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE21* SOFTWARE.22*23**********************************************************/2425#include "pipe/p_defines.h"26#include "util/u_bitmask.h"27#include "util/format/u_format.h"28#include "util/u_helpers.h"29#include "util/u_inlines.h"30#include "util/u_math.h"31#include "util/u_memory.h"32#include "util/u_transfer.h"33#include "tgsi/tgsi_parse.h"3435#include "svga_context.h"36#include "svga_cmd.h"37#include "svga_format.h"38#include "svga_resource_buffer.h"39#include "svga_screen.h"404142static void43svga_set_vertex_buffers(struct pipe_context *pipe,44unsigned start_slot, unsigned count,45unsigned unbind_num_trailing_slots,46bool take_ownership,47const struct pipe_vertex_buffer *buffers)48{49struct svga_context *svga = 
svga_context(pipe);5051util_set_vertex_buffers_count(svga->curr.vb,52&svga->curr.num_vertex_buffers,53buffers, start_slot, count,54unbind_num_trailing_slots,55take_ownership);5657svga->dirty |= SVGA_NEW_VBUFFER;58}596061/**62* Does the given vertex attrib format need range adjustment in the VS?63* Range adjustment scales and biases values from [0,1] to [-1,1].64* This lets us avoid the swtnl path.65*/66static boolean67attrib_needs_range_adjustment(enum pipe_format format)68{69switch (format) {70case PIPE_FORMAT_R8G8B8_SNORM:71return TRUE;72default:73return FALSE;74}75}767778/**79* Given a gallium vertex element format, return the corresponding80* SVGA3dDeclType.81*/82static SVGA3dDeclType83translate_vertex_format_to_decltype(enum pipe_format format)84{85switch (format) {86case PIPE_FORMAT_R32_FLOAT: return SVGA3D_DECLTYPE_FLOAT1;87case PIPE_FORMAT_R32G32_FLOAT: return SVGA3D_DECLTYPE_FLOAT2;88case PIPE_FORMAT_R32G32B32_FLOAT: return SVGA3D_DECLTYPE_FLOAT3;89case PIPE_FORMAT_R32G32B32A32_FLOAT: return SVGA3D_DECLTYPE_FLOAT4;90case PIPE_FORMAT_B8G8R8A8_UNORM: return SVGA3D_DECLTYPE_D3DCOLOR;91case PIPE_FORMAT_R8G8B8A8_USCALED: return SVGA3D_DECLTYPE_UBYTE4;92case PIPE_FORMAT_R16G16_SSCALED: return SVGA3D_DECLTYPE_SHORT2;93case PIPE_FORMAT_R16G16B16A16_SSCALED: return SVGA3D_DECLTYPE_SHORT4;94case PIPE_FORMAT_R8G8B8A8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N;95case PIPE_FORMAT_R16G16_SNORM: return SVGA3D_DECLTYPE_SHORT2N;96case PIPE_FORMAT_R16G16B16A16_SNORM: return SVGA3D_DECLTYPE_SHORT4N;97case PIPE_FORMAT_R16G16_UNORM: return SVGA3D_DECLTYPE_USHORT2N;98case PIPE_FORMAT_R16G16B16A16_UNORM: return SVGA3D_DECLTYPE_USHORT4N;99case PIPE_FORMAT_R10G10B10X2_USCALED: return SVGA3D_DECLTYPE_UDEC3;100case PIPE_FORMAT_R10G10B10X2_SNORM: return SVGA3D_DECLTYPE_DEC3N;101case PIPE_FORMAT_R16G16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_2;102case PIPE_FORMAT_R16G16B16A16_FLOAT: return SVGA3D_DECLTYPE_FLOAT16_4;103104/* See attrib_needs_adjustment() and attrib_needs_w_to_1() above 
*/105case PIPE_FORMAT_R8G8B8_SNORM: return SVGA3D_DECLTYPE_UBYTE4N;106107/* See attrib_needs_w_to_1() above */108case PIPE_FORMAT_R16G16B16_SNORM: return SVGA3D_DECLTYPE_SHORT4N;109case PIPE_FORMAT_R16G16B16_UNORM: return SVGA3D_DECLTYPE_USHORT4N;110case PIPE_FORMAT_R8G8B8_UNORM: return SVGA3D_DECLTYPE_UBYTE4N;111112default:113/* There are many formats without hardware support. This case114* will be hit regularly, meaning we'll need swvfetch.115*/116return SVGA3D_DECLTYPE_MAX;117}118}119120121static void122define_input_element_object(struct svga_context *svga,123struct svga_velems_state *velems)124{125SVGA3dInputElementDesc elements[PIPE_MAX_ATTRIBS];126unsigned i;127128assert(velems->count <= PIPE_MAX_ATTRIBS);129assert(svga_have_vgpu10(svga));130131for (i = 0; i < velems->count; i++) {132const struct pipe_vertex_element *elem = velems->velem + i;133SVGA3dSurfaceFormat svga_format;134unsigned vf_flags;135136svga_translate_vertex_format_vgpu10(elem->src_format,137&svga_format, &vf_flags);138139velems->decl_type[i] =140translate_vertex_format_to_decltype(elem->src_format);141elements[i].inputSlot = elem->vertex_buffer_index;142elements[i].alignedByteOffset = elem->src_offset;143elements[i].format = svga_format;144145if (elem->instance_divisor) {146elements[i].inputSlotClass = SVGA3D_INPUT_PER_INSTANCE_DATA;147elements[i].instanceDataStepRate = elem->instance_divisor;148}149else {150elements[i].inputSlotClass = SVGA3D_INPUT_PER_VERTEX_DATA;151elements[i].instanceDataStepRate = 0;152}153elements[i].inputRegister = i;154155if (elements[i].format == SVGA3D_FORMAT_INVALID) {156velems->need_swvfetch = TRUE;157}158159if (util_format_is_pure_integer(elem->src_format)) {160velems->attrib_is_pure_int |= (1 << i);161}162163if (vf_flags & VF_W_TO_1) {164velems->adjust_attrib_w_1 |= (1 << i);165}166167if (vf_flags & VF_U_TO_F_CAST) {168velems->adjust_attrib_utof |= (1 << i);169}170else if (vf_flags & VF_I_TO_F_CAST) {171velems->adjust_attrib_itof |= (1 << i);172}173174if 
(vf_flags & VF_BGRA) {175velems->attrib_is_bgra |= (1 << i);176}177178if (vf_flags & VF_PUINT_TO_SNORM) {179velems->attrib_puint_to_snorm |= (1 << i);180}181else if (vf_flags & VF_PUINT_TO_USCALED) {182velems->attrib_puint_to_uscaled |= (1 << i);183}184else if (vf_flags & VF_PUINT_TO_SSCALED) {185velems->attrib_puint_to_sscaled |= (1 << i);186}187}188189velems->id = util_bitmask_add(svga->input_element_object_id_bm);190191SVGA_RETRY(svga, SVGA3D_vgpu10_DefineElementLayout(svga->swc, velems->count,192velems->id, elements));193}194195196/**197* Translate the vertex element types to SVGA3dDeclType and check198* for VS-based vertex attribute adjustments.199*/200static void201translate_vertex_decls(struct svga_context *svga,202struct svga_velems_state *velems)203{204unsigned i;205206assert(!svga_have_vgpu10(svga));207208for (i = 0; i < velems->count; i++) {209const enum pipe_format f = velems->velem[i].src_format;210SVGA3dSurfaceFormat svga_format;211unsigned vf_flags;212213svga_translate_vertex_format_vgpu10(f, &svga_format, &vf_flags);214215velems->decl_type[i] = translate_vertex_format_to_decltype(f);216if (velems->decl_type[i] == SVGA3D_DECLTYPE_MAX) {217/* Unsupported format - use software fetch */218velems->need_swvfetch = TRUE;219}220221/* Check for VS-based adjustments */222if (attrib_needs_range_adjustment(f)) {223velems->adjust_attrib_range |= (1 << i);224}225226if (vf_flags & VF_W_TO_1) {227velems->adjust_attrib_w_1 |= (1 << i);228}229}230}231232233static void *234svga_create_vertex_elements_state(struct pipe_context *pipe,235unsigned count,236const struct pipe_vertex_element *attribs)237{238struct svga_context *svga = svga_context(pipe);239struct svga_velems_state *velems;240241assert(count <= PIPE_MAX_ATTRIBS);242velems = (struct svga_velems_state *) MALLOC(sizeof(struct svga_velems_state));243if (velems) {244velems->count = count;245memcpy(velems->velem, attribs, sizeof(*attribs) * count);246247velems->need_swvfetch = FALSE;248velems->adjust_attrib_range = 
0x0;249velems->attrib_is_pure_int = 0x0;250velems->adjust_attrib_w_1 = 0x0;251velems->adjust_attrib_itof = 0x0;252velems->adjust_attrib_utof = 0x0;253velems->attrib_is_bgra = 0x0;254velems->attrib_puint_to_snorm = 0x0;255velems->attrib_puint_to_uscaled = 0x0;256velems->attrib_puint_to_sscaled = 0x0;257258if (svga_have_vgpu10(svga)) {259define_input_element_object(svga, velems);260}261else {262translate_vertex_decls(svga, velems);263}264}265266svga->hud.num_vertexelement_objects++;267SVGA_STATS_COUNT_INC(svga_screen(svga->pipe.screen)->sws,268SVGA_STATS_COUNT_VERTEXELEMENT);269270return velems;271}272273274static void275svga_bind_vertex_elements_state(struct pipe_context *pipe, void *state)276{277struct svga_context *svga = svga_context(pipe);278struct svga_velems_state *velems = (struct svga_velems_state *) state;279280svga->curr.velems = velems;281svga->dirty |= SVGA_NEW_VELEMENT;282}283284285static void286svga_delete_vertex_elements_state(struct pipe_context *pipe, void *state)287{288struct svga_context *svga = svga_context(pipe);289struct svga_velems_state *velems = (struct svga_velems_state *) state;290291if (svga_have_vgpu10(svga)) {292svga_hwtnl_flush_retry(svga);293294SVGA_RETRY(svga, SVGA3D_vgpu10_DestroyElementLayout(svga->swc,295velems->id));296297if (velems->id == svga->state.hw_draw.layout_id)298svga->state.hw_draw.layout_id = SVGA3D_INVALID_ID;299300util_bitmask_clear(svga->input_element_object_id_bm, velems->id);301velems->id = SVGA3D_INVALID_ID;302}303304FREE(velems);305svga->hud.num_vertexelement_objects--;306}307308309void310svga_cleanup_vertex_state(struct svga_context *svga)311{312unsigned i;313314for (i = 0 ; i < svga->curr.num_vertex_buffers; i++)315pipe_vertex_buffer_unreference(&svga->curr.vb[i]);316317pipe_resource_reference(&svga->state.hw_draw.ib, NULL);318319for (i = 0; i < svga->state.hw_draw.num_vbuffers; i++)320pipe_resource_reference(&svga->state.hw_draw.vbuffers[i], NULL);321}322323324void325svga_init_vertex_functions(struct 
svga_context *svga)326{327svga->pipe.set_vertex_buffers = svga_set_vertex_buffers;328svga->pipe.create_vertex_elements_state = svga_create_vertex_elements_state;329svga->pipe.bind_vertex_elements_state = svga_bind_vertex_elements_state;330svga->pipe.delete_vertex_elements_state = svga_delete_vertex_elements_state;331}332333334