/* Path: blob/21.2-virgl/src/gallium/auxiliary/draw/draw_pt_fetch_shade_pipeline.c
 * (4565 views)
 */
/**************************************************************************1*2* Copyright 2007 VMware, Inc.3* All Rights Reserved.4*5* Permission is hereby granted, free of charge, to any person obtaining a6* copy of this software and associated documentation files (the7* "Software"), to deal in the Software without restriction, including8* without limitation the rights to use, copy, modify, merge, publish,9* distribute, sub license, and/or sell copies of the Software, and to10* permit persons to whom the Software is furnished to do so, subject to11* the following conditions:12*13* The above copyright notice and this permission notice (including the14* next paragraph) shall be included in all copies or substantial portions15* of the Software.16*17* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS18* OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF19* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.20* IN NO EVENT SHALL VMWARE AND/OR ITS SUPPLIERS BE LIABLE FOR21* ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,22* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE23* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.24*25**************************************************************************/2627#include "util/u_math.h"28#include "util/u_memory.h"29#include "util/u_prim.h"30#include "draw/draw_context.h"31#include "draw/draw_vbuf.h"32#include "draw/draw_vertex.h"33#include "draw/draw_prim_assembler.h"34#include "draw/draw_pt.h"35#include "draw/draw_vs.h"36#include "draw/draw_gs.h"373839struct fetch_pipeline_middle_end {40struct draw_pt_middle_end base;41struct draw_context *draw;4243struct pt_emit *emit;44struct pt_so_emit *so_emit;45struct pt_fetch *fetch;46struct pt_post_vs *post_vs;4748unsigned vertex_data_offset;49unsigned vertex_size;50unsigned input_prim;51unsigned opt;52};535455/** cast wrapper */56static inline struct fetch_pipeline_middle_end 
*57fetch_pipeline_middle_end(struct draw_pt_middle_end *middle)58{59return (struct fetch_pipeline_middle_end *) middle;60}616263/**64* Prepare/validate middle part of the vertex pipeline.65* NOTE: if you change this function, also look at the LLVM66* function llvm_middle_end_prepare() for similar changes.67*/68static void69fetch_pipeline_prepare(struct draw_pt_middle_end *middle,70unsigned prim,71unsigned opt,72unsigned *max_vertices)73{74struct fetch_pipeline_middle_end *fpme = fetch_pipeline_middle_end(middle);75struct draw_context *draw = fpme->draw;76struct draw_vertex_shader *vs = draw->vs.vertex_shader;77struct draw_geometry_shader *gs = draw->gs.geometry_shader;78unsigned i;79unsigned instance_id_index = ~0;80const unsigned gs_out_prim = (gs ? gs->output_primitive :81u_assembled_prim(prim));82unsigned nr_vs_outputs = draw_total_vs_outputs(draw);83unsigned nr = MAX2(vs->info.num_inputs, nr_vs_outputs);84unsigned point_clip = draw->rasterizer->fill_front == PIPE_POLYGON_MODE_POINT ||85gs_out_prim == PIPE_PRIM_POINTS;8687if (gs) {88nr = MAX2(nr, gs->info.num_outputs + 1);89}9091/* Scan for instanceID system value.92*/93for (i = 0; i < vs->info.num_inputs; i++) {94if (vs->info.input_semantic_name[i] == TGSI_SEMANTIC_INSTANCEID) {95instance_id_index = i;96break;97}98}99100fpme->input_prim = prim;101fpme->opt = opt;102103/* Always leave room for the vertex header whether we need it or104* not. It's hard to get rid of it in particular because of the105* viewport code in draw_pt_post_vs.c.106*/107fpme->vertex_size = sizeof(struct vertex_header) + nr * 4 * sizeof(float);108109draw_pt_fetch_prepare( fpme->fetch,110vs->info.num_inputs,111fpme->vertex_size,112instance_id_index );113draw_pt_post_vs_prepare( fpme->post_vs,114draw->clip_xy,115draw->clip_z,116draw->clip_user,117point_clip ? draw->guard_band_points_xy :118draw->guard_band_xy,119draw->bypass_viewport,120draw->rasterizer->clip_halfz,121(draw->vs.edgeflag_output ? 
TRUE : FALSE) );122123draw_pt_so_emit_prepare( fpme->so_emit, FALSE );124125if (!(opt & PT_PIPELINE)) {126draw_pt_emit_prepare( fpme->emit,127gs_out_prim,128max_vertices );129130*max_vertices = MAX2( *max_vertices, 4096 );131}132else {133/* limit max fetches by limiting max_vertices */134*max_vertices = 4096;135}136137/* No need to prepare the shader.138*/139vs->prepare(vs, draw);140141/* Make sure that the vertex size didn't change at any point above */142assert(nr_vs_outputs == draw_total_vs_outputs(draw));143}144145146static void147fetch_pipeline_bind_parameters(struct draw_pt_middle_end *middle)148{149/* No-op since the vertex shader executor and drawing pipeline150* just grab the constants, viewport, etc. from the draw context state.151*/152}153154155static void fetch( struct pt_fetch *fetch,156const struct draw_fetch_info *fetch_info,157char *output)158{159if (fetch_info->linear) {160draw_pt_fetch_run_linear( fetch,161fetch_info->start,162fetch_info->count,163output );164}165else {166draw_pt_fetch_run( fetch,167fetch_info->elts,168fetch_info->count,169output );170}171}172173174static void pipeline(struct fetch_pipeline_middle_end *fpme,175const struct draw_vertex_info *vert_info,176const struct draw_prim_info *prim_info)177{178if (prim_info->linear)179draw_pipeline_run_linear( fpme->draw,180vert_info,181prim_info);182else183draw_pipeline_run( fpme->draw,184vert_info,185prim_info );186}187188189static void190emit(struct pt_emit *emit,191const struct draw_vertex_info *vert_info,192const struct draw_prim_info *prim_info)193{194if (prim_info->linear) {195draw_pt_emit_linear(emit, vert_info, prim_info);196}197else {198draw_pt_emit(emit, vert_info, prim_info);199}200}201202203static void204draw_vertex_shader_run(struct draw_vertex_shader *vshader,205const void *constants[PIPE_MAX_CONSTANT_BUFFERS],206unsigned const_size[PIPE_MAX_CONSTANT_BUFFERS],207const struct draw_fetch_info *fetch_info,208const struct draw_vertex_info *input_verts,209struct draw_vertex_info 
*output_verts)210{211output_verts->vertex_size = input_verts->vertex_size;212output_verts->stride = input_verts->vertex_size;213output_verts->count = input_verts->count;214output_verts->verts =215(struct vertex_header *)MALLOC(output_verts->vertex_size *216align(output_verts->count, 4) +217DRAW_EXTRA_VERTICES_PADDING);218219vshader->run_linear(vshader,220(const float (*)[4])input_verts->verts->data,221( float (*)[4])output_verts->verts->data,222constants,223const_size,224input_verts->count,225input_verts->vertex_size,226input_verts->vertex_size,227fetch_info->elts);228}229230231static void232fetch_pipeline_generic(struct draw_pt_middle_end *middle,233const struct draw_fetch_info *fetch_info,234const struct draw_prim_info *in_prim_info)235{236struct fetch_pipeline_middle_end *fpme = fetch_pipeline_middle_end(middle);237struct draw_context *draw = fpme->draw;238struct draw_vertex_shader *vshader = draw->vs.vertex_shader;239struct draw_geometry_shader *gshader = draw->gs.geometry_shader;240struct draw_prim_info gs_prim_info[TGSI_MAX_VERTEX_STREAMS];241struct draw_vertex_info fetched_vert_info;242struct draw_vertex_info vs_vert_info;243struct draw_vertex_info gs_vert_info[TGSI_MAX_VERTEX_STREAMS];244struct draw_vertex_info *vert_info;245struct draw_prim_info ia_prim_info;246struct draw_vertex_info ia_vert_info;247const struct draw_prim_info *prim_info = in_prim_info;248boolean free_prim_info = FALSE;249unsigned opt = fpme->opt;250int num_vertex_streams = 1;251252fetched_vert_info.count = fetch_info->count;253fetched_vert_info.vertex_size = fpme->vertex_size;254fetched_vert_info.stride = fpme->vertex_size;255fetched_vert_info.verts =256(struct vertex_header *)MALLOC(fpme->vertex_size *257align(fetch_info->count, 4) +258DRAW_EXTRA_VERTICES_PADDING);259if (!fetched_vert_info.verts) {260assert(0);261return;262}263if (draw->collect_statistics) {264draw->statistics.ia_vertices += prim_info->count;265draw->statistics.ia_primitives 
+=266u_decomposed_prims_for_vertices(prim_info->prim, fetch_info->count);267draw->statistics.vs_invocations += fetch_info->count;268}269270/* Fetch into our vertex buffer.271*/272fetch( fpme->fetch, fetch_info, (char *)fetched_vert_info.verts );273274vert_info = &fetched_vert_info;275276/* Run the shader, note that this overwrites the data[] parts of277* the pipeline verts.278* Need fetch info to get vertex id correct.279*/280if (fpme->opt & PT_SHADE) {281draw_vertex_shader_run(vshader,282draw->pt.user.vs_constants,283draw->pt.user.vs_constants_size,284fetch_info,285vert_info,286&vs_vert_info);287288FREE(vert_info->verts);289vert_info = &vs_vert_info;290}291292/* Finished with fetch:293*/294fetch_info = NULL;295296if ((fpme->opt & PT_SHADE) && gshader) {297draw_geometry_shader_run(gshader,298draw->pt.user.gs_constants,299draw->pt.user.gs_constants_size,300vert_info,301prim_info,302&vshader->info,303gs_vert_info,304gs_prim_info);305306FREE(vert_info->verts);307vert_info = &gs_vert_info[0];308prim_info = &gs_prim_info[0];309num_vertex_streams = gshader->num_vertex_streams;310311/*312* pt emit can only handle ushort number of vertices (see313* render->allocate_vertices).314* vsplit guarantees there's never more than 4096, however GS can315* easily blow this up (by a factor of 256 (or even 1024) max).316*/317if (vert_info->count > 65535) {318opt |= PT_PIPELINE;319}320} else {321if (draw_prim_assembler_is_required(draw, prim_info, vert_info)) {322draw_prim_assembler_run(draw, prim_info, vert_info,323&ia_prim_info, &ia_vert_info);324325if (ia_vert_info.count) {326FREE(vert_info->verts);327vert_info = &ia_vert_info;328prim_info = &ia_prim_info;329free_prim_info = TRUE;330}331}332}333if (prim_info->count == 0) {334debug_printf("GS/IA didn't emit any vertices!\n");335336FREE(vert_info->verts);337if (free_prim_info) {338FREE(prim_info->primitive_lengths);339}340return;341}342343344/* Stream output needs to be done before clipping.345*346* XXX: Stream output surely needs to 
respect the prim_info->elt347* lists.348*/349draw_pt_so_emit( fpme->so_emit, num_vertex_streams, vert_info, prim_info );350351draw_stats_clipper_primitives(draw, prim_info);352353/*354* if there's no position, need to stop now, or the latter stages355* will try to access non-existent position output.356*/357if (draw_current_shader_position_output(draw) != -1) {358359if (draw_pt_post_vs_run( fpme->post_vs, vert_info, prim_info ))360{361opt |= PT_PIPELINE;362}363364/* Do we need to run the pipeline?365*/366if (opt & PT_PIPELINE) {367pipeline( fpme, vert_info, prim_info );368}369else {370emit( fpme->emit, vert_info, prim_info );371}372}373FREE(vert_info->verts);374if (free_prim_info) {375FREE(prim_info->primitive_lengths);376}377}378379380static inline unsigned381prim_type(unsigned prim, unsigned flags)382{383if (flags & DRAW_LINE_LOOP_AS_STRIP)384return PIPE_PRIM_LINE_STRIP;385else386return prim;387}388389390static void391fetch_pipeline_run(struct draw_pt_middle_end *middle,392const unsigned *fetch_elts,393unsigned fetch_count,394const ushort *draw_elts,395unsigned draw_count,396unsigned prim_flags)397{398struct fetch_pipeline_middle_end *fpme = fetch_pipeline_middle_end(middle);399struct draw_fetch_info fetch_info;400struct draw_prim_info prim_info;401402fetch_info.linear = FALSE;403fetch_info.start = 0;404fetch_info.elts = fetch_elts;405fetch_info.count = fetch_count;406407prim_info.linear = FALSE;408prim_info.start = 0;409prim_info.count = draw_count;410prim_info.elts = draw_elts;411prim_info.prim = prim_type(fpme->input_prim, prim_flags);412prim_info.flags = prim_flags;413prim_info.primitive_count = 1;414prim_info.primitive_lengths = &draw_count;415416fetch_pipeline_generic( middle, &fetch_info, &prim_info );417}418419420static void421fetch_pipeline_linear_run(struct draw_pt_middle_end *middle,422unsigned start,423unsigned count,424unsigned prim_flags)425{426struct fetch_pipeline_middle_end *fpme = fetch_pipeline_middle_end(middle);427struct draw_fetch_info 
fetch_info;428struct draw_prim_info prim_info;429430fetch_info.linear = TRUE;431fetch_info.start = start;432fetch_info.count = count;433fetch_info.elts = NULL;434435prim_info.linear = TRUE;436prim_info.start = 0;437prim_info.count = count;438prim_info.elts = NULL;439prim_info.prim = prim_type(fpme->input_prim, prim_flags);440prim_info.flags = prim_flags;441prim_info.primitive_count = 1;442prim_info.primitive_lengths = &count;443444fetch_pipeline_generic( middle, &fetch_info, &prim_info );445}446447448449static boolean450fetch_pipeline_linear_run_elts(struct draw_pt_middle_end *middle,451unsigned start,452unsigned count,453const ushort *draw_elts,454unsigned draw_count,455unsigned prim_flags )456{457struct fetch_pipeline_middle_end *fpme = fetch_pipeline_middle_end(middle);458struct draw_fetch_info fetch_info;459struct draw_prim_info prim_info;460461fetch_info.linear = TRUE;462fetch_info.start = start;463fetch_info.count = count;464fetch_info.elts = NULL;465466prim_info.linear = FALSE;467prim_info.start = 0;468prim_info.count = draw_count;469prim_info.elts = draw_elts;470prim_info.prim = prim_type(fpme->input_prim, prim_flags);471prim_info.flags = prim_flags;472prim_info.primitive_count = 1;473prim_info.primitive_lengths = &draw_count;474475fetch_pipeline_generic( middle, &fetch_info, &prim_info );476477return TRUE;478}479480481static void482fetch_pipeline_finish( struct draw_pt_middle_end *middle )483{484/* nothing to do */485}486487488static void489fetch_pipeline_destroy( struct draw_pt_middle_end *middle )490{491struct fetch_pipeline_middle_end *fpme = fetch_pipeline_middle_end(middle);492493if (fpme->fetch)494draw_pt_fetch_destroy( fpme->fetch );495496if (fpme->emit)497draw_pt_emit_destroy( fpme->emit );498499if (fpme->so_emit)500draw_pt_so_emit_destroy( fpme->so_emit );501502if (fpme->post_vs)503draw_pt_post_vs_destroy( fpme->post_vs );504505FREE(middle);506}507508509struct draw_pt_middle_end *510draw_pt_fetch_pipeline_or_emit(struct draw_context 
*draw)511{512struct fetch_pipeline_middle_end *fpme =513CALLOC_STRUCT( fetch_pipeline_middle_end );514if (!fpme)515goto fail;516517fpme->base.prepare = fetch_pipeline_prepare;518fpme->base.bind_parameters = fetch_pipeline_bind_parameters;519fpme->base.run = fetch_pipeline_run;520fpme->base.run_linear = fetch_pipeline_linear_run;521fpme->base.run_linear_elts = fetch_pipeline_linear_run_elts;522fpme->base.finish = fetch_pipeline_finish;523fpme->base.destroy = fetch_pipeline_destroy;524525fpme->draw = draw;526527fpme->fetch = draw_pt_fetch_create( draw );528if (!fpme->fetch)529goto fail;530531fpme->post_vs = draw_pt_post_vs_create( draw );532if (!fpme->post_vs)533goto fail;534535fpme->emit = draw_pt_emit_create( draw );536if (!fpme->emit)537goto fail;538539fpme->so_emit = draw_pt_so_emit_create( draw );540if (!fpme->so_emit)541goto fail;542543return &fpme->base;544545fail:546if (fpme)547fetch_pipeline_destroy( &fpme->base );548549return NULL;550}551552553