Path: blob/master/thirdparty/embree/kernels/common/scene_grid_mesh.h
9905 views
// Copyright 2009-2021 Intel Corporation1// SPDX-License-Identifier: Apache-2.023#pragma once45#include "geometry.h"6#include "buffer.h"78namespace embree9{10/*! Grid Mesh */11struct GridMesh : public Geometry12{13/*! type of this geometry */14static const Geometry::GTypeMask geom_type = Geometry::MTY_GRID_MESH;1516/*! grid */17struct Grid18{19unsigned int startVtxID;20unsigned int lineVtxOffset;21unsigned short resX,resY;2223/* border flags due to 3x3 vertex pattern */24__forceinline unsigned int get3x3FlagsX(const unsigned int x) const25{26return (x + 2 >= (unsigned int)resX) ? (1<<15) : 0;27}2829/* border flags due to 3x3 vertex pattern */30__forceinline unsigned int get3x3FlagsY(const unsigned int y) const31{32return (y + 2 >= (unsigned int)resY) ? (1<<15) : 0;33}3435/*! outputs grid structure */36__forceinline friend embree_ostream operator<<(embree_ostream cout, const Grid& t) {37return cout << "Grid { startVtxID " << t.startVtxID << ", lineVtxOffset " << t.lineVtxOffset << ", resX " << t.resX << ", resY " << t.resY << " }";38}39};4041public:4243/*! grid mesh construction */44GridMesh (Device* device);4546/* geometry interface */47public:48void setMask(unsigned mask);49void setNumTimeSteps (unsigned int numTimeSteps);50void setVertexAttributeCount (unsigned int N);51void setBuffer(RTCBufferType type, unsigned int slot, RTCFormat format, const Ref<Buffer>& buffer, size_t offset, size_t stride, unsigned int num);52void* getBufferData(RTCBufferType type, unsigned int slot, BufferDataPointerType pointerType);53void updateBuffer(RTCBufferType type, unsigned int slot);54void commit();55bool verify();56void interpolate(const RTCInterpolateArguments* const args);5758#if defined(EMBREE_SYCL_SUPPORT)5960size_t getGeometryDataDeviceByteSize() const;61void convertToDeviceRepresentation(size_t offset, char* data_host, char* data_device) const;6263#endif6465template<int N>66void interpolate_impl(const RTCInterpolateArguments* const args)67{68unsigned int primID = args->primID;69float U = args->u;70float V = args->v;7172/* clamp input u,v to [0;1] range */73U = max(min(U,1.0f),0.0f);74V = max(min(V,1.0f),0.0f);7576RTCBufferType bufferType = args->bufferType;77unsigned int bufferSlot = args->bufferSlot;78float* P = args->P;79float* dPdu = args->dPdu;80float* dPdv = args->dPdv;81float* ddPdudu = args->ddPdudu;82float* ddPdvdv = args->ddPdvdv;83float* ddPdudv = args->ddPdudv;84unsigned int valueCount = args->valueCount;8586/* calculate base pointer and stride */87assert((bufferType == RTC_BUFFER_TYPE_VERTEX && bufferSlot < numTimeSteps) ||88(bufferType == RTC_BUFFER_TYPE_VERTEX_ATTRIBUTE && bufferSlot <= vertexAttribs.size()));89const char* src = nullptr;90size_t stride = 0;91if (bufferType == RTC_BUFFER_TYPE_VERTEX_ATTRIBUTE) {92src = vertexAttribs[bufferSlot].getPtr();93stride = vertexAttribs[bufferSlot].getStride();94} else {95src = vertices[bufferSlot].getPtr();96stride = vertices[bufferSlot].getStride();97}9899const Grid& grid = grids[primID];100const int grid_width = grid.resX-1;101const int grid_height = grid.resY-1;102const float rcp_grid_width = rcp(float(grid_width));103const float rcp_grid_height = rcp(float(grid_height));104const int iu = min((int)floor(U*grid_width ),grid_width);105const int iv = min((int)floor(V*grid_height),grid_height);106const float u = U*grid_width-float(iu);107const float v = V*grid_height-float(iv);108109for (unsigned int i=0; i<valueCount; i+=N)110{111const size_t ofs = i*sizeof(float);112const unsigned int idx0 = grid.startVtxID + (iv+0)*grid.lineVtxOffset + iu;113const unsigned int idx1 = grid.startVtxID + (iv+1)*grid.lineVtxOffset + iu;114115const vbool<N> valid = vint<N>((int)i)+vint<N>(step) < vint<N>(int(valueCount));116const vfloat<N> p0 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx0+0)*stride+ofs]);117const vfloat<N> p1 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx0+1)*stride+ofs]);118const vfloat<N> p2 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx1+1)*stride+ofs]);119const vfloat<N> p3 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx1+0)*stride+ofs]);120const vbool<N> left = u+v <= 1.0f;121const vfloat<N> Q0 = select(left,p0,p2);122const vfloat<N> Q1 = select(left,p1,p3);123const vfloat<N> Q2 = select(left,p3,p1);124const vfloat<N> U = select(left,u,vfloat<N>(1.0f)-u);125const vfloat<N> V = select(left,v,vfloat<N>(1.0f)-v);126const vfloat<N> W = 1.0f-U-V;127128if (P) {129mem<vfloat<N>>::storeu(valid,P+i,madd(W,Q0,madd(U,Q1,V*Q2)));130}131if (dPdu) {132assert(dPdu); mem<vfloat<N>>::storeu(valid,dPdu+i,select(left,Q1-Q0,Q0-Q1)*rcp_grid_width);133assert(dPdv); mem<vfloat<N>>::storeu(valid,dPdv+i,select(left,Q2-Q0,Q0-Q2)*rcp_grid_height);134}135if (ddPdudu) {136assert(ddPdudu); mem<vfloat<N>>::storeu(valid,ddPdudu+i,vfloat<N>(zero));137assert(ddPdvdv); mem<vfloat<N>>::storeu(valid,ddPdvdv+i,vfloat<N>(zero));138assert(ddPdudv); mem<vfloat<N>>::storeu(valid,ddPdudv+i,vfloat<N>(zero));139}140}141}142143void addElementsToCount (GeometryCounts & counts) const;144145__forceinline unsigned int getNumTotalQuads() const146{147size_t quads = 0;148for (size_t primID=0; primID<numPrimitives; primID++)149quads += getNumQuads(primID);150return quads;151}152153__forceinline unsigned int getNumQuads(const size_t gridID) const154{155const Grid& g = grid(gridID);156return (unsigned int) max((int)1,((int)g.resX-1) * ((int)g.resY-1));157}158159__forceinline unsigned int getNumSubGrids(const size_t gridID) const160{161const Grid& g = grid(gridID);162return max((unsigned int)1,((unsigned int)g.resX >> 1) * ((unsigned int)g.resY >> 1));163}164165/*! get fast access to first vertex buffer */166__forceinline float * getCompactVertexArray () const {167return (float*) vertices0.getPtr();168}169170public:171172/*! returns number of vertices */173__forceinline size_t numVertices() const {174return vertices[0].size();175}176177/*! returns i'th grid*/178__forceinline const Grid& grid(size_t i) const {179return grids[i];180}181182/*! returns i'th vertex of the first time step */183__forceinline const Vec3fa vertex(size_t i) const { // FIXME: check if this does a unaligned load184return vertices0[i];185}186187/*! returns i'th vertex of the first time step */188__forceinline const char* vertexPtr(size_t i) const {189return vertices0.getPtr(i);190}191192/*! returns i'th vertex of itime'th timestep */193__forceinline const Vec3fa vertex(size_t i, size_t itime) const {194return vertices[itime][i];195}196197/*! returns i'th vertex of for specified time */198__forceinline const Vec3fa vertex(size_t i, float time) const199{200float ftime;201const size_t itime = timeSegment(time, ftime);202const float t0 = 1.0f - ftime;203const float t1 = ftime;204Vec3fa v0 = vertex(i, itime+0);205Vec3fa v1 = vertex(i, itime+1);206return madd(Vec3fa(t0),v0,t1*v1);207}208209/*! returns i'th vertex of itime'th timestep */210__forceinline const char* vertexPtr(size_t i, size_t itime) const {211return vertices[itime].getPtr(i);212}213214/*! returns i'th vertex of the first timestep */215__forceinline size_t grid_vertex_index(const Grid& g, size_t x, size_t y) const {216assert(x < (size_t)g.resX);217assert(y < (size_t)g.resY);218return g.startVtxID + x + y * g.lineVtxOffset;219}220221/*! returns i'th vertex of the first timestep */222__forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y) const {223const size_t index = grid_vertex_index(g,x,y);224return vertex(index);225}226227/*! returns i'th vertex of the itime'th timestep */228__forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y, size_t itime) const {229const size_t index = grid_vertex_index(g,x,y);230return vertex(index,itime);231}232233/*! returns i'th vertex of the itime'th timestep */234__forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y, float time) const {235const size_t index = grid_vertex_index(g,x,y);236return vertex(index,time);237}238239/*! gathers quad vertices */240__forceinline void gather_quad_vertices(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y) const241{242v0 = grid_vertex(g,x+0,y+0);243v1 = grid_vertex(g,x+1,y+0);244v2 = grid_vertex(g,x+1,y+1);245v3 = grid_vertex(g,x+0,y+1);246}247248/*! gathers quad vertices for specified time */249__forceinline void gather_quad_vertices(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y, float time) const250{251v0 = grid_vertex(g,x+0,y+0,time);252v1 = grid_vertex(g,x+1,y+0,time);253v2 = grid_vertex(g,x+1,y+1,time);254v3 = grid_vertex(g,x+0,y+1,time);255}256257/*! gathers quad vertices for mblur and non-mblur meshes */258__forceinline void gather_quad_vertices_safe(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y, float time) const259{260if (hasMotionBlur()) gather_quad_vertices(v0,v1,v2,v3,g,x,y,time);261else gather_quad_vertices(v0,v1,v2,v3,g,x,y);262}263264/*! calculates the build bounds of the i'th quad, if it's valid */265__forceinline bool buildBoundsQuad(const Grid& g, size_t sx, size_t sy, BBox3fa& bbox) const266{267BBox3fa b(empty);268for (size_t t=0; t<numTimeSteps; t++)269{270for (size_t y=sy;y<sy+2;y++)271for (size_t x=sx;x<sx+2;x++)272{273const Vec3fa v = grid_vertex(g,x,y,t);274if (unlikely(!isvalid(v))) return false;275b.extend(v);276}277}278279bbox = b;280return true;281}282283/*! calculates the build bounds of the i'th primitive, if it's valid */284__forceinline bool buildBounds(const Grid& g, size_t sx, size_t sy, BBox3fa& bbox) const285{286BBox3fa b(empty);287for (size_t t=0; t<numTimeSteps; t++)288{289for (size_t y=sy;y<min(sy+3,(size_t)g.resY);y++)290for (size_t x=sx;x<min(sx+3,(size_t)g.resX);x++)291{292const Vec3fa v = grid_vertex(g,x,y,t);293if (unlikely(!isvalid(v))) return false;294b.extend(v);295}296}297298bbox = b;299return true;300}301302/*! calculates the build bounds of the i'th primitive at the itime'th time segment, if it's valid */303__forceinline bool buildBounds(const Grid& g, size_t sx, size_t sy, size_t itime, BBox3fa& bbox) const304{305assert(itime < numTimeSteps);306BBox3fa b0(empty);307for (size_t y=sy;y<min(sy+3,(size_t)g.resY);y++)308for (size_t x=sx;x<min(sx+3,(size_t)g.resX);x++)309{310const Vec3fa v = grid_vertex(g,x,y,itime);311if (unlikely(!isvalid(v))) return false;312b0.extend(v);313}314315/* use bounds of first time step in builder */316bbox = b0;317return true;318}319320__forceinline bool valid(size_t gridID, size_t itime=0) const {321return valid(gridID, make_range(itime, itime));322}323324/*! check if the i'th primitive is valid between the specified time range */325__forceinline bool valid(size_t gridID, const range<size_t>& itime_range) const326{327if (unlikely(gridID >= grids.size())) return false;328const Grid &g = grid(gridID);329if (unlikely(g.startVtxID + 0 >= vertices0.size())) return false;330if (unlikely(g.startVtxID + (g.resY-1)*g.lineVtxOffset + g.resX-1 >= vertices0.size())) return false;331332for (size_t y=0;y<g.resY;y++)333for (size_t x=0;x<g.resX;x++)334for (size_t itime = itime_range.begin(); itime <= itime_range.end(); itime++)335if (!isvalid(grid_vertex(g,x,y,itime))) return false;336return true;337}338339__forceinline BBox3fa bounds(const Grid& g, size_t sx, size_t sy, size_t itime) const340{341BBox3fa box(empty);342buildBounds(g,sx,sy,itime,box);343return box;344}345346__forceinline LBBox3fa linearBounds(const Grid& g, size_t sx, size_t sy, size_t itime) const {347BBox3fa bounds0, bounds1;348buildBounds(g,sx,sy,itime+0,bounds0);349buildBounds(g,sx,sy,itime+1,bounds1);350return LBBox3fa(bounds0,bounds1);351}352353/*! calculates the linear bounds of the i'th primitive for the specified time range */354__forceinline LBBox3fa linearBounds(const Grid& g, size_t sx, size_t sy, const BBox1f& dt) const {355return LBBox3fa([&] (size_t itime) { return bounds(g,sx,sy,itime); }, dt, time_range, fnumTimeSegments);356}357358__forceinline float projectedPrimitiveArea(const size_t i) const {359return pos_inf;360}361362public:363BufferView<Grid> grids; //!< array of triangles364BufferView<Vec3fa> vertices0; //!< fast access to first vertex buffer365Device::vector<BufferView<Vec3fa>> vertices = device; //!< vertex array for each timestep366Device::vector<RawBufferView> vertexAttribs = device; //!< vertex attributes367368#if defined(EMBREE_SYCL_SUPPORT)369370public:371struct PrimID_XY { uint32_t primID; uint16_t x,y; };372Device::vector<PrimID_XY> quadID_to_primID_xy = device; //!< maps a quad to the primitive ID and grid coordinates373#endif374};375376namespace isa377{378struct GridMeshISA : public GridMesh379{380GridMeshISA (Device* device)381: GridMesh(device) {}382383LBBox3fa vlinearBounds(size_t buildID, const BBox1f& time_range, const SubGridBuildData * const sgrids) const override {384const SubGridBuildData &subgrid = sgrids[buildID];385const unsigned int primID = subgrid.primID;386const size_t x = subgrid.x();387const size_t y = subgrid.y();388return linearBounds(grid(primID),x,y,time_range);389}390391#if defined(EMBREE_SYCL_SUPPORT)392PrimInfo createPrimRefArray(PrimRef* prims, const range<size_t>& r, size_t k, unsigned int geomID) const override393{394PrimInfo pinfo(empty);395for (size_t j=r.begin(); j<r.end(); j++)396{397BBox3fa bounds = empty;398const PrimID_XY& quad = quadID_to_primID_xy[j];399if (!buildBoundsQuad(grids[quad.primID],quad.x,quad.y,bounds)) continue;400const PrimRef prim(bounds,geomID,unsigned(j));401pinfo.add_center2(prim);402prims[k++] = prim;403}404return pinfo;405}406#endif407408PrimInfo createPrimRefArray(mvector<PrimRef>& prims, mvector<SubGridBuildData>& sgrids, const range<size_t>& r, size_t k, unsigned int geomID) const override409{410PrimInfo pinfo(empty);411for (size_t j=r.begin(); j<r.end(); j++)412{413if (!valid(j)) continue;414const GridMesh::Grid &g = grid(j);415416for (unsigned int y=0; y<g.resY-1u; y+=2)417{418for (unsigned int x=0; x<g.resX-1u; x+=2)419{420BBox3fa bounds = empty;421if (!buildBounds(g,x,y,bounds)) continue; // get bounds of subgrid422const PrimRef prim(bounds,(unsigned)geomID,(unsigned)k);423pinfo.add_center2(prim);424sgrids[k] = SubGridBuildData(x | g.get3x3FlagsX(x), y | g.get3x3FlagsY(y), unsigned(j));425prims[k++] = prim;426}427}428}429return pinfo;430}431432#if defined(EMBREE_SYCL_SUPPORT)433PrimInfo createPrimRefArrayMB(PrimRef* prims, const BBox1f& time_range, const range<size_t>& r, size_t k, unsigned int geomID) const override434{435const BBox1f t0t1 = BBox1f::intersect(getTimeRange(), time_range);436PrimInfo pinfo(empty);437for (size_t j=r.begin(); j<r.end(); j++)438{439const PrimID_XY& quad = quadID_to_primID_xy[j];440const LBBox3fa lbounds = linearBounds(grids[quad.primID],quad.x,quad.y,t0t1);441const PrimRef prim(lbounds.bounds(), unsigned(geomID), unsigned(j));442pinfo.add_center2(prim);443prims[k++] = prim;444}445return pinfo;446}447#endif448449PrimInfoMB createPrimRefMBArray(mvector<PrimRefMB>& prims, mvector<SubGridBuildData>& sgrids, const BBox1f& t0t1, const range<size_t>& r, size_t k, unsigned int geomID) const override450{451PrimInfoMB pinfoMB(empty);452for (size_t j=r.begin(); j<r.end(); j++)453{454if (!valid(j, timeSegmentRange(t0t1))) continue;455const GridMesh::Grid &g = grid(j);456457for (unsigned int y=0; y<g.resY-1u; y+=2)458{459for (unsigned int x=0; x<g.resX-1u; x+=2)460{461const PrimRefMB prim(linearBounds(g,x,y,t0t1),numTimeSegments(),time_range,numTimeSegments(),unsigned(geomID),unsigned(k));462pinfoMB.add_primref(prim);463sgrids[k] = SubGridBuildData(x | g.get3x3FlagsX(x), y | g.get3x3FlagsY(y), unsigned(j));464prims[k++] = prim;465}466}467}468return pinfoMB;469}470};471}472473DECLARE_ISA_FUNCTION(GridMesh*, createGridMesh, Device*);474}475476477