Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
godotengine
GitHub Repository: godotengine/godot
Path: blob/master/thirdparty/embree/kernels/common/scene_grid_mesh.h
9905 views
1
// Copyright 2009-2021 Intel Corporation
2
// SPDX-License-Identifier: Apache-2.0
3
4
#pragma once
5
6
#include "geometry.h"
7
#include "buffer.h"
8
9
namespace embree
10
{
11
/*! Grid Mesh */
12
struct GridMesh : public Geometry
13
{
14
/*! type of this geometry */
15
static const Geometry::GTypeMask geom_type = Geometry::MTY_GRID_MESH;
16
17
/*! grid */
18
struct Grid
19
{
20
unsigned int startVtxID;
21
unsigned int lineVtxOffset;
22
unsigned short resX,resY;
23
24
/* border flags due to 3x3 vertex pattern */
25
__forceinline unsigned int get3x3FlagsX(const unsigned int x) const
26
{
27
return (x + 2 >= (unsigned int)resX) ? (1<<15) : 0;
28
}
29
30
/* border flags due to 3x3 vertex pattern */
31
__forceinline unsigned int get3x3FlagsY(const unsigned int y) const
32
{
33
return (y + 2 >= (unsigned int)resY) ? (1<<15) : 0;
34
}
35
36
/*! outputs grid structure */
37
__forceinline friend embree_ostream operator<<(embree_ostream cout, const Grid& t) {
38
return cout << "Grid { startVtxID " << t.startVtxID << ", lineVtxOffset " << t.lineVtxOffset << ", resX " << t.resX << ", resY " << t.resY << " }";
39
}
40
};
41
42
public:
43
44
/*! grid mesh construction */
45
GridMesh (Device* device);
46
47
/* geometry interface */
48
public:
49
void setMask(unsigned mask);
50
void setNumTimeSteps (unsigned int numTimeSteps);
51
void setVertexAttributeCount (unsigned int N);
52
void setBuffer(RTCBufferType type, unsigned int slot, RTCFormat format, const Ref<Buffer>& buffer, size_t offset, size_t stride, unsigned int num);
53
void* getBufferData(RTCBufferType type, unsigned int slot, BufferDataPointerType pointerType);
54
void updateBuffer(RTCBufferType type, unsigned int slot);
55
void commit();
56
bool verify();
57
void interpolate(const RTCInterpolateArguments* const args);
58
59
#if defined(EMBREE_SYCL_SUPPORT)
60
61
size_t getGeometryDataDeviceByteSize() const;
62
void convertToDeviceRepresentation(size_t offset, char* data_host, char* data_device) const;
63
64
#endif
65
66
template<int N>
67
void interpolate_impl(const RTCInterpolateArguments* const args)
68
{
69
unsigned int primID = args->primID;
70
float U = args->u;
71
float V = args->v;
72
73
/* clamp input u,v to [0;1] range */
74
U = max(min(U,1.0f),0.0f);
75
V = max(min(V,1.0f),0.0f);
76
77
RTCBufferType bufferType = args->bufferType;
78
unsigned int bufferSlot = args->bufferSlot;
79
float* P = args->P;
80
float* dPdu = args->dPdu;
81
float* dPdv = args->dPdv;
82
float* ddPdudu = args->ddPdudu;
83
float* ddPdvdv = args->ddPdvdv;
84
float* ddPdudv = args->ddPdudv;
85
unsigned int valueCount = args->valueCount;
86
87
/* calculate base pointer and stride */
88
assert((bufferType == RTC_BUFFER_TYPE_VERTEX && bufferSlot < numTimeSteps) ||
89
(bufferType == RTC_BUFFER_TYPE_VERTEX_ATTRIBUTE && bufferSlot <= vertexAttribs.size()));
90
const char* src = nullptr;
91
size_t stride = 0;
92
if (bufferType == RTC_BUFFER_TYPE_VERTEX_ATTRIBUTE) {
93
src = vertexAttribs[bufferSlot].getPtr();
94
stride = vertexAttribs[bufferSlot].getStride();
95
} else {
96
src = vertices[bufferSlot].getPtr();
97
stride = vertices[bufferSlot].getStride();
98
}
99
100
const Grid& grid = grids[primID];
101
const int grid_width = grid.resX-1;
102
const int grid_height = grid.resY-1;
103
const float rcp_grid_width = rcp(float(grid_width));
104
const float rcp_grid_height = rcp(float(grid_height));
105
const int iu = min((int)floor(U*grid_width ),grid_width);
106
const int iv = min((int)floor(V*grid_height),grid_height);
107
const float u = U*grid_width-float(iu);
108
const float v = V*grid_height-float(iv);
109
110
for (unsigned int i=0; i<valueCount; i+=N)
111
{
112
const size_t ofs = i*sizeof(float);
113
const unsigned int idx0 = grid.startVtxID + (iv+0)*grid.lineVtxOffset + iu;
114
const unsigned int idx1 = grid.startVtxID + (iv+1)*grid.lineVtxOffset + iu;
115
116
const vbool<N> valid = vint<N>((int)i)+vint<N>(step) < vint<N>(int(valueCount));
117
const vfloat<N> p0 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx0+0)*stride+ofs]);
118
const vfloat<N> p1 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx0+1)*stride+ofs]);
119
const vfloat<N> p2 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx1+1)*stride+ofs]);
120
const vfloat<N> p3 = mem<vfloat<N>>::loadu(valid,(float*)&src[(idx1+0)*stride+ofs]);
121
const vbool<N> left = u+v <= 1.0f;
122
const vfloat<N> Q0 = select(left,p0,p2);
123
const vfloat<N> Q1 = select(left,p1,p3);
124
const vfloat<N> Q2 = select(left,p3,p1);
125
const vfloat<N> U = select(left,u,vfloat<N>(1.0f)-u);
126
const vfloat<N> V = select(left,v,vfloat<N>(1.0f)-v);
127
const vfloat<N> W = 1.0f-U-V;
128
129
if (P) {
130
mem<vfloat<N>>::storeu(valid,P+i,madd(W,Q0,madd(U,Q1,V*Q2)));
131
}
132
if (dPdu) {
133
assert(dPdu); mem<vfloat<N>>::storeu(valid,dPdu+i,select(left,Q1-Q0,Q0-Q1)*rcp_grid_width);
134
assert(dPdv); mem<vfloat<N>>::storeu(valid,dPdv+i,select(left,Q2-Q0,Q0-Q2)*rcp_grid_height);
135
}
136
if (ddPdudu) {
137
assert(ddPdudu); mem<vfloat<N>>::storeu(valid,ddPdudu+i,vfloat<N>(zero));
138
assert(ddPdvdv); mem<vfloat<N>>::storeu(valid,ddPdvdv+i,vfloat<N>(zero));
139
assert(ddPdudv); mem<vfloat<N>>::storeu(valid,ddPdudv+i,vfloat<N>(zero));
140
}
141
}
142
}
143
144
void addElementsToCount (GeometryCounts & counts) const;
145
146
/*! sums getNumQuads() over all primitives of the mesh */
__forceinline unsigned int getNumTotalQuads() const
{
  size_t total = 0;
  size_t gridID = 0;
  while (gridID < numPrimitives) {
    total += getNumQuads(gridID);
    ++gridID;
  }
  return (unsigned int) total;
}
153
154
/*! returns (resX-1)*(resY-1) for the specified grid, but at least 1 */
__forceinline unsigned int getNumQuads(const size_t gridID) const
{
  const Grid& g = grid(gridID);
  const int quadsX = (int)g.resX-1;
  const int quadsY = (int)g.resY-1;
  return (unsigned int) max((int)1,quadsX * quadsY);
}
159
160
/*! returns (resX/2)*(resY/2) for the specified grid, but at least 1 */
__forceinline unsigned int getNumSubGrids(const size_t gridID) const
{
  const Grid& g = grid(gridID);
  const unsigned int subGridsX = (unsigned int)g.resX >> 1;
  const unsigned int subGridsY = (unsigned int)g.resY >> 1;
  return max((unsigned int)1,subGridsX * subGridsY);
}
165
166
/*! get fast access to first vertex buffer */
167
__forceinline float * getCompactVertexArray () const {
168
return (float*) vertices0.getPtr();
169
}
170
171
public:
172
173
/*! returns number of vertices */
174
__forceinline size_t numVertices() const {
175
return vertices[0].size();
176
}
177
178
/*! returns i'th grid*/
179
__forceinline const Grid& grid(size_t i) const {
180
return grids[i];
181
}
182
183
/*! returns i'th vertex of the first time step */
184
__forceinline const Vec3fa vertex(size_t i) const { // FIXME: check if this does a unaligned load
185
return vertices0[i];
186
}
187
188
/*! returns i'th vertex of the first time step */
189
__forceinline const char* vertexPtr(size_t i) const {
190
return vertices0.getPtr(i);
191
}
192
193
/*! returns i'th vertex of itime'th timestep */
194
__forceinline const Vec3fa vertex(size_t i, size_t itime) const {
195
return vertices[itime][i];
196
}
197
198
/*! returns i'th vertex of for specified time */
199
__forceinline const Vec3fa vertex(size_t i, float time) const
200
{
201
float ftime;
202
const size_t itime = timeSegment(time, ftime);
203
const float t0 = 1.0f - ftime;
204
const float t1 = ftime;
205
Vec3fa v0 = vertex(i, itime+0);
206
Vec3fa v1 = vertex(i, itime+1);
207
return madd(Vec3fa(t0),v0,t1*v1);
208
}
209
210
/*! returns i'th vertex of itime'th timestep */
211
__forceinline const char* vertexPtr(size_t i, size_t itime) const {
212
return vertices[itime].getPtr(i);
213
}
214
215
/*! returns i'th vertex of the first timestep */
216
__forceinline size_t grid_vertex_index(const Grid& g, size_t x, size_t y) const {
217
assert(x < (size_t)g.resX);
218
assert(y < (size_t)g.resY);
219
return g.startVtxID + x + y * g.lineVtxOffset;
220
}
221
222
/*! returns i'th vertex of the first timestep */
223
__forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y) const {
224
const size_t index = grid_vertex_index(g,x,y);
225
return vertex(index);
226
}
227
228
/*! returns i'th vertex of the itime'th timestep */
229
__forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y, size_t itime) const {
230
const size_t index = grid_vertex_index(g,x,y);
231
return vertex(index,itime);
232
}
233
234
/*! returns i'th vertex of the itime'th timestep */
235
__forceinline const Vec3fa grid_vertex(const Grid& g, size_t x, size_t y, float time) const {
236
const size_t index = grid_vertex_index(g,x,y);
237
return vertex(index,time);
238
}
239
240
/*! gathers quad vertices */
241
__forceinline void gather_quad_vertices(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y) const
242
{
243
v0 = grid_vertex(g,x+0,y+0);
244
v1 = grid_vertex(g,x+1,y+0);
245
v2 = grid_vertex(g,x+1,y+1);
246
v3 = grid_vertex(g,x+0,y+1);
247
}
248
249
/*! gathers quad vertices for specified time */
250
__forceinline void gather_quad_vertices(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y, float time) const
251
{
252
v0 = grid_vertex(g,x+0,y+0,time);
253
v1 = grid_vertex(g,x+1,y+0,time);
254
v2 = grid_vertex(g,x+1,y+1,time);
255
v3 = grid_vertex(g,x+0,y+1,time);
256
}
257
258
/*! gathers quad vertices for mblur and non-mblur meshes */
259
__forceinline void gather_quad_vertices_safe(Vec3fa& v0, Vec3fa& v1, Vec3fa& v2, Vec3fa& v3, const Grid& g, size_t x, size_t y, float time) const
260
{
261
if (hasMotionBlur()) gather_quad_vertices(v0,v1,v2,v3,g,x,y,time);
262
else gather_quad_vertices(v0,v1,v2,v3,g,x,y);
263
}
264
265
/*! calculates the build bounds of the i'th quad, if it's valid */
266
__forceinline bool buildBoundsQuad(const Grid& g, size_t sx, size_t sy, BBox3fa& bbox) const
267
{
268
BBox3fa b(empty);
269
for (size_t t=0; t<numTimeSteps; t++)
270
{
271
for (size_t y=sy;y<sy+2;y++)
272
for (size_t x=sx;x<sx+2;x++)
273
{
274
const Vec3fa v = grid_vertex(g,x,y,t);
275
if (unlikely(!isvalid(v))) return false;
276
b.extend(v);
277
}
278
}
279
280
bbox = b;
281
return true;
282
}
283
284
/*! calculates the build bounds of the i'th primitive, if it's valid */
285
__forceinline bool buildBounds(const Grid& g, size_t sx, size_t sy, BBox3fa& bbox) const
286
{
287
BBox3fa b(empty);
288
for (size_t t=0; t<numTimeSteps; t++)
289
{
290
for (size_t y=sy;y<min(sy+3,(size_t)g.resY);y++)
291
for (size_t x=sx;x<min(sx+3,(size_t)g.resX);x++)
292
{
293
const Vec3fa v = grid_vertex(g,x,y,t);
294
if (unlikely(!isvalid(v))) return false;
295
b.extend(v);
296
}
297
}
298
299
bbox = b;
300
return true;
301
}
302
303
/*! calculates the build bounds of the i'th primitive at the itime'th time segment, if it's valid */
304
__forceinline bool buildBounds(const Grid& g, size_t sx, size_t sy, size_t itime, BBox3fa& bbox) const
305
{
306
assert(itime < numTimeSteps);
307
BBox3fa b0(empty);
308
for (size_t y=sy;y<min(sy+3,(size_t)g.resY);y++)
309
for (size_t x=sx;x<min(sx+3,(size_t)g.resX);x++)
310
{
311
const Vec3fa v = grid_vertex(g,x,y,itime);
312
if (unlikely(!isvalid(v))) return false;
313
b0.extend(v);
314
}
315
316
/* use bounds of first time step in builder */
317
bbox = b0;
318
return true;
319
}
320
321
/*! checks if the grid is valid at the single time step itime */
__forceinline bool valid(size_t gridID, size_t itime=0) const
{
  const range<size_t> single_step = make_range(itime, itime);
  return valid(gridID, single_step);
}
324
325
/*! check if the i'th primitive is valid between the specified time range */
326
__forceinline bool valid(size_t gridID, const range<size_t>& itime_range) const
327
{
328
if (unlikely(gridID >= grids.size())) return false;
329
const Grid &g = grid(gridID);
330
if (unlikely(g.startVtxID + 0 >= vertices0.size())) return false;
331
if (unlikely(g.startVtxID + (g.resY-1)*g.lineVtxOffset + g.resX-1 >= vertices0.size())) return false;
332
333
for (size_t y=0;y<g.resY;y++)
334
for (size_t x=0;x<g.resX;x++)
335
for (size_t itime = itime_range.begin(); itime <= itime_range.end(); itime++)
336
if (!isvalid(grid_vertex(g,x,y,itime))) return false;
337
return true;
338
}
339
340
/*! returns the buildBounds() result for time step itime; the box stays empty if buildBounds() fails */
__forceinline BBox3fa bounds(const Grid& g, size_t sx, size_t sy, size_t itime) const
{
  BBox3fa result(empty);
  buildBounds(g,sx,sy,itime,result);
  return result;
}
346
347
/*! Returns the linear bounds of the sub-grid at (sx,sy) for the time segment
 *  [itime,itime+1], built from the per time step bounds of both ends.
 *  Both boxes start out empty, matching bounds(): buildBounds() leaves its
 *  output untouched when it fails, so no uninitialized box is ever returned. */
__forceinline LBBox3fa linearBounds(const Grid& g, size_t sx, size_t sy, size_t itime) const {
  BBox3fa bounds0(empty);
  BBox3fa bounds1(empty);
  buildBounds(g,sx,sy,itime+0,bounds0);
  buildBounds(g,sx,sy,itime+1,bounds1);
  return LBBox3fa(bounds0,bounds1);
}
353
354
/*! calculates the linear bounds of the i'th primitive for the specified time range */
355
__forceinline LBBox3fa linearBounds(const Grid& g, size_t sx, size_t sy, const BBox1f& dt) const {
356
return LBBox3fa([&] (size_t itime) { return bounds(g,sx,sy,itime); }, dt, time_range, fnumTimeSegments);
357
}
358
359
/*! always returns pos_inf, independent of the primitive index */
__forceinline float projectedPrimitiveArea(const size_t i) const
{
  const float area = pos_inf;
  return area;
}
362
363
public:
364
BufferView<Grid> grids; //!< array of grids, indexed by primitive ID
365
BufferView<Vec3fa> vertices0; //!< fast access to first vertex buffer
366
Device::vector<BufferView<Vec3fa>> vertices = device; //!< vertex array for each timestep
367
Device::vector<RawBufferView> vertexAttribs = device; //!< vertex attributes
368
369
#if defined(EMBREE_SYCL_SUPPORT)
370
371
public:
372
struct PrimID_XY { uint32_t primID; uint16_t x,y; };
373
Device::vector<PrimID_XY> quadID_to_primID_xy = device; //!< maps a quad to the primitive ID and grid coordinates
374
#endif
375
};
376
377
namespace isa
378
{
379
struct GridMeshISA : public GridMesh
380
{
381
/*! forwards the device to the GridMesh base class */
GridMeshISA (Device* device) : GridMesh(device)
{
}
383
384
/*! returns the linear bounds over time_range of the sub-grid stored at sgrids[buildID] */
LBBox3fa vlinearBounds(size_t buildID, const BBox1f& time_range, const SubGridBuildData * const sgrids) const override
{
  const SubGridBuildData& entry = sgrids[buildID];
  const size_t startX = entry.x();
  const size_t startY = entry.y();
  const unsigned int gridID = entry.primID;
  return linearBounds(grid(gridID),startX,startY,time_range);
}
391
392
#if defined(EMBREE_SYCL_SUPPORT)
393
/*! Creates one PrimRef per valid quad with ID in range r, writing them to
 *  prims starting at index k. Quads for which buildBoundsQuad() fails are
 *  skipped. Returns the accumulated PrimInfo. */
PrimInfo createPrimRefArray(PrimRef* prims, const range<size_t>& r, size_t k, unsigned int geomID) const override
{
  PrimInfo info(empty);
  const size_t last = r.end();
  for (size_t quadID=r.begin(); quadID<last; quadID++)
  {
    BBox3fa box = empty;
    const PrimID_XY& quad = quadID_to_primID_xy[quadID];
    if (buildBoundsQuad(grids[quad.primID],quad.x,quad.y,box))
    {
      const PrimRef ref(box,geomID,unsigned(quadID));
      info.add_center2(ref);
      prims[k++] = ref;
    }
  }
  return info;
}
407
#endif
408
409
/*! Splits every valid grid with ID in range r into sub-grids that start at
 *  every second vertex in x and y. For each sub-grid with valid bounds a
 *  PrimRef and a SubGridBuildData entry (start position with 3x3 border
 *  flags, grid ID) are written at index k, which is then advanced.
 *  Returns the accumulated PrimInfo. */
PrimInfo createPrimRefArray(mvector<PrimRef>& prims, mvector<SubGridBuildData>& sgrids, const range<size_t>& r, size_t k, unsigned int geomID) const override
{
  PrimInfo info(empty);
  const size_t last = r.end();
  for (size_t gridID=r.begin(); gridID<last; gridID++)
  {
    if (!valid(gridID)) continue;
    const GridMesh::Grid& g = grid(gridID);
    const unsigned int endY = g.resY-1u;
    const unsigned int endX = g.resX-1u;

    for (unsigned int y=0; y<endY; y+=2)
      for (unsigned int x=0; x<endX; x+=2)
      {
        BBox3fa box = empty;
        if (buildBounds(g,x,y,box)) // get bounds of subgrid
        {
          const PrimRef ref(box,(unsigned)geomID,(unsigned)k);
          info.add_center2(ref);
          sgrids[k] = SubGridBuildData(x | g.get3x3FlagsX(x), y | g.get3x3FlagsY(y), unsigned(gridID));
          prims[k++] = ref;
        }
      }
  }
  return info;
}
432
433
#if defined(EMBREE_SYCL_SUPPORT)
434
/*! Creates one PrimRef per quad with ID in range r, bounded over the
 *  intersection of the geometry time range and time_range, writing them to
 *  prims starting at index k. Returns the accumulated PrimInfo. */
PrimInfo createPrimRefArrayMB(PrimRef* prims, const BBox1f& time_range, const range<size_t>& r, size_t k, unsigned int geomID) const override
{
  const BBox1f clipped_range = BBox1f::intersect(getTimeRange(), time_range);
  PrimInfo info(empty);
  const size_t last = r.end();
  for (size_t quadID=r.begin(); quadID<last; quadID++)
  {
    const PrimID_XY& quad = quadID_to_primID_xy[quadID];
    const LBBox3fa lbox = linearBounds(grids[quad.primID],quad.x,quad.y,clipped_range);
    const PrimRef ref(lbox.bounds(), unsigned(geomID), unsigned(quadID));
    info.add_center2(ref);
    prims[k++] = ref;
  }
  return info;
}
448
#endif
449
450
/*! Splits every grid with ID in range r that is valid over the time segments
 *  of t0t1 into sub-grids that start at every second vertex in x and y. For
 *  each sub-grid a PrimRefMB with linear bounds over t0t1 and a
 *  SubGridBuildData entry (start position with 3x3 border flags, grid ID) are
 *  written at index k, which is then advanced. Returns the accumulated
 *  PrimInfoMB. */
PrimInfoMB createPrimRefMBArray(mvector<PrimRefMB>& prims, mvector<SubGridBuildData>& sgrids, const BBox1f& t0t1, const range<size_t>& r, size_t k, unsigned int geomID) const override
{
  PrimInfoMB infoMB(empty);
  const size_t last = r.end();
  for (size_t gridID=r.begin(); gridID<last; gridID++)
  {
    if (!valid(gridID, timeSegmentRange(t0t1))) continue;
    const GridMesh::Grid& g = grid(gridID);
    const unsigned int endY = g.resY-1u;
    const unsigned int endX = g.resX-1u;

    for (unsigned int y=0; y<endY; y+=2)
      for (unsigned int x=0; x<endX; x+=2)
      {
        const PrimRefMB ref(linearBounds(g,x,y,t0t1),numTimeSegments(),time_range,numTimeSegments(),unsigned(geomID),unsigned(k));
        infoMB.add_primref(ref);
        sgrids[k] = SubGridBuildData(x | g.get3x3FlagsX(x), y | g.get3x3FlagsY(y), unsigned(gridID));
        prims[k++] = ref;
      }
  }
  return infoMB;
}
471
};
472
}
473
474
DECLARE_ISA_FUNCTION(GridMesh*, createGridMesh, Device*);
475
}
476
477