Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
godotengine
GitHub Repository: godotengine/godot
Path: blob/master/thirdparty/embree/kernels/geometry/quadi.h
9905 views
1
// Copyright 2009-2021 Intel Corporation
2
// SPDX-License-Identifier: Apache-2.0
3
4
#pragma once
5
6
#include "primitive.h"
7
#include "../common/scene.h"
8
9
namespace embree
10
{
11
/* Stores M quads from an indexed face set */
12
template <int M>
13
struct QuadMi
14
{
15
/* Virtual interface to query information about the quad type */
16
struct Type : public PrimitiveType
17
{
18
const char* name() const;
19
size_t sizeActive(const char* This) const;
20
size_t sizeTotal(const char* This) const;
21
size_t getBytes(const char* This) const;
22
};
23
static Type type;
24
25
public:
26
27
/* primitive supports multiple time segments */
28
static const bool singleTimeSegment = false;
29
30
/* Returns maximum number of stored quads */
31
static __forceinline size_t max_size() { return M; }
32
33
/* Returns required number of primitive blocks for N primitives */
34
static __forceinline size_t blocks(size_t N) { return (N+max_size()-1)/max_size(); }
35
36
public:
37
38
/* Default constructor */
39
__forceinline QuadMi() { }
40
41
/* Construction from vertices and IDs */
42
__forceinline QuadMi(const vuint<M>& v0,
43
const vuint<M>& v1,
44
const vuint<M>& v2,
45
const vuint<M>& v3,
46
const vuint<M>& geomIDs,
47
const vuint<M>& primIDs)
48
#if defined(EMBREE_COMPACT_POLYS)
49
: geomIDs(geomIDs), primIDs(primIDs) {}
50
#else
51
: v0_(v0),v1_(v1), v2_(v2), v3_(v3), geomIDs(geomIDs), primIDs(primIDs) {}
52
#endif
53
54
/* Returns a mask that tells which quads are valid */
55
__forceinline vbool<M> valid() const { return primIDs != vuint<M>(-1); }
56
57
/* Returns if the specified quad is valid */
58
__forceinline bool valid(const size_t i) const { assert(i<M); return primIDs[i] != -1; }
59
60
/* Returns the number of stored quads */
61
__forceinline size_t size() const { return bsf(~movemask(valid())); }
62
63
/* Returns the geometry IDs */
64
__forceinline vuint<M>& geomID() { return geomIDs; }
65
__forceinline const vuint<M>& geomID() const { return geomIDs; }
66
__forceinline unsigned int geomID(const size_t i) const { assert(i<M); assert(geomIDs[i] != -1); return geomIDs[i]; }
67
68
/* Returns the primitive IDs */
69
__forceinline vuint<M>& primID() { return primIDs; }
70
__forceinline const vuint<M>& primID() const { return primIDs; }
71
__forceinline unsigned int primID(const size_t i) const { assert(i<M); return primIDs[i]; }
72
73
/* Calculate the bounds of the quads */
74
__forceinline const BBox3fa bounds(const Scene *const scene, const size_t itime=0) const
75
{
76
BBox3fa bounds = empty;
77
for (size_t i=0; i<M && valid(i); i++) {
78
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(i));
79
bounds.extend(mesh->bounds(primID(i),itime));
80
}
81
return bounds;
82
}
83
84
/* Calculate the linear bounds of the primitive */
85
__forceinline LBBox3fa linearBounds(const Scene* const scene, const size_t itime) {
86
return LBBox3fa(bounds(scene,itime+0),bounds(scene,itime+1));
87
}
88
89
__forceinline LBBox3fa linearBounds(const Scene *const scene, size_t itime, size_t numTimeSteps)
90
{
91
LBBox3fa allBounds = empty;
92
for (size_t i=0; i<M && valid(i); i++)
93
{
94
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(i));
95
allBounds.extend(mesh->linearBounds(primID(i), itime, numTimeSteps));
96
}
97
return allBounds;
98
}
99
100
__forceinline LBBox3fa linearBounds(const Scene *const scene, const BBox1f time_range)
101
{
102
LBBox3fa allBounds = empty;
103
for (size_t i=0; i<M && valid(i); i++)
104
{
105
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(i));
106
allBounds.extend(mesh->linearBounds(primID(i), time_range));
107
}
108
return allBounds;
109
}
110
111
/* Fill quad from quad list */
112
template<typename PrimRefT>
113
__forceinline void fill(const PrimRefT* prims, size_t& begin, size_t end, Scene* scene)
114
{
115
vuint<M> geomID = -1, primID = -1;
116
const PrimRefT* prim = &prims[begin];
117
vuint<M> v0 = zero, v1 = zero, v2 = zero, v3 = zero;
118
119
for (size_t i=0; i<M; i++)
120
{
121
if (begin<end) {
122
geomID[i] = prim->geomID();
123
primID[i] = prim->primID();
124
#if !defined(EMBREE_COMPACT_POLYS)
125
const QuadMesh* mesh = scene->get<QuadMesh>(prim->geomID());
126
const QuadMesh::Quad& q = mesh->quad(prim->primID());
127
unsigned int_stride = mesh->vertices0.getStride()/4;
128
v0[i] = q.v[0] * int_stride;
129
v1[i] = q.v[1] * int_stride;
130
v2[i] = q.v[2] * int_stride;
131
v3[i] = q.v[3] * int_stride;
132
#endif
133
begin++;
134
} else {
135
assert(i);
136
if (likely(i > 0)) {
137
geomID[i] = geomID[0]; // always valid geomIDs
138
primID[i] = -1; // indicates invalid data
139
v0[i] = v0[0];
140
v1[i] = v0[0];
141
v2[i] = v0[0];
142
v3[i] = v0[0];
143
}
144
}
145
if (begin<end) prim = &prims[begin];
146
}
147
new (this) QuadMi(v0,v1,v2,v3,geomID,primID); // FIXME: use non temporal store
148
}
149
150
__forceinline LBBox3fa fillMB(const PrimRef* prims, size_t& begin, size_t end, Scene* scene, size_t itime)
151
{
152
fill(prims, begin, end, scene);
153
return linearBounds(scene, itime);
154
}
155
156
__forceinline LBBox3fa fillMB(const PrimRefMB* prims, size_t& begin, size_t end, Scene* scene, const BBox1f time_range)
157
{
158
fill(prims, begin, end, scene);
159
return linearBounds(scene, time_range);
160
}
161
162
friend embree_ostream operator<<(embree_ostream cout, const QuadMi& quad) {
163
return cout << "QuadMi<" << M << ">( "
164
#if !defined(EMBREE_COMPACT_POLYS)
165
<< "v0 = " << quad.v0_ << ", v1 = " << quad.v1_ << ", v2 = " << quad.v2_ << ", v3 = " << quad.v3_ << ", "
166
#endif
167
<< "geomID = " << quad.geomIDs << ", primID = " << quad.primIDs << " )";
168
}
169
170
protected:
171
#if !defined(EMBREE_COMPACT_POLYS)
172
vuint<M> v0_; // 4 byte offset of 1st vertex
173
vuint<M> v1_; // 4 byte offset of 2nd vertex
174
vuint<M> v2_; // 4 byte offset of 3rd vertex
175
vuint<M> v3_; // 4 byte offset of 4th vertex
176
#endif
177
vuint<M> geomIDs; // geometry ID of mesh
178
vuint<M> primIDs; // primitive ID of primitive inside mesh
179
};
180
181
namespace isa
182
{
183
184
template<int M>
185
struct QuadMi : public embree::QuadMi<M>
186
{
187
#if !defined(EMBREE_COMPACT_POLYS)
188
using embree::QuadMi<M>::v0_;
189
using embree::QuadMi<M>::v1_;
190
using embree::QuadMi<M>::v2_;
191
using embree::QuadMi<M>::v3_;
192
#endif
193
using embree::QuadMi<M>::geomIDs;
194
using embree::QuadMi<M>::primIDs;
195
using embree::QuadMi<M>::geomID;
196
using embree::QuadMi<M>::primID;
197
using embree::QuadMi<M>::valid;
198
199
template<int vid>
200
__forceinline Vec3f getVertex(const size_t index, const Scene *const scene) const
201
{
202
#if defined(EMBREE_COMPACT_POLYS)
203
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(index));
204
const QuadMesh::Quad& quad = mesh->quad(primID(index));
205
return (Vec3f) mesh->vertices[0][quad.v[vid]];
206
#else
207
const vuint<M>& v = getVertexOffset<vid>();
208
const float* vertices = scene->vertices[geomID(index)];
209
return (Vec3f&) vertices[v[index]];
210
#endif
211
}
212
213
template<int vid, typename T>
214
__forceinline Vec3<T> getVertex(const size_t index, const Scene *const scene, const size_t itime, const T& ftime) const
215
{
216
#if defined(EMBREE_COMPACT_POLYS)
217
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(index));
218
const QuadMesh::Quad& quad = mesh->quad(primID(index));
219
const Vec3fa v0 = mesh->vertices[itime+0][quad.v[vid]];
220
const Vec3fa v1 = mesh->vertices[itime+1][quad.v[vid]];
221
#else
222
const vuint<M>& v = getVertexOffset<vid>();
223
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(index));
224
const float* vertices0 = (const float*) mesh->vertexPtr(0,itime+0);
225
const float* vertices1 = (const float*) mesh->vertexPtr(0,itime+1);
226
const Vec3fa v0 = Vec3fa::loadu(vertices0+v[index]);
227
const Vec3fa v1 = Vec3fa::loadu(vertices1+v[index]);
228
#endif
229
const Vec3<T> p0(v0.x,v0.y,v0.z);
230
const Vec3<T> p1(v1.x,v1.y,v1.z);
231
return lerp(p0,p1,ftime);
232
}
233
234
template<int vid, int K, typename T>
235
__forceinline Vec3<T> getVertex(const vbool<K>& valid, const size_t index, const Scene *const scene, const vint<K>& itime, const T& ftime) const
236
{
237
Vec3<T> p0, p1;
238
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(index));
239
240
for (size_t mask=movemask(valid), i=bsf(mask); mask; mask=btc(mask,i), i=bsf(mask))
241
{
242
#if defined(EMBREE_COMPACT_POLYS)
243
const QuadMesh::Quad& quad = mesh->quad(primID(index));
244
const Vec3fa v0 = mesh->vertices[itime[i]+0][quad.v[vid]];
245
const Vec3fa v1 = mesh->vertices[itime[i]+1][quad.v[vid]];
246
#else
247
const vuint<M>& v = getVertexOffset<vid>();
248
const float* vertices0 = (const float*) mesh->vertexPtr(0,itime[i]+0);
249
const float* vertices1 = (const float*) mesh->vertexPtr(0,itime[i]+1);
250
const Vec3fa v0 = Vec3fa::loadu(vertices0+v[index]);
251
const Vec3fa v1 = Vec3fa::loadu(vertices1+v[index]);
252
#endif
253
p0.x[i] = v0.x; p0.y[i] = v0.y; p0.z[i] = v0.z;
254
p1.x[i] = v1.x; p1.y[i] = v1.y; p1.z[i] = v1.z;
255
}
256
return (T(one)-ftime)*p0 + ftime*p1;
257
}
258
259
struct Quad {
260
vfloat4 v0,v1,v2,v3;
261
};
262
263
#if defined(EMBREE_COMPACT_POLYS)
264
265
__forceinline Quad loadQuad(const int i, const Scene* const scene) const
266
{
267
const unsigned int geomID = geomIDs[i];
268
const unsigned int primID = primIDs[i];
269
if (unlikely(primID == -1)) return { zero, zero, zero, zero };
270
const QuadMesh* mesh = scene->get<QuadMesh>(geomID);
271
const QuadMesh::Quad& quad = mesh->quad(primID);
272
const vfloat4 v0 = (vfloat4) mesh->vertices0[quad.v[0]];
273
const vfloat4 v1 = (vfloat4) mesh->vertices0[quad.v[1]];
274
const vfloat4 v2 = (vfloat4) mesh->vertices0[quad.v[2]];
275
const vfloat4 v3 = (vfloat4) mesh->vertices0[quad.v[3]];
276
return { v0, v1, v2, v3 };
277
}
278
279
__forceinline Quad loadQuad(const int i, const int itime, const Scene* const scene) const
280
{
281
const unsigned int geomID = geomIDs[i];
282
const unsigned int primID = primIDs[i];
283
if (unlikely(primID == -1)) return { zero, zero, zero, zero };
284
const QuadMesh* mesh = scene->get<QuadMesh>(geomID);
285
const QuadMesh::Quad& quad = mesh->quad(primID);
286
const vfloat4 v0 = (vfloat4) mesh->vertices[itime][quad.v[0]];
287
const vfloat4 v1 = (vfloat4) mesh->vertices[itime][quad.v[1]];
288
const vfloat4 v2 = (vfloat4) mesh->vertices[itime][quad.v[2]];
289
const vfloat4 v3 = (vfloat4) mesh->vertices[itime][quad.v[3]];
290
return { v0, v1, v2, v3 };
291
}
292
293
#else
294
295
__forceinline Quad loadQuad(const int i, const Scene* const scene) const
296
{
297
const float* vertices = scene->vertices[geomID(i)];
298
const vfloat4 v0 = vfloat4::loadu(vertices + v0_[i]);
299
const vfloat4 v1 = vfloat4::loadu(vertices + v1_[i]);
300
const vfloat4 v2 = vfloat4::loadu(vertices + v2_[i]);
301
const vfloat4 v3 = vfloat4::loadu(vertices + v3_[i]);
302
return { v0, v1, v2, v3 };
303
}
304
305
__forceinline Quad loadQuad(const int i, const int itime, const Scene* const scene) const
306
{
307
const unsigned int geomID = geomIDs[i];
308
const QuadMesh* mesh = scene->get<QuadMesh>(geomID);
309
const float* vertices = (const float*) mesh->vertexPtr(0,itime);
310
const vfloat4 v0 = vfloat4::loadu(vertices + v0_[i]);
311
const vfloat4 v1 = vfloat4::loadu(vertices + v1_[i]);
312
const vfloat4 v2 = vfloat4::loadu(vertices + v2_[i]);
313
const vfloat4 v3 = vfloat4::loadu(vertices + v3_[i]);
314
return { v0, v1, v2, v3 };
315
}
316
317
#endif
318
319
/* Gather the quads */
320
__forceinline void gather(Vec3vf<M>& p0,
321
Vec3vf<M>& p1,
322
Vec3vf<M>& p2,
323
Vec3vf<M>& p3,
324
const Scene *const scene) const;
325
326
#if defined(__AVX512F__)
327
__forceinline void gather(Vec3vf16& p0,
328
Vec3vf16& p1,
329
Vec3vf16& p2,
330
Vec3vf16& p3,
331
const Scene *const scene) const;
332
#endif
333
334
template<int K>
335
#if defined(__INTEL_COMPILER) && (__INTEL_COMPILER < 2000) // workaround for compiler bug in ICC 2019
336
__noinline
337
#else
338
__forceinline
339
#endif
340
void gather(const vbool<K>& valid,
341
Vec3vf<K>& p0,
342
Vec3vf<K>& p1,
343
Vec3vf<K>& p2,
344
Vec3vf<K>& p3,
345
const size_t index,
346
const Scene* const scene,
347
const vfloat<K>& time) const
348
{
349
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(index));
350
351
vfloat<K> ftime;
352
const vint<K> itime = mesh->timeSegment<K>(time, ftime);
353
354
const size_t first = bsf(movemask(valid));
355
if (likely(all(valid,itime[first] == itime)))
356
{
357
p0 = getVertex<0>(index, scene, itime[first], ftime);
358
p1 = getVertex<1>(index, scene, itime[first], ftime);
359
p2 = getVertex<2>(index, scene, itime[first], ftime);
360
p3 = getVertex<3>(index, scene, itime[first], ftime);
361
}
362
else
363
{
364
p0 = getVertex<0,K>(valid, index, scene, itime, ftime);
365
p1 = getVertex<1,K>(valid, index, scene, itime, ftime);
366
p2 = getVertex<2,K>(valid, index, scene, itime, ftime);
367
p3 = getVertex<3,K>(valid, index, scene, itime, ftime);
368
}
369
}
370
371
__forceinline void gather(Vec3vf<M>& p0,
372
Vec3vf<M>& p1,
373
Vec3vf<M>& p2,
374
Vec3vf<M>& p3,
375
const QuadMesh* mesh,
376
const Scene *const scene,
377
const int itime) const;
378
379
__forceinline void gather(Vec3vf<M>& p0,
380
Vec3vf<M>& p1,
381
Vec3vf<M>& p2,
382
Vec3vf<M>& p3,
383
const Scene *const scene,
384
const float time) const;
385
386
/* Updates the primitive */
387
__forceinline BBox3fa update(QuadMesh* mesh)
388
{
389
BBox3fa bounds = empty;
390
for (size_t i=0; i<M; i++)
391
{
392
if (!valid(i)) break;
393
const unsigned primId = primID(i);
394
const QuadMesh::Quad& q = mesh->quad(primId);
395
const Vec3fa p0 = mesh->vertex(q.v[0]);
396
const Vec3fa p1 = mesh->vertex(q.v[1]);
397
const Vec3fa p2 = mesh->vertex(q.v[2]);
398
const Vec3fa p3 = mesh->vertex(q.v[3]);
399
bounds.extend(merge(BBox3fa(p0),BBox3fa(p1),BBox3fa(p2),BBox3fa(p3)));
400
}
401
return bounds;
402
}
403
404
private:
405
#if !defined(EMBREE_COMPACT_POLYS)
406
template<int N> const vuint<M>& getVertexOffset() const;
407
#endif
408
};
409
410
#if !defined(EMBREE_COMPACT_POLYS)
411
template<> template<> __forceinline const vuint<4>& QuadMi<4>::getVertexOffset<0>() const { return v0_; }
412
template<> template<> __forceinline const vuint<4>& QuadMi<4>::getVertexOffset<1>() const { return v1_; }
413
template<> template<> __forceinline const vuint<4>& QuadMi<4>::getVertexOffset<2>() const { return v2_; }
414
template<> template<> __forceinline const vuint<4>& QuadMi<4>::getVertexOffset<3>() const { return v3_; }
415
#endif
416
417
template<>
418
__forceinline void QuadMi<4>::gather(Vec3vf4& p0,
419
Vec3vf4& p1,
420
Vec3vf4& p2,
421
Vec3vf4& p3,
422
const Scene *const scene) const
423
{
424
prefetchL1(((char*)this)+0*64);
425
prefetchL1(((char*)this)+1*64);
426
const Quad tri0 = loadQuad(0,scene);
427
const Quad tri1 = loadQuad(1,scene);
428
const Quad tri2 = loadQuad(2,scene);
429
const Quad tri3 = loadQuad(3,scene);
430
transpose(tri0.v0,tri1.v0,tri2.v0,tri3.v0,p0.x,p0.y,p0.z);
431
transpose(tri0.v1,tri1.v1,tri2.v1,tri3.v1,p1.x,p1.y,p1.z);
432
transpose(tri0.v2,tri1.v2,tri2.v2,tri3.v2,p2.x,p2.y,p2.z);
433
transpose(tri0.v3,tri1.v3,tri2.v3,tri3.v3,p3.x,p3.y,p3.z);
434
}
435
436
template<>
437
__forceinline void QuadMi<4>::gather(Vec3vf4& p0,
438
Vec3vf4& p1,
439
Vec3vf4& p2,
440
Vec3vf4& p3,
441
const QuadMesh* mesh,
442
const Scene *const scene,
443
const int itime) const
444
{
445
// FIXME: for trianglei there all geometries are identical, is this the case here too?
446
447
const Quad tri0 = loadQuad(0,itime,scene);
448
const Quad tri1 = loadQuad(1,itime,scene);
449
const Quad tri2 = loadQuad(2,itime,scene);
450
const Quad tri3 = loadQuad(3,itime,scene);
451
transpose(tri0.v0,tri1.v0,tri2.v0,tri3.v0,p0.x,p0.y,p0.z);
452
transpose(tri0.v1,tri1.v1,tri2.v1,tri3.v1,p1.x,p1.y,p1.z);
453
transpose(tri0.v2,tri1.v2,tri2.v2,tri3.v2,p2.x,p2.y,p2.z);
454
transpose(tri0.v3,tri1.v3,tri2.v3,tri3.v3,p3.x,p3.y,p3.z);
455
}
456
457
template<>
458
__forceinline void QuadMi<4>::gather(Vec3vf4& p0,
459
Vec3vf4& p1,
460
Vec3vf4& p2,
461
Vec3vf4& p3,
462
const Scene *const scene,
463
const float time) const
464
{
465
const QuadMesh* mesh = scene->get<QuadMesh>(geomID(0)); // in mblur mode all geometries are identical
466
467
float ftime;
468
const int itime = mesh->timeSegment(time, ftime);
469
470
Vec3vf4 a0,a1,a2,a3; gather(a0,a1,a2,a3,mesh,scene,itime);
471
Vec3vf4 b0,b1,b2,b3; gather(b0,b1,b2,b3,mesh,scene,itime+1);
472
p0 = lerp(a0,b0,vfloat4(ftime));
473
p1 = lerp(a1,b1,vfloat4(ftime));
474
p2 = lerp(a2,b2,vfloat4(ftime));
475
p3 = lerp(a3,b3,vfloat4(ftime));
476
}
477
}
478
479
template<int M>
480
typename QuadMi<M>::Type QuadMi<M>::type;
481
482
typedef QuadMi<4> Quad4i;
483
}
484
485