Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
godotengine
GitHub Repository: godotengine/godot
Path: blob/master/thirdparty/embree/kernels/subdiv/patch_eval_simd.h
9913 views
1
// Copyright 2009-2021 Intel Corporation
2
// SPDX-License-Identifier: Apache-2.0
3
4
#pragma once
5
6
#include "patch.h"
7
#include "feature_adaptive_eval_simd.h"
8
9
namespace embree
10
{
11
namespace isa
12
{
13
template<typename vbool, typename vint, typename vfloat, typename Vertex, typename Vertex_t = Vertex>
14
struct PatchEvalSimd
15
{
16
public:
17
18
typedef PatchT<Vertex,Vertex_t> Patch;
19
typedef typename Patch::Ref Ref;
20
typedef CatmullClarkPatchT<Vertex,Vertex_t> CatmullClarkPatch;
21
22
PatchEvalSimd (SharedLazyTessellationCache::CacheEntry& entry, size_t commitCounter,
23
const HalfEdge* edge, const char* vertices, size_t stride, const vbool& valid0, const vfloat& u, const vfloat& v,
24
float* P, float* dPdu, float* dPdv, float* ddPdudu, float* ddPdvdv, float* ddPdudv, const size_t dstride, const size_t N)
25
: P(P), dPdu(dPdu), dPdv(dPdv), ddPdudu(ddPdudu), ddPdvdv(ddPdvdv), ddPdudv(ddPdudv), dstride(dstride), N(N)
26
{
27
/* conservative time for the very first allocation */
28
auto time = SharedLazyTessellationCache::sharedLazyTessellationCache.getTime(commitCounter);
29
30
Ref patch = SharedLazyTessellationCache::lookup(entry,commitCounter,[&] () {
31
auto alloc = [](size_t bytes) { return SharedLazyTessellationCache::malloc(bytes); };
32
return Patch::create(alloc,edge,vertices,stride);
33
}, true);
34
35
auto curTime = SharedLazyTessellationCache::sharedLazyTessellationCache.getTime(commitCounter);
36
const bool allAllocationsValid = SharedLazyTessellationCache::validTime(time,curTime);
37
38
patch = allAllocationsValid ? patch : nullptr;
39
40
/* use cached data structure for calculations */
41
const vbool valid1 = patch ? eval(valid0,patch,u,v,1.0f,0) : vbool(false);
42
SharedLazyTessellationCache::unlock();
43
const vbool valid2 = valid0 & !valid1;
44
if (any(valid2)) {
45
FeatureAdaptiveEvalSimd<vbool,vint,vfloat,Vertex,Vertex_t>(edge,vertices,stride,valid2,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dstride,N);
46
}
47
}
48
49
vbool eval_quad(const vbool& valid, const typename Patch::SubdividedQuadPatch* This, const vfloat& u, const vfloat& v, const float dscale, const size_t depth)
50
{
51
vbool ret = false;
52
const vbool u0_mask = u < 0.5f, u1_mask = u >= 0.5f;
53
const vbool v0_mask = v < 0.5f, v1_mask = v >= 0.5f;
54
const vbool u0v0_mask = valid & u0_mask & v0_mask;
55
const vbool u0v1_mask = valid & u0_mask & v1_mask;
56
const vbool u1v0_mask = valid & u1_mask & v0_mask;
57
const vbool u1v1_mask = valid & u1_mask & v1_mask;
58
if (any(u0v0_mask)) ret |= eval(u0v0_mask,This->child[0],2.0f*u,2.0f*v,2.0f*dscale,depth+1);
59
if (any(u1v0_mask)) ret |= eval(u1v0_mask,This->child[1],2.0f*u-1.0f,2.0f*v,2.0f*dscale,depth+1);
60
if (any(u1v1_mask)) ret |= eval(u1v1_mask,This->child[2],2.0f*u-1.0f,2.0f*v-1.0f,2.0f*dscale,depth+1);
61
if (any(u0v1_mask)) ret |= eval(u0v1_mask,This->child[3],2.0f*u,2.0f*v-1.0f,2.0f*dscale,depth+1);
62
return ret;
63
}
64
65
vbool eval_general(const vbool& valid, const typename Patch::SubdividedGeneralPatch* patch, const vfloat& U, const vfloat& V, const size_t depth)
66
{
67
vbool ret = false;
68
const vint l = (vint)floor(0.5f*U); const vfloat u = 2.0f*frac(0.5f*U)-0.5f;
69
const vint h = (vint)floor(0.5f*V); const vfloat v = 2.0f*frac(0.5f*V)-0.5f;
70
const vint i = (h<<2)+l; assert(all(valid,i<patch->N));
71
foreach_unique(valid,i,[&](const vbool& valid, const int i) {
72
ret |= eval(valid,patch->child[i],u,v,1.0f,depth+1);
73
});
74
return ret;
75
}
76
77
vbool eval(const vbool& valid, Ref This, const vfloat& u, const vfloat& v, const float dscale, const size_t depth)
78
{
79
if (!This) return false;
80
switch (This.type())
81
{
82
case Patch::BILINEAR_PATCH: {
83
((typename Patch::BilinearPatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);
84
return valid;
85
}
86
case Patch::BSPLINE_PATCH: {
87
((typename Patch::BSplinePatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);
88
return valid;
89
}
90
case Patch::BEZIER_PATCH: {
91
((typename Patch::BezierPatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);
92
return valid;
93
}
94
case Patch::GREGORY_PATCH: {
95
((typename Patch::GregoryPatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);
96
return valid;
97
}
98
case Patch::SUBDIVIDED_QUAD_PATCH: {
99
return eval_quad(valid,((typename Patch::SubdividedQuadPatch*)This.object()),u,v,dscale,depth);
100
}
101
case Patch::SUBDIVIDED_GENERAL_PATCH: {
102
assert(dscale == 1.0f);
103
return eval_general(valid,((typename Patch::SubdividedGeneralPatch*)This.object()),u,v,depth);
104
}
105
case Patch::EVAL_PATCH: {
106
CatmullClarkPatch patch; patch.deserialize(This.object());
107
FeatureAdaptiveEvalSimd<vbool,vint,vfloat,Vertex,Vertex_t>(patch,valid,u,v,dscale,depth,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dstride,N);
108
return valid;
109
}
110
default:
111
assert(false);
112
return false;
113
}
114
}
115
116
private:
117
float* const P;
118
float* const dPdu;
119
float* const dPdv;
120
float* const ddPdudu;
121
float* const ddPdvdv;
122
float* const ddPdudv;
123
const size_t dstride;
124
const size_t N;
125
};
126
}
127
}
128
129