Path: blob/master/thirdparty/embree/kernels/subdiv/patch_eval_simd.h
9913 views
// Copyright 2009-2021 Intel Corporation1// SPDX-License-Identifier: Apache-2.023#pragma once45#include "patch.h"6#include "feature_adaptive_eval_simd.h"78namespace embree9{10namespace isa11{12template<typename vbool, typename vint, typename vfloat, typename Vertex, typename Vertex_t = Vertex>13struct PatchEvalSimd14{15public:1617typedef PatchT<Vertex,Vertex_t> Patch;18typedef typename Patch::Ref Ref;19typedef CatmullClarkPatchT<Vertex,Vertex_t> CatmullClarkPatch;2021PatchEvalSimd (SharedLazyTessellationCache::CacheEntry& entry, size_t commitCounter,22const HalfEdge* edge, const char* vertices, size_t stride, const vbool& valid0, const vfloat& u, const vfloat& v,23float* P, float* dPdu, float* dPdv, float* ddPdudu, float* ddPdvdv, float* ddPdudv, const size_t dstride, const size_t N)24: P(P), dPdu(dPdu), dPdv(dPdv), ddPdudu(ddPdudu), ddPdvdv(ddPdvdv), ddPdudv(ddPdudv), dstride(dstride), N(N)25{26/* conservative time for the very first allocation */27auto time = SharedLazyTessellationCache::sharedLazyTessellationCache.getTime(commitCounter);2829Ref patch = SharedLazyTessellationCache::lookup(entry,commitCounter,[&] () {30auto alloc = [](size_t bytes) { return SharedLazyTessellationCache::malloc(bytes); };31return Patch::create(alloc,edge,vertices,stride);32}, true);3334auto curTime = SharedLazyTessellationCache::sharedLazyTessellationCache.getTime(commitCounter);35const bool allAllocationsValid = SharedLazyTessellationCache::validTime(time,curTime);3637patch = allAllocationsValid ? patch : nullptr;3839/* use cached data structure for calculations */40const vbool valid1 = patch ? eval(valid0,patch,u,v,1.0f,0) : vbool(false);41SharedLazyTessellationCache::unlock();42const vbool valid2 = valid0 & !valid1;43if (any(valid2)) {44FeatureAdaptiveEvalSimd<vbool,vint,vfloat,Vertex,Vertex_t>(edge,vertices,stride,valid2,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dstride,N);45}46}4748vbool eval_quad(const vbool& valid, const typename Patch::SubdividedQuadPatch* This, const vfloat& u, const vfloat& v, const float dscale, const size_t depth)49{50vbool ret = false;51const vbool u0_mask = u < 0.5f, u1_mask = u >= 0.5f;52const vbool v0_mask = v < 0.5f, v1_mask = v >= 0.5f;53const vbool u0v0_mask = valid & u0_mask & v0_mask;54const vbool u0v1_mask = valid & u0_mask & v1_mask;55const vbool u1v0_mask = valid & u1_mask & v0_mask;56const vbool u1v1_mask = valid & u1_mask & v1_mask;57if (any(u0v0_mask)) ret |= eval(u0v0_mask,This->child[0],2.0f*u,2.0f*v,2.0f*dscale,depth+1);58if (any(u1v0_mask)) ret |= eval(u1v0_mask,This->child[1],2.0f*u-1.0f,2.0f*v,2.0f*dscale,depth+1);59if (any(u1v1_mask)) ret |= eval(u1v1_mask,This->child[2],2.0f*u-1.0f,2.0f*v-1.0f,2.0f*dscale,depth+1);60if (any(u0v1_mask)) ret |= eval(u0v1_mask,This->child[3],2.0f*u,2.0f*v-1.0f,2.0f*dscale,depth+1);61return ret;62}6364vbool eval_general(const vbool& valid, const typename Patch::SubdividedGeneralPatch* patch, const vfloat& U, const vfloat& V, const size_t depth)65{66vbool ret = false;67const vint l = (vint)floor(0.5f*U); const vfloat u = 2.0f*frac(0.5f*U)-0.5f;68const vint h = (vint)floor(0.5f*V); const vfloat v = 2.0f*frac(0.5f*V)-0.5f;69const vint i = (h<<2)+l; assert(all(valid,i<patch->N));70foreach_unique(valid,i,[&](const vbool& valid, const int i) {71ret |= eval(valid,patch->child[i],u,v,1.0f,depth+1);72});73return ret;74}7576vbool eval(const vbool& valid, Ref This, const vfloat& u, const vfloat& v, const float dscale, const size_t depth)77{78if (!This) return false;79switch (This.type())80{81case Patch::BILINEAR_PATCH: {82((typename Patch::BilinearPatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);83return valid;84}85case Patch::BSPLINE_PATCH: {86((typename Patch::BSplinePatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);87return valid;88}89case Patch::BEZIER_PATCH: {90((typename Patch::BezierPatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);91return valid;92}93case Patch::GREGORY_PATCH: {94((typename Patch::GregoryPatch*)This.object())->patch.eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);95return valid;96}97case Patch::SUBDIVIDED_QUAD_PATCH: {98return eval_quad(valid,((typename Patch::SubdividedQuadPatch*)This.object()),u,v,dscale,depth);99}100case Patch::SUBDIVIDED_GENERAL_PATCH: {101assert(dscale == 1.0f);102return eval_general(valid,((typename Patch::SubdividedGeneralPatch*)This.object()),u,v,depth);103}104case Patch::EVAL_PATCH: {105CatmullClarkPatch patch; patch.deserialize(This.object());106FeatureAdaptiveEvalSimd<vbool,vint,vfloat,Vertex,Vertex_t>(patch,valid,u,v,dscale,depth,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dstride,N);107return valid;108}109default:110assert(false);111return false;112}113}114115private:116float* const P;117float* const dPdu;118float* const dPdv;119float* const ddPdudu;120float* const ddPdvdv;121float* const ddPdudv;122const size_t dstride;123const size_t N;124};125}126}127128129