Path: blob/master/thirdparty/embree/kernels/subdiv/feature_adaptive_eval_simd.h
9913 views
// Copyright 2009-2021 Intel Corporation1// SPDX-License-Identifier: Apache-2.023#pragma once45#include "patch.h"67namespace embree8{9namespace isa10{11template<typename vbool, typename vint, typename vfloat, typename Vertex, typename Vertex_t = Vertex>12struct FeatureAdaptiveEvalSimd13{14public:1516typedef PatchT<Vertex,Vertex_t> Patch;17typedef typename Patch::Ref Ref;18typedef GeneralCatmullClarkPatchT<Vertex,Vertex_t> GeneralCatmullClarkPatch;19typedef CatmullClark1RingT<Vertex,Vertex_t> CatmullClarkRing;20typedef CatmullClarkPatchT<Vertex,Vertex_t> CatmullClarkPatch;21typedef BSplinePatchT<Vertex,Vertex_t> BSplinePatch;22typedef BezierPatchT<Vertex,Vertex_t> BezierPatch;23typedef GregoryPatchT<Vertex,Vertex_t> GregoryPatch;24typedef BilinearPatchT<Vertex,Vertex_t> BilinearPatch;25typedef BezierCurveT<Vertex> BezierCurve;2627FeatureAdaptiveEvalSimd (const HalfEdge* edge, const char* vertices, size_t stride, const vbool& valid, const vfloat& u, const vfloat& v,28float* P, float* dPdu, float* dPdv, float* ddPdudu, float* ddPdvdv, float* ddPdudv, const size_t dstride, const size_t N)29: P(P), dPdu(dPdu), dPdv(dPdv), ddPdudu(ddPdudu), ddPdvdv(ddPdvdv), ddPdudv(ddPdudv), dstride(dstride), N(N)30{31switch (edge->patch_type) {32case HalfEdge::BILINEAR_PATCH: BilinearPatch(edge,vertices,stride).eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,1.0f,dstride,N); break;33case HalfEdge::REGULAR_QUAD_PATCH: RegularPatchT(edge,vertices,stride).eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,1.0f,dstride,N); break;34#if PATCH_USE_GREGORY == 235case HalfEdge::IRREGULAR_QUAD_PATCH: GregoryPatchT<Vertex,Vertex_t>(edge,vertices,stride).eval(valid,u,v,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,1.0f,dstride,N); break;36#endif37default: {38GeneralCatmullClarkPatch patch(edge,vertices,stride);39eval_direct(valid,patch,Vec2<vfloat>(u,v),0);40break;41}42}43}4445FeatureAdaptiveEvalSimd (const CatmullClarkPatch& patch, const vbool& valid, const vfloat& u, const vfloat& v, float dscale, size_t depth,46float* P, float* dPdu, float* dPdv, float* ddPdudu, float* ddPdvdv, float* ddPdudv, const size_t dstride, const size_t N)47: P(P), dPdu(dPdu), dPdv(dPdv), ddPdudu(ddPdudu), ddPdvdv(ddPdvdv), ddPdudv(ddPdudv), dstride(dstride), N(N)48{49eval_direct(valid,patch,Vec2<vfloat>(u,v),dscale,depth);50}5152template<size_t N>53__forceinline void eval_quad_direct(const vbool& valid, array_t<CatmullClarkPatch,N>& patches, const Vec2<vfloat>& uv, float dscale, size_t depth)54{55const vfloat u = uv.x, v = uv.y;56const vbool u0_mask = u < 0.5f, u1_mask = u >= 0.5f;57const vbool v0_mask = v < 0.5f, v1_mask = v >= 0.5f;58const vbool u0v0_mask = valid & u0_mask & v0_mask;59const vbool u0v1_mask = valid & u0_mask & v1_mask;60const vbool u1v0_mask = valid & u1_mask & v0_mask;61const vbool u1v1_mask = valid & u1_mask & v1_mask;62if (any(u0v0_mask)) eval_direct(u0v0_mask,patches[0],Vec2<vfloat>(2.0f*u,2.0f*v),2.0f*dscale,depth+1);63if (any(u1v0_mask)) eval_direct(u1v0_mask,patches[1],Vec2<vfloat>(2.0f*u-1.0f,2.0f*v),2.0f*dscale,depth+1);64if (any(u1v1_mask)) eval_direct(u1v1_mask,patches[2],Vec2<vfloat>(2.0f*u-1.0f,2.0f*v-1.0f),2.0f*dscale,depth+1);65if (any(u0v1_mask)) eval_direct(u0v1_mask,patches[3],Vec2<vfloat>(2.0f*u,2.0f*v-1.0f),2.0f*dscale,depth+1);66}6768template<size_t N>69__forceinline void eval_general_quad_direct(const vbool& valid, const GeneralCatmullClarkPatch& patch, array_t<CatmullClarkPatch,N>& patches, const Vec2<vfloat>& uv, float dscale, size_t depth)70{71#if PATCH_USE_GREGORY == 272BezierCurve borders[GeneralCatmullClarkPatch::SIZE]; patch.getLimitBorder(borders);73BezierCurve border0l,border0r; borders[0].subdivide(border0l,border0r);74BezierCurve border1l,border1r; borders[1].subdivide(border1l,border1r);75BezierCurve border2l,border2r; borders[2].subdivide(border2l,border2r);76BezierCurve border3l,border3r; borders[3].subdivide(border3l,border3r);77#endif78GeneralCatmullClarkPatch::fix_quad_ring_order(patches);79const vfloat u = uv.x, v = uv.y;80const vbool u0_mask = u < 0.5f, u1_mask = u >= 0.5f;81const vbool v0_mask = v < 0.5f, v1_mask = v >= 0.5f;82const vbool u0v0_mask = valid & u0_mask & v0_mask;83const vbool u0v1_mask = valid & u0_mask & v1_mask;84const vbool u1v0_mask = valid & u1_mask & v0_mask;85const vbool u1v1_mask = valid & u1_mask & v1_mask;86#if PATCH_USE_GREGORY == 287if (any(u0v0_mask)) eval_direct(u0v0_mask,patches[0],Vec2<vfloat>(2.0f*u,2.0f*v),2.0f*dscale,depth+1,&border0l,nullptr,nullptr,&border3r);88if (any(u1v0_mask)) eval_direct(u1v0_mask,patches[1],Vec2<vfloat>(2.0f*u-1.0f,2.0f*v),2.0f*dscale,depth+1,&border0r,&border1l,nullptr,nullptr);89if (any(u1v1_mask)) eval_direct(u1v1_mask,patches[2],Vec2<vfloat>(2.0f*u-1.0f,2.0f*v-1.0f),2.0f*dscale,depth+1,nullptr,&border1r,&border2l,nullptr);90if (any(u0v1_mask)) eval_direct(u0v1_mask,patches[3],Vec2<vfloat>(2.0f*u,2.0f*v-1.0f),2.0f*dscale,depth+1,nullptr,nullptr,&border2r,&border3l);91#else92if (any(u0v0_mask)) eval_direct(u0v0_mask,patches[0],Vec2<vfloat>(2.0f*u,2.0f*v),2.0f*dscale,depth+1);93if (any(u1v0_mask)) eval_direct(u1v0_mask,patches[1],Vec2<vfloat>(2.0f*u-1.0f,2.0f*v),2.0f*dscale,depth+1);94if (any(u1v1_mask)) eval_direct(u1v1_mask,patches[2],Vec2<vfloat>(2.0f*u-1.0f,2.0f*v-1.0f),2.0f*dscale,depth+1);95if (any(u0v1_mask)) eval_direct(u0v1_mask,patches[3],Vec2<vfloat>(2.0f*u,2.0f*v-1.0f),2.0f*dscale,depth+1);96#endif97}9899__forceinline bool final(const CatmullClarkPatch& patch, const typename CatmullClarkRing::Type type, size_t depth)100{101const size_t max_eval_depth = (type & CatmullClarkRing::TYPE_CREASES) ? PATCH_MAX_EVAL_DEPTH_CREASE : PATCH_MAX_EVAL_DEPTH_IRREGULAR;102//#if PATCH_MIN_RESOLUTION103// return patch.isFinalResolution(PATCH_MIN_RESOLUTION) || depth>=max_eval_depth;104//#else105return depth>=max_eval_depth;106//#endif107}108109void eval_direct(const vbool& valid, const CatmullClarkPatch& patch, const Vec2<vfloat>& uv, float dscale, size_t depth,110BezierCurve* border0 = nullptr, BezierCurve* border1 = nullptr, BezierCurve* border2 = nullptr, BezierCurve* border3 = nullptr)111{112typename CatmullClarkPatch::Type ty = patch.type();113114if (unlikely(final(patch,ty,depth)))115{116if (ty & CatmullClarkRing::TYPE_REGULAR) {117RegularPatch(patch,border0,border1,border2,border3).eval(valid,uv.x,uv.y,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);118} else {119IrregularFillPatch(patch,border0,border1,border2,border3).eval(valid,uv.x,uv.y,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);120}121}122else if (ty & CatmullClarkRing::TYPE_REGULAR_CREASES) {123assert(depth > 0); RegularPatch(patch,border0,border1,border2,border3).eval(valid,uv.x,uv.y,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);124}125#if PATCH_USE_GREGORY == 2126else if (ty & CatmullClarkRing::TYPE_GREGORY_CREASES) {127assert(depth > 0); GregoryPatch(patch,border0,border1,border2,border3).eval(valid,uv.x,uv.y,P,dPdu,dPdv,ddPdudu,ddPdvdv,ddPdudv,dscale,dstride,N);128}129#endif130else131{132array_t<CatmullClarkPatch,4> patches;133patch.subdivide(patches); // FIXME: only have to generate one of the patches134eval_quad_direct(valid,patches,uv,dscale,depth);135}136}137138void eval_direct(const vbool& valid, const GeneralCatmullClarkPatch& patch, const Vec2<vfloat>& uv, const size_t depth)139{140/* convert into standard quad patch if possible */141if (likely(patch.isQuadPatch())) {142CatmullClarkPatch qpatch; patch.init(qpatch);143return eval_direct(valid,qpatch,uv,1.0f,depth);144}145146/* subdivide patch */147unsigned Nc;148array_t<CatmullClarkPatch,GeneralCatmullClarkPatch::SIZE> patches;149patch.subdivide(patches,Nc); // FIXME: only have to generate one of the patches150151/* parametrization for quads */152if (Nc == 4)153eval_general_quad_direct(valid,patch,patches,uv,1.0f,depth);154155/* parametrization for arbitrary polygons */156else157{158const vint l = (vint)floor(0.5f*uv.x); const vfloat u = 2.0f*frac(0.5f*uv.x)-0.5f;159const vint h = (vint)floor(0.5f*uv.y); const vfloat v = 2.0f*frac(0.5f*uv.y)-0.5f;160const vint i = (h<<2)+l; assert(all(valid,i<Nc));161foreach_unique(valid,i,[&](const vbool& valid, const int i) {162#if PATCH_USE_GREGORY == 2163BezierCurve borders[2]; patch.getLimitBorder(borders,i);164BezierCurve border0l,border0r; borders[0].subdivide(border0l,border0r);165BezierCurve border2l,border2r; borders[1].subdivide(border2l,border2r);166eval_direct(valid,patches[i],Vec2<vfloat>(u,v),1.0f,depth+1, &border0l, nullptr, nullptr, &border2r);167#else168eval_direct(valid,patches[i],Vec2<vfloat>(u,v),1.0f,depth+1);169#endif170});171}172}173174private:175float* const P;176float* const dPdu;177float* const dPdv;178float* const ddPdudu;179float* const ddPdvdv;180float* const ddPdudv;181const size_t dstride;182const size_t N;183};184}185}186187188